On Mon, Feb 13, 2017 at 6:00 PM, Deucher, Alexander <Alexander.Deucher at amd.com> wrote: >> -----Original Message----- >> From: amd-gfx [mailto:amd-gfx-bounces at lists.freedesktop.org] On Behalf >> Of Marek Olšák >> Sent: Monday, February 13, 2017 11:58 AM >> To: amd-gfx at lists.freedesktop.org >> Subject: [PATCH] drm/radeon: allow unaligned shader loads on CIK >> >> From: Marek Olšák <marek.olsak at amd.com> >> >> Signed-off-by: Marek Olšák <marek.olsak at amd.com> > > Add a better patch description. With that fixed: > Reviewed-by: Alex Deucher <alexander.deucher at amd.com> What's a better patch description? "drm/radeon: set SH_MEM_CONFIG.ALIGNMENT_MODE = UNALIGNED on CIK"? Marek > > >> --- >> drivers/gpu/drm/radeon/cik.c | 7 +++++-- >> drivers/gpu/drm/radeon/radeon_drv.c | 3 ++- >> 2 files changed, 7 insertions(+), 3 deletions(-) >> >> diff --git a/drivers/gpu/drm/radeon/cik.c b/drivers/gpu/drm/radeon/cik.c >> index f6ff41a..ac0d939 100644 >> --- a/drivers/gpu/drm/radeon/cik.c >> +++ b/drivers/gpu/drm/radeon/cik.c >> @@ -28,20 +28,23 @@ >> #include "radeon.h" >> #include "radeon_asic.h" >> #include "radeon_audio.h" >> #include "cikd.h" >> #include "atom.h" >> #include "cik_blit_shaders.h" >> #include "radeon_ucode.h" >> #include "clearstate_ci.h" >> #include "radeon_kfd.h" >> >> +#define SH_MEM_CONFIG_GFX_DEFAULT \ >> + ALIGNMENT_MODE(SH_MEM_ALIGNMENT_MODE_UNALIGNED) >> + >> MODULE_FIRMWARE("radeon/BONAIRE_pfp.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_me.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_ce.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_mec.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_mc.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_mc2.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_rlc.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_sdma.bin"); >> MODULE_FIRMWARE("radeon/BONAIRE_smc.bin"); >> >> @@ -5580,21 +5583,21 @@ static int cik_pcie_gart_enable(struct >> radeon_device *rdev) >> tmp &= ~BYPASS_VM; >> WREG32(CHUB_CONTROL, tmp); >> } >> >> /* XXX SH_MEM regs */ >> /* where to put LDS, scratch, GPUVM in FSA64 space */ >> mutex_lock(&rdev->srbm_mutex); >> for (i = 0; i < 16; i++) { >> cik_srbm_select(rdev, 0, 0, 0, i); >> /* CP and shaders */ >> - WREG32(SH_MEM_CONFIG, 0); >> + WREG32(SH_MEM_CONFIG, >> SH_MEM_CONFIG_GFX_DEFAULT); >> WREG32(SH_MEM_APE1_BASE, 1); >> WREG32(SH_MEM_APE1_LIMIT, 0); >> WREG32(SH_MEM_BASES, 0); >> /* SDMA GFX */ >> WREG32(SDMA0_GFX_VIRTUAL_ADDR + >> SDMA0_REGISTER_OFFSET, 0); >> WREG32(SDMA0_GFX_APE1_CNTL + >> SDMA0_REGISTER_OFFSET, 0); >> WREG32(SDMA0_GFX_VIRTUAL_ADDR + >> SDMA1_REGISTER_OFFSET, 0); >> WREG32(SDMA0_GFX_APE1_CNTL + >> SDMA1_REGISTER_OFFSET, 0); >> /* XXX SDMA RLC - todo */ >> } >> @@ -5787,21 +5790,21 @@ void cik_vm_flush(struct radeon_device *rdev, >> struct radeon_ring *ring, >> radeon_ring_write(ring, 0); >> radeon_ring_write(ring, VMID(vm_id)); >> >> radeon_ring_write(ring, PACKET3(PACKET3_WRITE_DATA, 6)); >> radeon_ring_write(ring, (WRITE_DATA_ENGINE_SEL(usepfp) | >> WRITE_DATA_DST_SEL(0))); >> radeon_ring_write(ring, SH_MEM_BASES >> 2); >> radeon_ring_write(ring, 0); >> >> radeon_ring_write(ring, 0); /* SH_MEM_BASES */ >> - radeon_ring_write(ring, 0); /* SH_MEM_CONFIG */ >> + radeon_ring_write(ring, SH_MEM_CONFIG_GFX_DEFAULT); /* >> SH_MEM_CONFIG */ >> radeon_ring_write(ring, 1); /* SH_MEM_APE1_BASE */ >> radeon_ring_write(ring, 0); /* SH_MEM_APE1_LIMIT */ >> >> radeon_ring_write(ring, PACKET3(PACKET3_WRITE_DATA, 3)); >> radeon_ring_write(ring, (WRITE_DATA_ENGINE_SEL(usepfp) | >> WRITE_DATA_DST_SEL(0))); >> radeon_ring_write(ring, SRBM_GFX_CNTL >> 2); >> radeon_ring_write(ring, 0); >> radeon_ring_write(ring, VMID(0)); >> >> diff --git a/drivers/gpu/drm/radeon/radeon_drv.c >> b/drivers/gpu/drm/radeon/radeon_drv.c >> index 30bd4a6..2e5d680 100644 >> --- a/drivers/gpu/drm/radeon/radeon_drv.c >> +++ b/drivers/gpu/drm/radeon/radeon_drv.c >> @@ -91,23 +91,24 @@ >> * CS to GPU on >= r600 >> * 2.41.0 - evergreen/cayman: Add SET_BASE/DRAW_INDIRECT command >> parsing support >> * 2.42.0 - Add VCE/VUI (Video Usability Information) support >> * 2.43.0 - RADEON_INFO_GPU_RESET_COUNTER >> * 2.44.0 - SET_APPEND_CNT packet3 support >> * 2.45.0 - Allow setting shader registers using DMA/COPY packet3 on SI >> * 2.46.0 - Add PFP_SYNC_ME support on evergreen >> * 2.47.0 - Add UVD_NO_OP register support >> * 2.48.0 - TA_CS_BC_BASE_ADDR allowed on SI >> * 2.49.0 - DRM_RADEON_GEM_INFO ioctl returns correct vram_size/visible >> values >> + * 2.50.0 - Allows unaligned shader loads on CIK. (needed by OpenGL) >> */ >> #define KMS_DRIVER_MAJOR 2 >> -#define KMS_DRIVER_MINOR 49 >> +#define KMS_DRIVER_MINOR 50 >> #define KMS_DRIVER_PATCHLEVEL 0 >> int radeon_driver_load_kms(struct drm_device *dev, unsigned long flags); >> int radeon_driver_unload_kms(struct drm_device *dev); >> void radeon_driver_lastclose_kms(struct drm_device *dev); >> int radeon_driver_open_kms(struct drm_device *dev, struct drm_file >> *file_priv); >> void radeon_driver_postclose_kms(struct drm_device *dev, >> struct drm_file *file_priv); >> void radeon_driver_preclose_kms(struct drm_device *dev, >> struct drm_file *file_priv); >> int radeon_suspend_kms(struct drm_device *dev, bool suspend, >> -- >> 2.7.4 >> >> _______________________________________________ >> amd-gfx mailing list >> amd-gfx at lists.freedesktop.org >> https://lists.freedesktop.org/mailman/listinfo/amd-gfx