diff options
Diffstat (limited to 'meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/1822-drm-amdgpu-Remap-hdp-coherency-registers.patch')
-rw-r--r-- | meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/1822-drm-amdgpu-Remap-hdp-coherency-registers.patch | 197 |
1 files changed, 197 insertions, 0 deletions
diff --git a/meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/1822-drm-amdgpu-Remap-hdp-coherency-registers.patch b/meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/1822-drm-amdgpu-Remap-hdp-coherency-registers.patch new file mode 100644 index 00000000..99db195b --- /dev/null +++ b/meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/1822-drm-amdgpu-Remap-hdp-coherency-registers.patch @@ -0,0 +1,197 @@ +From 93811cb3c190dee86fe629bc9bed2d586a86813f Mon Sep 17 00:00:00 2001 +From: Oak Zeng <Oak.Zeng@amd.com> +Date: Thu, 4 Apr 2019 15:47:34 -0500 +Subject: [PATCH 1822/2940] drm/amdgpu: Remap hdp coherency registers + +Remap HDP_MEM_COHERENCY_FLUSH_CNTL and HDP_REG_COHERENCY_FLUSH_CNTL +to an empty page in mmio space. We will later map this page to process +space so application can flush hdp. This can't be done properly at +those registers' original location because it will expose more than +desired registers to process space. + +v2: Use explicit register hole location +v3: Moved remapped hdp registers into adev struct +v4: Use more generic name for remapped page + Expose register offset in kfd_ioctl.h +v5: Move hdp register remap function to nbio ip function +v6: Fixed operator precedence issue and other bugs + +Change-Id: Ia8d27c0c9a082711d16bbf55602bf5712a47b6d6 +Signed-off-by: Oak Zeng <Oak.Zeng@amd.com> +Reviewed-by: Felix Kuehling <Felix.Kuehling@amd.com> +Signed-off-by: Chaudhary Amit Kumar <Chaudharyamit.Kumar@amd.com> +--- + drivers/gpu/drm/amd/amdgpu/amdgpu.h | 7 +++++++ + drivers/gpu/drm/amd/amdgpu/nbio_v7_0.c | 15 ++++++++++++--- + drivers/gpu/drm/amd/amdgpu/nbio_v7_4.c | 15 ++++++++++++--- + drivers/gpu/drm/amd/amdgpu/soc15.c | 11 +++++++++++ + 4 files changed, 42 insertions(+), 6 deletions(-) + +diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu.h b/drivers/gpu/drm/amd/amdgpu/amdgpu.h +index dcc54022579f..b458019e4cea 100644 +--- a/drivers/gpu/drm/amd/amdgpu/amdgpu.h ++++ b/drivers/gpu/drm/amd/amdgpu/amdgpu.h +@@ -655,6 +655,11 @@ struct nbio_hdp_flush_reg { + u32 ref_and_mask_sdma1; + }; + ++struct amdgpu_mmio_remap { ++ u32 reg_offset; ++ resource_size_t bus_addr; ++}; ++ + struct amdgpu_nbio_funcs { + const struct nbio_hdp_flush_reg *hdp_flush_reg; + u32 (*get_hdp_flush_req_offset)(struct amdgpu_device *adev); +@@ -682,6 +687,7 @@ struct amdgpu_nbio_funcs { + void (*ih_control)(struct amdgpu_device *adev); + void (*init_registers)(struct amdgpu_device *adev); + void (*detect_hw_virt)(struct amdgpu_device *adev); ++ void (*remap_hdp_registers)(struct amdgpu_device *adev); + }; + + struct amdgpu_df_funcs { +@@ -804,6 +810,7 @@ struct amdgpu_device { + void __iomem *rmmio; + /* protects concurrent MM_INDEX/DATA based register access */ + spinlock_t mmio_idx_lock; ++ struct amdgpu_mmio_remap rmmio_remap; + /* protects concurrent SMC based register access */ + spinlock_t smc_idx_lock; + amdgpu_rreg_t smc_rreg; +diff --git a/drivers/gpu/drm/amd/amdgpu/nbio_v7_0.c b/drivers/gpu/drm/amd/amdgpu/nbio_v7_0.c +index 150ca8e4fd7c..f73fb25ba242 100644 +--- a/drivers/gpu/drm/amd/amdgpu/nbio_v7_0.c ++++ b/drivers/gpu/drm/amd/amdgpu/nbio_v7_0.c +@@ -29,6 +29,7 @@ + #include "nbio/nbio_7_0_sh_mask.h" + #include "nbio/nbio_7_0_smn.h" + #include "vega10_enum.h" ++#include <uapi/linux/kfd_ioctl.h> + + #define smnNBIF_MGCG_CTRL_LCLK 0x1013a05c + +@@ -36,6 +37,14 @@ + #define mmRCC_DEV0_EPF0_STRAP0_VG20 0x0011 + #define mmRCC_DEV0_EPF0_STRAP0_VG20_BASE_IDX 2 + ++static void nbio_v7_0_remap_hdp_registers(struct amdgpu_device *adev) ++{ ++ WREG32_SOC15(NBIO, 0, mmREMAP_HDP_MEM_FLUSH_CNTL, ++ adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL); ++ WREG32_SOC15(NBIO, 0, mmREMAP_HDP_REG_FLUSH_CNTL, ++ adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_REG_FLUSH_CNTL); ++} ++ + static u32 nbio_v7_0_get_rev_id(struct amdgpu_device *adev) + { + u32 tmp = RREG32_SOC15(NBIO, 0, mmRCC_DEV0_EPF0_STRAP0); +@@ -64,10 +73,9 @@ static void nbio_v7_0_hdp_flush(struct amdgpu_device *adev, + struct amdgpu_ring *ring) + { + if (!ring || !ring->funcs->emit_wreg) +- WREG32_SOC15_NO_KIQ(NBIO, 0, mmHDP_MEM_COHERENCY_FLUSH_CNTL, 0); ++ WREG32_NO_KIQ((adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0); + else +- amdgpu_ring_emit_wreg(ring, SOC15_REG_OFFSET( +- NBIO, 0, mmHDP_MEM_COHERENCY_FLUSH_CNTL), 0); ++ amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0); + } + + static u32 nbio_v7_0_get_memsize(struct amdgpu_device *adev) +@@ -299,4 +307,5 @@ const struct amdgpu_nbio_funcs nbio_v7_0_funcs = { + .ih_control = nbio_v7_0_ih_control, + .init_registers = nbio_v7_0_init_registers, + .detect_hw_virt = nbio_v7_0_detect_hw_virt, ++ .remap_hdp_registers = nbio_v7_0_remap_hdp_registers, + }; +diff --git a/drivers/gpu/drm/amd/amdgpu/nbio_v7_4.c b/drivers/gpu/drm/amd/amdgpu/nbio_v7_4.c +index c69d51598cfe..bfaaa327ae3c 100644 +--- a/drivers/gpu/drm/amd/amdgpu/nbio_v7_4.c ++++ b/drivers/gpu/drm/amd/amdgpu/nbio_v7_4.c +@@ -27,9 +27,18 @@ + #include "nbio/nbio_7_4_offset.h" + #include "nbio/nbio_7_4_sh_mask.h" + #include "nbio/nbio_7_4_0_smn.h" ++#include <uapi/linux/kfd_ioctl.h> + + #define smnNBIF_MGCG_CTRL_LCLK 0x1013a21c + ++static void nbio_v7_4_remap_hdp_registers(struct amdgpu_device *adev) ++{ ++ WREG32_SOC15(NBIO, 0, mmREMAP_HDP_MEM_FLUSH_CNTL, ++ adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL); ++ WREG32_SOC15(NBIO, 0, mmREMAP_HDP_REG_FLUSH_CNTL, ++ adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_REG_FLUSH_CNTL); ++} ++ + static u32 nbio_v7_4_get_rev_id(struct amdgpu_device *adev) + { + u32 tmp = RREG32_SOC15(NBIO, 0, mmRCC_DEV0_EPF0_STRAP0); +@@ -53,10 +62,9 @@ static void nbio_v7_4_hdp_flush(struct amdgpu_device *adev, + struct amdgpu_ring *ring) + { + if (!ring || !ring->funcs->emit_wreg) +- WREG32_SOC15_NO_KIQ(NBIO, 0, mmHDP_MEM_COHERENCY_FLUSH_CNTL, 0); ++ WREG32_NO_KIQ((adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0); + else +- amdgpu_ring_emit_wreg(ring, SOC15_REG_OFFSET( +- NBIO, 0, mmHDP_MEM_COHERENCY_FLUSH_CNTL), 0); ++ amdgpu_ring_emit_wreg(ring, (adev->rmmio_remap.reg_offset + KFD_MMIO_REMAP_HDP_MEM_FLUSH_CNTL) >> 2, 0); + } + + static u32 nbio_v7_4_get_memsize(struct amdgpu_device *adev) +@@ -262,4 +270,5 @@ const struct amdgpu_nbio_funcs nbio_v7_4_funcs = { + .ih_control = nbio_v7_4_ih_control, + .init_registers = nbio_v7_4_init_registers, + .detect_hw_virt = nbio_v7_4_detect_hw_virt, ++ .remap_hdp_registers = nbio_v7_4_remap_hdp_registers, + }; +diff --git a/drivers/gpu/drm/amd/amdgpu/soc15.c b/drivers/gpu/drm/amd/amdgpu/soc15.c +index 1788fb938aed..278ccd65a8d2 100644 +--- a/drivers/gpu/drm/amd/amdgpu/soc15.c ++++ b/drivers/gpu/drm/amd/amdgpu/soc15.c +@@ -44,6 +44,7 @@ + #include "smuio/smuio_9_0_offset.h" + #include "smuio/smuio_9_0_sh_mask.h" + #include "nbio/nbio_7_0_default.h" ++#include "nbio/nbio_7_0_offset.h" + #include "nbio/nbio_7_0_sh_mask.h" + #include "nbio/nbio_7_0_smn.h" + #include "mp/mp_9_0_offset.h" +@@ -64,6 +65,7 @@ + #include "dce_virtual.h" + #include "mxgpu_ai.h" + #include "amdgpu_smu.h" ++#include <uapi/linux/kfd_ioctl.h> + + #define mmMP0_MISC_CGTT_CTRL0 0x01b9 + #define mmMP0_MISC_CGTT_CTRL0_BASE_IDX 0 +@@ -783,8 +785,11 @@ static const struct amdgpu_asic_funcs vega20_asic_funcs = + + static int soc15_common_early_init(void *handle) + { ++#define MMIO_REG_HOLE_OFFSET (0x80000 - PAGE_SIZE) + struct amdgpu_device *adev = (struct amdgpu_device *)handle; + ++ adev->rmmio_remap.reg_offset = MMIO_REG_HOLE_OFFSET; ++ adev->rmmio_remap.bus_addr = adev->rmmio_base + MMIO_REG_HOLE_OFFSET; + adev->smc_rreg = NULL; + adev->smc_wreg = NULL; + adev->pcie_rreg = &soc15_pcie_rreg; +@@ -1013,6 +1018,12 @@ static int soc15_common_hw_init(void *handle) + soc15_program_aspm(adev); + /* setup nbio registers */ + adev->nbio_funcs->init_registers(adev); ++ /* remap HDP registers to a hole in mmio space, ++ * for the purpose of expose those registers ++ * to process space ++ */ ++ if (adev->nbio_funcs->remap_hdp_registers) ++ adev->nbio_funcs->remap_hdp_registers(adev); + /* enable the doorbell aperture */ + soc15_enable_doorbell_aperture(adev, true); + /* HW doorbell routing policy: doorbell writing not +-- +2.17.1 + |