aboutsummaryrefslogtreecommitdiffstats
path: root/meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/3358-drm-amdgpu-create-mmhub-ras-framework.patch
diff options
context:
space:
mode:
Diffstat (limited to 'meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/3358-drm-amdgpu-create-mmhub-ras-framework.patch')
-rw-r--r--meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/3358-drm-amdgpu-create-mmhub-ras-framework.patch230
1 files changed, 230 insertions, 0 deletions
diff --git a/meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/3358-drm-amdgpu-create-mmhub-ras-framework.patch b/meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/3358-drm-amdgpu-create-mmhub-ras-framework.patch
new file mode 100644
index 00000000..659018c6
--- /dev/null
+++ b/meta-amd-bsp/recipes-kernel/linux/linux-yocto-4.19.8/3358-drm-amdgpu-create-mmhub-ras-framework.patch
@@ -0,0 +1,230 @@
+From 61356ce21d437598963b0261c740a0495b3e677e Mon Sep 17 00:00:00 2001
+From: Tao Zhou <tao.zhou1@amd.com>
+Date: Wed, 7 Aug 2019 12:21:22 +0800
+Subject: [PATCH 3358/4256] drm/amdgpu: create mmhub ras framework
+
+enable mmhub ras feature and create sysfs/debugfs node for mmhub
+
+Signed-off-by: Tao Zhou <tao.zhou1@amd.com>
+Reviewed-by: Hawking Zhang <Hawking.Zhang@amd.com>
+---
+ drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h | 3 +-
+ drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c | 112 +++++++++++++++++-------
+ 2 files changed, 82 insertions(+), 33 deletions(-)
+
+diff --git a/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h b/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h
+index e43036cefb64..f614ae0302cb 100644
+--- a/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h
++++ b/drivers/gpu/drm/amd/amdgpu/amdgpu_gmc.h
+@@ -177,7 +177,8 @@ struct amdgpu_gmc {
+
+ struct amdgpu_xgmi xgmi;
+ struct amdgpu_irq_src ecc_irq;
+- struct ras_common_if *ras_if;
++ struct ras_common_if *umc_ras_if;
++ struct ras_common_if *mmhub_ras_if;
+ };
+
+ #define amdgpu_gmc_flush_gpu_tlb(adev, vmid, type) (adev)->gmc.gmc_funcs->flush_gpu_tlb((adev), (vmid), (type))
+diff --git a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
+index ca9c06b8e02c..37c0d085d5c9 100644
+--- a/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
++++ b/drivers/gpu/drm/amd/amdgpu/gmc_v9_0.c
+@@ -263,7 +263,7 @@ static int gmc_v9_0_process_ecc_irq(struct amdgpu_device *adev,
+ struct amdgpu_irq_src *source,
+ struct amdgpu_iv_entry *entry)
+ {
+- struct ras_common_if *ras_if = adev->gmc.ras_if;
++ struct ras_common_if *ras_if = adev->gmc.umc_ras_if;
+ struct ras_dispatch_if ih_data = {
+ .entry = entry,
+ };
+@@ -734,27 +734,25 @@ static int gmc_v9_0_allocate_vm_inv_eng(struct amdgpu_device *adev)
+ return 0;
+ }
+
+-static int gmc_v9_0_ecc_late_init(void *handle)
++static int gmc_v9_0_ecc_ras_block_late_init(void *handle,
++ struct ras_fs_if *fs_info, struct ras_common_if *ras_block)
+ {
+ struct amdgpu_device *adev = (struct amdgpu_device *)handle;
+- struct ras_common_if **ras_if = &adev->gmc.ras_if;
++ struct ras_common_if **ras_if = NULL;
+ struct ras_ih_if ih_info = {
+ .cb = gmc_v9_0_process_ras_data_cb,
+ };
+- struct ras_fs_if fs_info = {
+- .sysfs_name = "umc_err_count",
+- .debugfs_name = "umc_err_inject",
+- };
+- struct ras_common_if ras_block = {
+- .block = AMDGPU_RAS_BLOCK__UMC,
+- .type = AMDGPU_RAS_ERROR__MULTI_UNCORRECTABLE,
+- .sub_block_index = 0,
+- .name = "umc",
+- };
+ int r;
+
+- if (!amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__UMC)) {
+- amdgpu_ras_feature_enable_on_boot(adev, &ras_block, 0);
++ if (ras_block->block == AMDGPU_RAS_BLOCK__UMC)
++ ras_if = &adev->gmc.umc_ras_if;
++ else if (ras_block->block == AMDGPU_RAS_BLOCK__MMHUB)
++ ras_if = &adev->gmc.mmhub_ras_if;
++ else
++ BUG();
++
++ if (!amdgpu_ras_is_supported(adev, ras_block->block)) {
++ amdgpu_ras_feature_enable_on_boot(adev, ras_block, 0);
+ return 0;
+ }
+
+@@ -769,7 +767,7 @@ static int gmc_v9_0_ecc_late_init(void *handle)
+ if (r == -EAGAIN) {
+ /* request a gpu reset. will run again. */
+ amdgpu_ras_request_reset_on_boot(adev,
+- AMDGPU_RAS_BLOCK__UMC);
++ ras_block->block);
+ return 0;
+ }
+ /* fail to enable ras, cleanup all. */
+@@ -783,41 +781,46 @@ static int gmc_v9_0_ecc_late_init(void *handle)
+ if (!*ras_if)
+ return -ENOMEM;
+
+- **ras_if = ras_block;
++ **ras_if = *ras_block;
+
+ r = amdgpu_ras_feature_enable_on_boot(adev, *ras_if, 1);
+ if (r) {
+ if (r == -EAGAIN) {
+ amdgpu_ras_request_reset_on_boot(adev,
+- AMDGPU_RAS_BLOCK__UMC);
++ ras_block->block);
+ r = 0;
+ }
+ goto feature;
+ }
+
+ ih_info.head = **ras_if;
+- fs_info.head = **ras_if;
++ fs_info->head = **ras_if;
+
+- r = amdgpu_ras_interrupt_add_handler(adev, &ih_info);
+- if (r)
+- goto interrupt;
++ if (ras_block->block == AMDGPU_RAS_BLOCK__UMC) {
++ r = amdgpu_ras_interrupt_add_handler(adev, &ih_info);
++ if (r)
++ goto interrupt;
++ }
+
+- amdgpu_ras_debugfs_create(adev, &fs_info);
++ amdgpu_ras_debugfs_create(adev, fs_info);
+
+- r = amdgpu_ras_sysfs_create(adev, &fs_info);
++ r = amdgpu_ras_sysfs_create(adev, fs_info);
+ if (r)
+ goto sysfs;
+ resume:
+- r = amdgpu_irq_get(adev, &adev->gmc.ecc_irq, 0);
+- if (r)
+- goto irq;
++ if (ras_block->block == AMDGPU_RAS_BLOCK__UMC) {
++ r = amdgpu_irq_get(adev, &adev->gmc.ecc_irq, 0);
++ if (r)
++ goto irq;
++ }
+
+ return 0;
+ irq:
+ amdgpu_ras_sysfs_remove(adev, *ras_if);
+ sysfs:
+ amdgpu_ras_debugfs_remove(adev, *ras_if);
+- amdgpu_ras_interrupt_remove_handler(adev, &ih_info);
++ if (ras_block->block == AMDGPU_RAS_BLOCK__UMC)
++ amdgpu_ras_interrupt_remove_handler(adev, &ih_info);
+ interrupt:
+ amdgpu_ras_feature_enable(adev, *ras_if, 0);
+ feature:
+@@ -826,6 +829,40 @@ static int gmc_v9_0_ecc_late_init(void *handle)
+ return r;
+ }
+
++static int gmc_v9_0_ecc_late_init(void *handle)
++{
++ int r;
++
++ struct ras_fs_if umc_fs_info = {
++ .sysfs_name = "umc_err_count",
++ .debugfs_name = "umc_err_inject",
++ };
++ struct ras_common_if umc_ras_block = {
++ .block = AMDGPU_RAS_BLOCK__UMC,
++ .type = AMDGPU_RAS_ERROR__MULTI_UNCORRECTABLE,
++ .sub_block_index = 0,
++ .name = "umc",
++ };
++ struct ras_fs_if mmhub_fs_info = {
++ .sysfs_name = "mmhub_err_count",
++ .debugfs_name = "mmhub_err_inject",
++ };
++ struct ras_common_if mmhub_ras_block = {
++ .block = AMDGPU_RAS_BLOCK__MMHUB,
++ .type = AMDGPU_RAS_ERROR__MULTI_UNCORRECTABLE,
++ .sub_block_index = 0,
++ .name = "mmhub",
++ };
++
++ r = gmc_v9_0_ecc_ras_block_late_init(handle,
++ &umc_fs_info, &umc_ras_block);
++ if (r)
++ return r;
++
++ r = gmc_v9_0_ecc_ras_block_late_init(handle,
++ &mmhub_fs_info, &mmhub_ras_block);
++ return r;
++}
+
+ static int gmc_v9_0_late_init(void *handle)
+ {
+@@ -1186,21 +1223,32 @@ static int gmc_v9_0_sw_fini(void *handle)
+ struct amdgpu_device *adev = (struct amdgpu_device *)handle;
+
+ if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__UMC) &&
+- adev->gmc.ras_if) {
+- struct ras_common_if *ras_if = adev->gmc.ras_if;
++ adev->gmc.umc_ras_if) {
++ struct ras_common_if *ras_if = adev->gmc.umc_ras_if;
+ struct ras_ih_if ih_info = {
+ .head = *ras_if,
+ };
+
+- /*remove fs first*/
++ /* remove fs first */
+ amdgpu_ras_debugfs_remove(adev, ras_if);
+ amdgpu_ras_sysfs_remove(adev, ras_if);
+- /*remove the IH*/
++ /* remove the IH */
+ amdgpu_ras_interrupt_remove_handler(adev, &ih_info);
+ amdgpu_ras_feature_enable(adev, ras_if, 0);
+ kfree(ras_if);
+ }
+
++ if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__MMHUB) &&
++ adev->gmc.mmhub_ras_if) {
++ struct ras_common_if *ras_if = adev->gmc.mmhub_ras_if;
++
++ /* remove fs and disable ras feature */
++ amdgpu_ras_debugfs_remove(adev, ras_if);
++ amdgpu_ras_sysfs_remove(adev, ras_if);
++ amdgpu_ras_feature_enable(adev, ras_if, 0);
++ kfree(ras_if);
++ }
++
+ amdgpu_gem_force_release(adev);
+ amdgpu_vm_manager_fini(adev);
+
+--
+2.17.1
+