OSDN Git Service

drm/amdgpu/sriov add amdgpu_amdkfd_pre_reset in gpu reset
author Jack Zhang <Jack.Zhang1@amd.com>
Thu, 2 Apr 2020 07:10:24 +0000 (15:10 +0800)
committer Alex Deucher <alexander.deucher@amd.com>
Thu, 9 Apr 2020 14:43:14 +0000 (10:43 -0400)
kfd_pre_reset will free mem_objs allocated by kfd_gtt_sa_allocate

Without this change, the sriov tdr code path never frees that allocated
memory, which results in a memory leak.

v2: add a bugfix for the kiq ring test failure

Signed-off-by: Jack Zhang <Jack.Zhang1@amd.com>
Reviewed-by: Monk Liu <monk.liu@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/amdgpu_amdkfd_gfx_v10.c
drivers/gpu/drm/amd/amdgpu/amdgpu_amdkfd_gfx_v9.c
drivers/gpu/drm/amd/amdgpu/amdgpu_device.c

index 4ec6d0c..bdc1f5a 100644 (file)
@@ -543,6 +543,9 @@ static int kgd_hqd_destroy(struct kgd_dev *kgd, void *mqd,
        uint32_t temp;
        struct v10_compute_mqd *m = get_mqd(mqd);
 
+       if (amdgpu_sriov_vf(adev) && adev->in_gpu_reset)
+               return 0;
+
 #if 0
        unsigned long flags;
        int retry;
index df841c2..c2562d6 100644 (file)
@@ -541,6 +541,9 @@ int kgd_gfx_v9_hqd_destroy(struct kgd_dev *kgd, void *mqd,
        uint32_t temp;
        struct v9_mqd *m = get_mqd(mqd);
 
+       if (amdgpu_sriov_vf(adev) && adev->in_gpu_reset)
+               return 0;
+
        if (adev->in_gpu_reset)
                return -EIO;
 
index 9060196..626b46f 100644 (file)
@@ -3852,6 +3852,8 @@ static int amdgpu_device_reset_sriov(struct amdgpu_device *adev,
        if (r)
                return r;
 
+       amdgpu_amdkfd_pre_reset(adev);
+
        /* Resume IP prior to SMC */
        r = amdgpu_device_ip_reinit_early_sriov(adev);
        if (r)