drm/amdgpu: removed GFX RAS support check in UMC ECC callback
author John Clements <john.clements@amd.com>
Fri, 3 Jan 2020 09:27:48 +0000 (17:27 +0800)
committer Alex Deucher <alexander.deucher@amd.com>
Tue, 7 Jan 2020 16:59:37 +0000 (11:59 -0500)
Enable GPU recovery in the event of an uncorrectable UMC error by no longer returning early from the UMC ECC callback when GFX RAS is supported.

Signed-off-by: John Clements <john.clements@amd.com>
Reviewed-by: Hawking Zhang <Hawking.Zhang@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/amdgpu_umc.c

index 8a6c733..f4d4085 100644 (file)
@@ -95,13 +95,6 @@ int amdgpu_umc_process_ras_data_cb(struct amdgpu_device *adev,
 {
        struct ras_err_data *err_data = (struct ras_err_data *)ras_error_status;
 
-       /* When “Full RAS” is enabled, the per-IP interrupt sources should
-        * be disabled and the driver should only look for the aggregated
-        * interrupt via sync flood
-        */
-       if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__GFX))
-               return AMDGPU_RAS_SUCCESS;
-
        kgd2kfd_set_sram_ecc_flag(adev->kfd.dev);
        if (adev->umc.funcs &&
            adev->umc.funcs->query_ras_error_count)
@@ -113,6 +106,7 @@ int amdgpu_umc_process_ras_data_cb(struct amdgpu_device *adev,
                err_data->err_addr =
                        kcalloc(adev->umc.max_ras_err_cnt_per_query,
                                sizeof(struct eeprom_table_record), GFP_KERNEL);
+
                /* still call query_ras_error_address to clear error status
                 * even NOMEM error is encountered
                 */