drm/amdgpu: add sdma ras error reset callback for aldebaran
authorHawking Zhang <Hawking.Zhang@amd.com>
Wed, 18 Nov 2020 16:25:09 +0000 (00:25 +0800)
committerAlex Deucher <alexander.deucher@amd.com>
Wed, 24 Mar 2021 02:55:39 +0000 (22:55 -0400)
The callback will be invoked to reset sdma ras error
counters when needed.

Signed-off-by: Hawking Zhang <Hawking.Zhang@amd.com>
Reviewed-by: Dennis Li<Dennis.Li@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/amdgpu/sdma_v4_4.c

index 3a5d0a6bc5785018e4fe5f3f40527a158098ae1e..6fcb95c89999313dc7b90a0b54f3281370eed137 100644 (file)
@@ -208,8 +208,25 @@ static int sdma_v4_4_query_ras_error_count(struct amdgpu_device *adev,
        return 0;
 };
 
+static void sdma_v4_4_reset_ras_error_count(struct amdgpu_device *adev)
+{
+       int i;
+       uint32_t reg_offset;
+
+       /* write 0 to EDC_COUNTER reg to clear sdma edc counters */
+       if (amdgpu_ras_is_supported(adev, AMDGPU_RAS_BLOCK__SDMA)) {
+               for (i = 0; i < adev->sdma.num_instances; i++) {
+                       reg_offset = sdma_v4_4_get_reg_offset(adev, i, regSDMA0_EDC_COUNTER);
+                       WREG32(reg_offset, 0);
+                       reg_offset = sdma_v4_4_get_reg_offset(adev, i, regSDMA0_EDC_COUNTER2);
+                       WREG32(reg_offset, 0);
+               }
+       }
+}
+
 const struct amdgpu_sdma_ras_funcs sdma_v4_4_ras_funcs = {
        .ras_late_init = amdgpu_sdma_ras_late_init,
        .ras_fini = amdgpu_sdma_ras_fini,
        .query_ras_error_count = sdma_v4_4_query_ras_error_count,
+       .reset_ras_error_count = sdma_v4_4_reset_ras_error_count,
 };