drm/amd/pm: Retrieve UMC ODECC error count from aca bank
authorCandice Li <candice.li@amd.com>
Fri, 2 Feb 2024 10:27:32 +0000 (18:27 +0800)
committerAlex Deucher <alexander.deucher@amd.com>
Wed, 7 Feb 2024 17:26:22 +0000 (12:26 -0500)
Instead of software managed counters.

Signed-off-by: Candice Li <candice.li@amd.com>
Reviewed-by: Hawking Zhang <Hawking.Zhang@amd.com>
Reviewed-by: Tao Zhou <tao.zhou1@amd.com>
Signed-off-by: Alex Deucher <alexander.deucher@amd.com>
drivers/gpu/drm/amd/pm/swsmu/smu13/smu_v13_0_6_ppt.c

index d6e14a5f406e63cf29e362ee718d8b435bae72cd..03873d784be6d6def1eb4b84f8b00becf68ef886 100644 (file)
@@ -2552,8 +2552,12 @@ static int mca_umc_mca_get_err_count(const struct mca_ras_info *mca_ras, struct
                                     enum amdgpu_mca_error_type type, struct mca_bank_entry *entry, uint32_t *count)
 {
        uint64_t status0;
+       uint32_t ext_error_code;
+       uint32_t odecc_err_cnt;
 
        status0 = entry->regs[MCA_REG_IDX_STATUS];
+       ext_error_code = MCA_REG__STATUS__ERRORCODEEXT(status0);
+       odecc_err_cnt = MCA_REG__MISC0__ERRCNT(entry->regs[MCA_REG_IDX_MISC0]);
 
        if (!REG_GET_FIELD(status0, MCMP1_STATUST0, Val)) {
                *count = 0;
@@ -2563,7 +2567,7 @@ static int mca_umc_mca_get_err_count(const struct mca_ras_info *mca_ras, struct
        if (umc_v12_0_is_deferred_error(adev, status0) ||
            umc_v12_0_is_uncorrectable_error(adev, status0) ||
            umc_v12_0_is_correctable_error(adev, status0))
-               *count = 1;
+               *count = (ext_error_code == 0) ? odecc_err_cnt : 1;
 
        return 0;
 }