0001
0002
0003
0004
0005
0006
0007
0008
0009
0010
0011
0012
0013
0014
0015
0016
0017
0018
0019
0020
0021
0022
0023 #include "amdgpu_ras.h"
0024 #include "amdgpu.h"
0025 #include "amdgpu_mca.h"
0026
0027 #include "umc/umc_6_7_0_offset.h"
0028 #include "umc/umc_6_7_0_sh_mask.h"
0029
0030 void amdgpu_mca_query_correctable_error_count(struct amdgpu_device *adev,
0031 uint64_t mc_status_addr,
0032 unsigned long *error_count)
0033 {
0034 uint64_t mc_status = RREG64_PCIE(mc_status_addr);
0035
0036 if (REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, Val) == 1 &&
0037 REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, CECC) == 1)
0038 *error_count += 1;
0039 }
0040
0041 void amdgpu_mca_query_uncorrectable_error_count(struct amdgpu_device *adev,
0042 uint64_t mc_status_addr,
0043 unsigned long *error_count)
0044 {
0045 uint64_t mc_status = RREG64_PCIE(mc_status_addr);
0046
0047 if ((REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, Val) == 1) &&
0048 (REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, Deferred) == 1 ||
0049 REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, UECC) == 1 ||
0050 REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, PCC) == 1 ||
0051 REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, UC) == 1 ||
0052 REG_GET_FIELD(mc_status, MCA_UMC_UMC0_MCUMC_STATUST0, TCC) == 1))
0053 *error_count += 1;
0054 }
0055
0056 void amdgpu_mca_reset_error_count(struct amdgpu_device *adev,
0057 uint64_t mc_status_addr)
0058 {
0059 WREG64_PCIE(mc_status_addr, 0x0ULL);
0060 }
0061
0062 void amdgpu_mca_query_ras_error_count(struct amdgpu_device *adev,
0063 uint64_t mc_status_addr,
0064 void *ras_error_status)
0065 {
0066 struct ras_err_data *err_data = (struct ras_err_data *)ras_error_status;
0067
0068 amdgpu_mca_query_correctable_error_count(adev, mc_status_addr, &(err_data->ce_count));
0069 amdgpu_mca_query_uncorrectable_error_count(adev, mc_status_addr, &(err_data->ue_count));
0070
0071 amdgpu_mca_reset_error_count(adev, mc_status_addr);
0072 }