| .. | .. |
|---|
| 10 | 10 | |
|---|
| 11 | 11 | /* MCG_CAP register defines */ |
|---|
| 12 | 12 | #define MCG_BANKCNT_MASK 0xff /* Number of Banks */ |
|---|
| 13 | | -#define MCG_CTL_P (1ULL<<8) /* MCG_CTL register available */ |
|---|
| 14 | | -#define MCG_EXT_P (1ULL<<9) /* Extended registers available */ |
|---|
| 15 | | -#define MCG_CMCI_P (1ULL<<10) /* CMCI supported */ |
|---|
| 13 | +#define MCG_CTL_P BIT_ULL(8) /* MCG_CTL register available */ |
|---|
| 14 | +#define MCG_EXT_P BIT_ULL(9) /* Extended registers available */ |
|---|
| 15 | +#define MCG_CMCI_P BIT_ULL(10) /* CMCI supported */ |
|---|
| 16 | 16 | #define MCG_EXT_CNT_MASK 0xff0000 /* Number of Extended registers */ |
|---|
| 17 | 17 | #define MCG_EXT_CNT_SHIFT 16 |
|---|
| 18 | 18 | #define MCG_EXT_CNT(c) (((c) & MCG_EXT_CNT_MASK) >> MCG_EXT_CNT_SHIFT) |
|---|
| 19 | | -#define MCG_SER_P (1ULL<<24) /* MCA recovery/new status bits */ |
|---|
| 20 | | -#define MCG_ELOG_P (1ULL<<26) /* Extended error log supported */ |
|---|
| 21 | | -#define MCG_LMCE_P (1ULL<<27) /* Local machine check supported */ |
|---|
| 19 | +#define MCG_SER_P BIT_ULL(24) /* MCA recovery/new status bits */ |
|---|
| 20 | +#define MCG_ELOG_P BIT_ULL(26) /* Extended error log supported */ |
|---|
| 21 | +#define MCG_LMCE_P BIT_ULL(27) /* Local machine check supported */ |
|---|
| 22 | 22 | |
|---|
| 23 | 23 | /* MCG_STATUS register defines */ |
|---|
| 24 | | -#define MCG_STATUS_RIPV (1ULL<<0) /* restart ip valid */ |
|---|
| 25 | | -#define MCG_STATUS_EIPV (1ULL<<1) /* ip points to correct instruction */ |
|---|
| 26 | | -#define MCG_STATUS_MCIP (1ULL<<2) /* machine check in progress */ |
|---|
| 27 | | -#define MCG_STATUS_LMCES (1ULL<<3) /* LMCE signaled */ |
|---|
| 24 | +#define MCG_STATUS_RIPV BIT_ULL(0) /* restart ip valid */ |
|---|
| 25 | +#define MCG_STATUS_EIPV BIT_ULL(1) /* ip points to correct instruction */ |
|---|
| 26 | +#define MCG_STATUS_MCIP BIT_ULL(2) /* machine check in progress */ |
|---|
| 27 | +#define MCG_STATUS_LMCES BIT_ULL(3) /* LMCE signaled */ |
|---|
| 28 | 28 | |
|---|
| 29 | 29 | /* MCG_EXT_CTL register defines */ |
|---|
| 30 | | -#define MCG_EXT_CTL_LMCE_EN (1ULL<<0) /* Enable LMCE */ |
|---|
| 30 | +#define MCG_EXT_CTL_LMCE_EN BIT_ULL(0) /* Enable LMCE */ |
|---|
| 31 | 31 | |
|---|
| 32 | 32 | /* MCi_STATUS register defines */ |
|---|
| 33 | | -#define MCI_STATUS_VAL (1ULL<<63) /* valid error */ |
|---|
| 34 | | -#define MCI_STATUS_OVER (1ULL<<62) /* previous errors lost */ |
|---|
| 35 | | -#define MCI_STATUS_UC (1ULL<<61) /* uncorrected error */ |
|---|
| 36 | | -#define MCI_STATUS_EN (1ULL<<60) /* error enabled */ |
|---|
| 37 | | -#define MCI_STATUS_MISCV (1ULL<<59) /* misc error reg. valid */ |
|---|
| 38 | | -#define MCI_STATUS_ADDRV (1ULL<<58) /* addr reg. valid */ |
|---|
| 39 | | -#define MCI_STATUS_PCC (1ULL<<57) /* processor context corrupt */ |
|---|
| 40 | | -#define MCI_STATUS_S (1ULL<<56) /* Signaled machine check */ |
|---|
| 41 | | -#define MCI_STATUS_AR (1ULL<<55) /* Action required */ |
|---|
| 33 | +#define MCI_STATUS_VAL BIT_ULL(63) /* valid error */ |
|---|
| 34 | +#define MCI_STATUS_OVER BIT_ULL(62) /* previous errors lost */ |
|---|
| 35 | +#define MCI_STATUS_UC BIT_ULL(61) /* uncorrected error */ |
|---|
| 36 | +#define MCI_STATUS_EN BIT_ULL(60) /* error enabled */ |
|---|
| 37 | +#define MCI_STATUS_MISCV BIT_ULL(59) /* misc error reg. valid */ |
|---|
| 38 | +#define MCI_STATUS_ADDRV BIT_ULL(58) /* addr reg. valid */ |
|---|
| 39 | +#define MCI_STATUS_PCC BIT_ULL(57) /* processor context corrupt */ |
|---|
| 40 | +#define MCI_STATUS_S BIT_ULL(56) /* Signaled machine check */ |
|---|
| 41 | +#define MCI_STATUS_AR BIT_ULL(55) /* Action required */ |
|---|
| 42 | +#define MCI_STATUS_CEC_SHIFT 38 /* Corrected Error Count */ |
|---|
| 43 | +#define MCI_STATUS_CEC_MASK GENMASK_ULL(52,38) |
|---|
| 44 | +#define MCI_STATUS_CEC(c) (((c) & MCI_STATUS_CEC_MASK) >> MCI_STATUS_CEC_SHIFT) |
|---|
| 42 | 45 | |
|---|
| 43 | 46 | /* AMD-specific bits */ |
|---|
| 44 | | -#define MCI_STATUS_TCC (1ULL<<55) /* Task context corrupt */ |
|---|
| 45 | | -#define MCI_STATUS_SYNDV (1ULL<<53) /* synd reg. valid */ |
|---|
| 46 | | -#define MCI_STATUS_DEFERRED (1ULL<<44) /* uncorrected error, deferred exception */ |
|---|
| 47 | | -#define MCI_STATUS_POISON (1ULL<<43) /* access poisonous data */ |
|---|
| 47 | +#define MCI_STATUS_TCC BIT_ULL(55) /* Task context corrupt */ |
|---|
| 48 | +#define MCI_STATUS_SYNDV BIT_ULL(53) /* synd reg. valid */ |
|---|
| 49 | +#define MCI_STATUS_DEFERRED BIT_ULL(44) /* uncorrected error, deferred exception */ |
|---|
| 50 | +#define MCI_STATUS_POISON BIT_ULL(43) /* access poisonous data */ |
|---|
| 51 | +#define MCI_STATUS_SCRUB BIT_ULL(40) /* Error detected during scrub operation */ |
|---|
| 48 | 52 | |
|---|
| 49 | 53 | /* |
|---|
| 50 | 54 | * McaX field if set indicates a given bank supports MCA extensions: |
|---|
| .. | .. |
|---|
| 84 | 88 | #define MCI_MISC_ADDR_GENERIC 7 /* generic */ |
|---|
| 85 | 89 | |
|---|
| 86 | 90 | /* CTL2 register defines */ |
|---|
| 87 | | -#define MCI_CTL2_CMCI_EN (1ULL << 30) |
|---|
| 91 | +#define MCI_CTL2_CMCI_EN BIT_ULL(30) |
|---|
| 88 | 92 | #define MCI_CTL2_CMCI_THRESHOLD_MASK 0x7fffULL |
|---|
| 89 | 93 | |
|---|
| 90 | 94 | #define MCJ_CTX_MASK 3 |
|---|
| .. | .. |
|---|
| 98 | 102 | |
|---|
| 99 | 103 | #define MCE_OVERFLOW 0 /* bit 0 in flags means overflow */ |
|---|
| 100 | 104 | |
|---|
| 101 | | -#define MCE_LOG_LEN 32 |
|---|
| 105 | +#define MCE_LOG_MIN_LEN 32U |
|---|
| 102 | 106 | #define MCE_LOG_SIGNATURE "MACHINECHECK" |
|---|
| 103 | 107 | |
|---|
| 104 | 108 | /* AMD Scalable MCA */ |
|---|
| .. | .. |
|---|
| 123 | 127 | #define MSR_AMD64_SMCA_MCx_DEADDR(x) (MSR_AMD64_SMCA_MC0_DEADDR + 0x10*(x)) |
|---|
| 124 | 128 | #define MSR_AMD64_SMCA_MCx_MISCy(x, y) ((MSR_AMD64_SMCA_MC0_MISC1 + y) + (0x10*(x))) |
|---|
| 125 | 129 | |
|---|
| 130 | +#define XEC(x, mask) (((x) >> 16) & mask) |
|---|
| 131 | + |
|---|
| 132 | +/* mce.kflags flag bits for logging etc. */ |
|---|
| 133 | +#define MCE_HANDLED_CEC BIT_ULL(0) |
|---|
| 134 | +#define MCE_HANDLED_UC BIT_ULL(1) |
|---|
| 135 | +#define MCE_HANDLED_EXTLOG BIT_ULL(2) |
|---|
| 136 | +#define MCE_HANDLED_NFIT BIT_ULL(3) |
|---|
| 137 | +#define MCE_HANDLED_EDAC BIT_ULL(4) |
|---|
| 138 | +#define MCE_HANDLED_MCELOG BIT_ULL(5) |
|---|
| 139 | + |
|---|
| 140 | +/* |
|---|
| 141 | + * Indicates an MCE which has happened in kernel space but from |
|---|
| 142 | + * which the kernel can recover simply by executing fixup_exception() |
|---|
| 143 | + * so that an error is returned to the caller of the function that |
|---|
| 144 | + * hit the machine check. |
|---|
| 145 | + */ |
|---|
| 146 | +#define MCE_IN_KERNEL_RECOV BIT_ULL(6) |
|---|
| 147 | + |
|---|
| 148 | +/* |
|---|
| 149 | + * Indicates an MCE that happened in kernel space while copying data |
|---|
| 150 | + * from user. In this case fixup_exception() gets the kernel to the |
|---|
| 151 | + * error exit for the copy function. Machine check handler can then |
|---|
| 152 | + * treat it like a fault taken in user mode. |
|---|
| 153 | + */ |
|---|
| 154 | +#define MCE_IN_KERNEL_COPYIN BIT_ULL(7) |
|---|
| 155 | + |
|---|
| 126 | 156 | /* |
|---|
| 127 | 157 | * This structure contains all data related to the MCE log. Also |
|---|
| 128 | 158 | * carries a signature to make it easier to find from external |
|---|
| .. | .. |
|---|
| 131 | 161 | */ |
|---|
| 132 | 162 | struct mce_log_buffer { |
|---|
| 133 | 163 | char signature[12]; /* "MACHINECHECK" */ |
|---|
| 134 | | - unsigned len; /* = MCE_LOG_LEN */ |
|---|
| 164 | + unsigned len; /* = elements in .mce_entry[] */ |
|---|
| 135 | 165 | unsigned next; |
|---|
| 136 | 166 | unsigned flags; |
|---|
| 137 | 167 | unsigned recordlen; /* length of struct mce */ |
|---|
| 138 | | - struct mce entry[MCE_LOG_LEN]; |
|---|
| 168 | + struct mce entry[]; |
|---|
| 139 | 169 | }; |
|---|
| 140 | 170 | |
|---|
| 171 | +/* Highest last */ |
|---|
| 141 | 172 | enum mce_notifier_prios { |
|---|
| 142 | | - MCE_PRIO_FIRST = INT_MAX, |
|---|
| 143 | | - MCE_PRIO_SRAO = INT_MAX - 1, |
|---|
| 144 | | - MCE_PRIO_EXTLOG = INT_MAX - 2, |
|---|
| 145 | | - MCE_PRIO_NFIT = INT_MAX - 3, |
|---|
| 146 | | - MCE_PRIO_EDAC = INT_MAX - 4, |
|---|
| 147 | | - MCE_PRIO_MCELOG = 1, |
|---|
| 148 | | - MCE_PRIO_LOWEST = 0, |
|---|
| 173 | + MCE_PRIO_LOWEST, |
|---|
| 174 | + MCE_PRIO_MCELOG, |
|---|
| 175 | + MCE_PRIO_EDAC, |
|---|
| 176 | + MCE_PRIO_NFIT, |
|---|
| 177 | + MCE_PRIO_EXTLOG, |
|---|
| 178 | + MCE_PRIO_UC, |
|---|
| 179 | + MCE_PRIO_EARLY, |
|---|
| 180 | + MCE_PRIO_CEC, |
|---|
| 181 | + MCE_PRIO_HIGHEST = MCE_PRIO_CEC |
|---|
| 149 | 182 | }; |
|---|
| 150 | 183 | |
|---|
| 151 | 184 | struct notifier_block; |
|---|
| .. | .. |
|---|
| 156 | 189 | #include <linux/atomic.h> |
|---|
| 157 | 190 | |
|---|
| 158 | 191 | extern int mce_p5_enabled; |
|---|
| 192 | + |
|---|
| 193 | +#ifdef CONFIG_ARCH_HAS_COPY_MC |
|---|
| 194 | +extern void enable_copy_mc_fragile(void); |
|---|
| 195 | +unsigned long __must_check copy_mc_fragile(void *dst, const void *src, unsigned cnt); |
|---|
| 196 | +#else |
|---|
| 197 | +static inline void enable_copy_mc_fragile(void) |
|---|
| 198 | +{ |
|---|
| 199 | +} |
|---|
| 200 | +#endif |
|---|
| 159 | 201 | |
|---|
| 160 | 202 | #ifdef CONFIG_X86_MCE |
|---|
| 161 | 203 | int mcheck_init(void); |
|---|
| .. | .. |
|---|
| 183 | 225 | void mce_log(struct mce *m); |
|---|
| 184 | 226 | DECLARE_PER_CPU(struct device *, mce_device); |
|---|
| 185 | 227 | |
|---|
| 186 | | -/* |
|---|
| 187 | | - * Maximum banks number. |
|---|
| 188 | | - * This is the limit of the current register layout on |
|---|
| 189 | | - * Intel CPUs. |
|---|
| 190 | | - */ |
|---|
| 191 | | -#define MAX_NR_BANKS 32 |
|---|
| 228 | +/* Maximum number of MCA banks per CPU. */ |
|---|
| 229 | +#define MAX_NR_BANKS 64 |
|---|
| 192 | 230 | |
|---|
| 193 | 231 | #ifdef CONFIG_X86_MCE_INTEL |
|---|
| 194 | 232 | void mce_intel_feature_init(struct cpuinfo_x86 *c); |
|---|
| .. | .. |
|---|
| 206 | 244 | static inline void cmci_recheck(void) {} |
|---|
| 207 | 245 | #endif |
|---|
| 208 | 246 | |
|---|
| 209 | | -#ifdef CONFIG_X86_MCE_AMD |
|---|
| 210 | | -void mce_amd_feature_init(struct cpuinfo_x86 *c); |
|---|
| 211 | | -int umc_normaddr_to_sysaddr(u64 norm_addr, u16 nid, u8 umc, u64 *sys_addr); |
|---|
| 212 | | -#else |
|---|
| 213 | | -static inline void mce_amd_feature_init(struct cpuinfo_x86 *c) { } |
|---|
| 214 | | -static inline int umc_normaddr_to_sysaddr(u64 norm_addr, u16 nid, u8 umc, u64 *sys_addr) { return -EINVAL; }; |
|---|
| 215 | | -#endif |
|---|
| 216 | | - |
|---|
| 217 | 247 | int mce_available(struct cpuinfo_x86 *c); |
|---|
| 218 | 248 | bool mce_is_memory_error(struct mce *m); |
|---|
| 219 | 249 | bool mce_is_correctable(struct mce *m); |
|---|
| .. | .. |
|---|
| 229 | 259 | MCP_TIMESTAMP = BIT(0), /* log time stamp */ |
|---|
| 230 | 260 | MCP_UC = BIT(1), /* log uncorrected errors */ |
|---|
| 231 | 261 | MCP_DONTLOG = BIT(2), /* only clear, don't log */ |
|---|
| 262 | + MCP_QUEUE_LOG = BIT(3), /* only queue to genpool */ |
|---|
| 232 | 263 | }; |
|---|
| 233 | 264 | bool machine_check_poll(enum mcp_flags flags, mce_banks_t *b); |
|---|
| 234 | 265 | |
|---|
| .. | .. |
|---|
| 242 | 273 | /* |
|---|
| 243 | 274 | * Exception handler |
|---|
| 244 | 275 | */ |
|---|
| 245 | | - |
|---|
| 246 | | -/* Call the installed machine check handler for this CPU setup. */ |
|---|
| 247 | | -extern void (*machine_check_vector)(struct pt_regs *, long error_code); |
|---|
| 248 | | -void do_machine_check(struct pt_regs *, long); |
|---|
| 276 | +void do_machine_check(struct pt_regs *pt_regs); |
|---|
| 249 | 277 | |
|---|
| 250 | 278 | /* |
|---|
| 251 | 279 | * Threshold handler |
|---|
| .. | .. |
|---|
| 294 | 322 | /* These may be used by multiple smca_hwid_mcatypes */ |
|---|
| 295 | 323 | enum smca_bank_types { |
|---|
| 296 | 324 | SMCA_LS = 0, /* Load Store */ |
|---|
| 325 | + SMCA_LS_V2, /* Load Store */ |
|---|
| 297 | 326 | SMCA_IF, /* Instruction Fetch */ |
|---|
| 298 | 327 | SMCA_L2_CACHE, /* L2 Cache */ |
|---|
| 299 | 328 | SMCA_DE, /* Decoder Unit */ |
|---|
| .. | .. |
|---|
| 302 | 331 | SMCA_FP, /* Floating Point */ |
|---|
| 303 | 332 | SMCA_L3_CACHE, /* L3 Cache */ |
|---|
| 304 | 333 | SMCA_CS, /* Coherent Slave */ |
|---|
| 334 | + SMCA_CS_V2, /* Coherent Slave */ |
|---|
| 305 | 335 | SMCA_PIE, /* Power, Interrupts, etc. */ |
|---|
| 306 | 336 | SMCA_UMC, /* Unified Memory Controller */ |
|---|
| 307 | 337 | SMCA_PB, /* Parameter Block */ |
|---|
| 308 | 338 | SMCA_PSP, /* Platform Security Processor */ |
|---|
| 339 | + SMCA_PSP_V2, /* Platform Security Processor */ |
|---|
| 309 | 340 | SMCA_SMU, /* System Management Unit */ |
|---|
| 341 | + SMCA_SMU_V2, /* System Management Unit */ |
|---|
| 342 | + SMCA_MP5, /* Microprocessor 5 Unit */ |
|---|
| 343 | + SMCA_NBIO, /* Northbridge IO Unit */ |
|---|
| 344 | + SMCA_PCIE, /* PCI Express Unit */ |
|---|
| 310 | 345 | N_SMCA_BANK_TYPES |
|---|
| 311 | 346 | }; |
|---|
| 312 | 347 | |
|---|
| .. | .. |
|---|
| 315 | 350 | struct smca_hwid { |
|---|
| 316 | 351 | unsigned int bank_type; /* Use with smca_bank_types for easy indexing. */ |
|---|
| 317 | 352 | u32 hwid_mcatype; /* (hwid,mcatype) tuple */ |
|---|
| 318 | | - u32 xec_bitmap; /* Bitmap of valid ExtErrorCodes; current max is 21. */ |
|---|
| 319 | 353 | u8 count; /* Number of instances. */ |
|---|
| 320 | 354 | }; |
|---|
| 321 | 355 | |
|---|
| .. | .. |
|---|
| 333 | 367 | extern int mce_threshold_create_device(unsigned int cpu); |
|---|
| 334 | 368 | extern int mce_threshold_remove_device(unsigned int cpu); |
|---|
| 335 | 369 | |
|---|
| 370 | +void mce_amd_feature_init(struct cpuinfo_x86 *c); |
|---|
| 371 | +int umc_normaddr_to_sysaddr(u64 norm_addr, u16 nid, u8 umc, u64 *sys_addr); |
|---|
| 372 | + |
|---|
| 336 | 373 | #else |
|---|
| 337 | 374 | |
|---|
| 338 | | -static inline int mce_threshold_create_device(unsigned int cpu) { return 0; }; |
|---|
| 339 | | -static inline int mce_threshold_remove_device(unsigned int cpu) { return 0; }; |
|---|
| 340 | | -static inline bool amd_mce_is_memory_error(struct mce *m) { return false; }; |
|---|
| 341 | | - |
|---|
| 375 | +static inline int mce_threshold_create_device(unsigned int cpu) { return 0; }; |
|---|
| 376 | +static inline int mce_threshold_remove_device(unsigned int cpu) { return 0; }; |
|---|
| 377 | +static inline bool amd_mce_is_memory_error(struct mce *m) { return false; }; |
|---|
| 378 | +static inline void mce_amd_feature_init(struct cpuinfo_x86 *c) { } |
|---|
| 379 | +static inline int |
|---|
| 380 | +umc_normaddr_to_sysaddr(u64 norm_addr, u16 nid, u8 umc, u64 *sys_addr) { return -EINVAL; }; |
|---|
| 342 | 381 | #endif |
|---|
| 343 | 382 | |
|---|
| 383 | +static inline void mce_hygon_feature_init(struct cpuinfo_x86 *c) { return mce_amd_feature_init(c); } |
|---|
| 344 | 384 | #endif /* _ASM_X86_MCE_H */ |
|---|