xref: /openbmc/linux/arch/x86/kernel/cpu/mce/internal.h (revision 234489ac)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef __X86_MCE_INTERNAL_H__
3 #define __X86_MCE_INTERNAL_H__
4 
/*
 * Replace any earlier pr_fmt definition so that every format string passed
 * through pr_fmt() in files including this header is prefixed with "mce: ".
 * This is done ahead of the #include lines that follow.
 */
#undef pr_fmt
#define pr_fmt(fmt) "mce: " fmt
7 
8 #include <linux/device.h>
9 #include <asm/mce.h>
10 
/*
 * Severity grades assigned to a machine check, listed in ascending numeric
 * order. The values are spelled out so the ordering is visible at a glance;
 * MCE_UCNA_SEVERITY is an alias that shares the value of
 * MCE_DEFERRED_SEVERITY.
 */
enum severity_level {
	MCE_NO_SEVERITY		= 0,
	MCE_DEFERRED_SEVERITY	= 1,
	MCE_UCNA_SEVERITY	= MCE_DEFERRED_SEVERITY,
	MCE_KEEP_SEVERITY	= 2,
	MCE_SOME_SEVERITY	= 3,
	MCE_AO_SEVERITY		= 4,
	MCE_UC_SEVERITY		= 5,
	MCE_AR_SEVERITY		= 6,
	MCE_PANIC_SEVERITY	= 7,
};
22 
/*
 * Blocking notifier chain head; only declared here, defined outside this
 * header. NOTE(review): going by the name, this is the chain that MCE
 * decoders register on — confirm against its users.
 */
extern struct blocking_notifier_head x86_mce_decoder_chain;
24 
/*
 * Initial check interval: 5 minutes, written as 5 * 60.
 *
 * The expansion is parenthesized so the macro behaves as a single value
 * inside any surrounding expression; without the parentheses,
 * "x / INITIAL_CHECK_INTERVAL" would expand to "x / 5 * 60".
 */
#define INITIAL_CHECK_INTERVAL	(5 * 60)
26 
/*
 * List entry that carries one struct mce record together with the
 * struct llist_node used to link the entry into a list.
 */
struct mce_evt_llist {
	struct llist_node llnode;	/* list linkage */
	struct mce mce;			/* the record held by this entry */
};
31 
/*
 * MCE "gen pool" interface. Only the prototypes are visible in this header;
 * the implementations live elsewhere.
 * NOTE(review): the int-returning functions presumably follow the usual
 * 0 / negative-errno convention — confirm against the definitions.
 */
/* Has the signature of a work handler; the work_struct argument is named __unused. */
void mce_gen_pool_process(struct work_struct *__unused);
/* Returns a bool; by its name, true when the pool holds no records (confirm). */
bool mce_gen_pool_empty(void);
/* Takes the record to add. */
int mce_gen_pool_add(struct mce *mce);
int mce_gen_pool_init(void);
/* Returns a struct llist_node pointer to the prepared records. */
struct llist_node *mce_gen_pool_prepare_records(void);

/*
 * Grade the record @a. @regs is the register state, @msg is an output
 * pointer for a message string, @is_excp flags exception context.
 * NOTE(review): the return value is presumably an enum severity_level
 * value — confirm against the definition.
 */
int mce_severity(struct mce *a, struct pt_regs *regs, char **msg, bool is_excp);
/* Returns the dentry of the MCE debugfs directory. */
struct dentry *mce_get_debugfs_dir(void);

/*
 * Bank mask of type mce_banks_t, defined outside this header.
 * NOTE(review): by its name, it marks banks with corrected-error handling
 * disabled — confirm.
 */
extern mce_banks_t mce_banks_ce_disabled;
42 
/*
 * Intel-specific hooks.
 *
 * With CONFIG_X86_MCE_INTEL set, the real functions are declared here.
 * Without it, inline stand-ins are provided instead: the void hooks do
 * nothing, the bool hooks return false, and cmci_intel_adjust_timer is
 * aliased to mce_adjust_timer_default.
 */
#ifdef CONFIG_X86_MCE_INTEL
unsigned long cmci_intel_adjust_timer(unsigned long interval);
bool mce_intel_cmci_poll(void);
void mce_intel_hcpu_update(unsigned long cpu);
void cmci_disable_bank(int bank);
void intel_init_cmci(void);
void intel_init_lmce(void);
void intel_clear_lmce(void);
bool intel_filter_mce(struct mce *m);
#else /* !CONFIG_X86_MCE_INTEL */
# define cmci_intel_adjust_timer mce_adjust_timer_default

static inline bool mce_intel_cmci_poll(void)
{
	return false;
}

static inline void mce_intel_hcpu_update(unsigned long cpu)
{
}

static inline void cmci_disable_bank(int bank)
{
}

static inline void intel_init_cmci(void)
{
}

static inline void intel_init_lmce(void)
{
}

static inline void intel_clear_lmce(void)
{
}

static inline bool intel_filter_mce(struct mce *m)
{
	return false;
}
#endif /* CONFIG_X86_MCE_INTEL */
62 
/*
 * Declared here, defined elsewhere; takes an interval as unsigned long.
 * NOTE(review): the unit of @interval is not visible from this header
 * (presumably jiffies) — confirm against the definition.
 */
void mce_timer_kick(unsigned long interval);
64 
65 #ifdef CONFIG_ACPI_APEI
66 int apei_write_mce(struct mce *m);
67 ssize_t apei_read_mce(struct mce *m, u64 *record_id);
68 int apei_check_mce(void);
69 int apei_clear_mce(u64 record_id);
70 #else
71 static inline int apei_write_mce(struct mce *m)
72 {
73 	return -EINVAL;
74 }
75 static inline ssize_t apei_read_mce(struct mce *m, u64 *record_id)
76 {
77 	return 0;
78 }
79 static inline int apei_check_mce(void)
80 {
81 	return 0;
82 }
83 static inline int apei_clear_mce(u64 record_id)
84 {
85 	return -EINVAL;
86 }
87 #endif
88 
89 /*
90  * We consider records to be equivalent if bank+status+addr+misc all match.
91  * This is only used when the system is going down because of a fatal error
92  * to avoid cluttering the console log with essentially repeated information.
93  * In normal processing all errors seen are logged.
94  */
95 static inline bool mce_cmp(struct mce *m1, struct mce *m2)
96 {
97 	return m1->bank != m2->bank ||
98 		m1->status != m2->status ||
99 		m1->addr != m2->addr ||
100 		m1->misc != m2->misc;
101 }
102 
/* Device attribute object named "trigger"; declared here, defined elsewhere. */
extern struct device_attribute dev_attr_trigger;
104 
/*
 * Legacy mcelog hooks.
 *
 * With CONFIG_X86_MCELOG_LEGACY set, the real functions are declared.
 * Without it, all three calls compile down to empty inline functions.
 */
#ifdef CONFIG_X86_MCELOG_LEGACY
void mce_work_trigger(void);
void mce_register_injector_chain(struct notifier_block *nb);
void mce_unregister_injector_chain(struct notifier_block *nb);
#else /* !CONFIG_X86_MCELOG_LEGACY */
static inline void mce_work_trigger(void)
{
}

static inline void mce_register_injector_chain(struct notifier_block *nb)
{
}

static inline void mce_unregister_injector_chain(struct notifier_block *nb)
{
}
#endif /* CONFIG_X86_MCELOG_LEGACY */
114 
/*
 * MCA configuration state, shared through the mca_cfg instance declared
 * below.
 *
 * Layout: six 1-bit flags plus 58 reserved bits packed into one __u64
 * bitfield, followed by four bools, two int timeouts, a u32 and an s8.
 * NOTE(review): apart from ->initialized, the meaning of the individual
 * fields is not visible in this header — see the code that reads and
 * writes mca_cfg.
 */
struct mca_config {
	__u64 lmce_disabled		: 1,
	      disabled			: 1,
	      ser			: 1,
	      recovery			: 1,
	      bios_cmci_threshold	: 1,
	      /* Proper #MC exception handler is set */
	      initialized		: 1,
	      __reserved		: 58;

	bool dont_log_ce;
	bool cmci_disabled;
	bool ignore_ce;
	bool print_all;

	int monarch_timeout;
	int panic_timeout;
	u32 rip_msr;
	s8 bootlog;
};

/* The struct mca_config instance; defined outside this header. */
extern struct mca_config mca_cfg;
/* Declaration of the per-CPU, read-mostly unsigned int mce_num_banks. */
DECLARE_PER_CPU_READ_MOSTLY(unsigned int, mce_num_banks);
138 
/*
 * Vendor feature and quirk flags: eight 1-bit flags packed into a single
 * __u64 bitfield, with the remaining 56 bits reserved. The instance used
 * by the MCE code is mce_flags, declared below.
 */
struct mce_vendor_flags {
	/*
	 * Indicates that overflow conditions are not fatal, when set.
	 */
	__u64 overflow_recov	: 1,

	/*
	 * (AMD) SUCCOR stands for S/W UnCorrectable error COntainment and
	 * Recovery. It indicates support for data poisoning in HW and deferred
	 * error interrupts.
	 */
	succor			: 1,

	/*
	 * (AMD) SMCA: This bit indicates support for Scalable MCA which expands
	 * the register space for each MCA bank and also increases number of
	 * banks. Also, to accommodate the new banks and registers, the MCA
	 * register space is moved to a new MSR range.
	 */
	smca			: 1,

	/* AMD-style error thresholding banks present. */
	amd_threshold		: 1,

	/* Pentium, family 5-style MCA */
	p5			: 1,

	/* Centaur Winchip C6-style MCA */
	winchip			: 1,

	/* SandyBridge IFU quirk */
	snb_ifu_quirk		: 1,

	/* Skylake, Cascade Lake, Cooper Lake REP;MOVS* quirk */
	skx_repmov_quirk	: 1,

	/* Unused bits: 8 flags + 56 reserved = 64. */
	__reserved_0		: 56;
};

/* The struct mce_vendor_flags instance; defined outside this header. */
extern struct mce_vendor_flags mce_flags;
179 
/*
 * State kept for one MCA bank: a 64-bit ctl value followed by a __u64
 * bitfield holding two 1-bit flags and 62 reserved bits.
 */
struct mce_bank {
	/* subevents to enable */
	u64			ctl;

	/* initialise bank? */
	__u64 init		: 1,

	/*
	 * (AMD) MCA_CONFIG[McaLsbInStatusSupported]: When set, this bit indicates
	 * the LSB field is found in MCA_STATUS and not in MCA_ADDR.
	 */
	lsb_in_status		: 1,

	/* Unused bits: 2 flags + 62 reserved = 64. */
	__reserved_1		: 62;
};

/* Declaration of the per-CPU, read-mostly array of MAX_NR_BANKS struct mce_bank. */
DECLARE_PER_CPU_READ_MOSTLY(struct mce_bank[MAX_NR_BANKS], mce_banks_array);
197 
/*
 * Logical per-bank MCA register selector. mca_msr_reg() in this header
 * turns a (bank, selector) pair into a concrete MSR number.
 */
enum mca_msr {
	MCA_CTL		= 0,
	MCA_STATUS	= 1,
	MCA_ADDR	= 2,
	MCA_MISC	= 3,
};
204 
/*
 * Decide whether to add MCE record to MCE event pool or filter it out.
 * NOTE(review): the sense of the bool result is not visible here; the
 * inline *_filter_mce() stubs in this header return false, which suggests
 * false means "do not filter" — confirm against the definition.
 */
extern bool filter_mce(struct mce *m);
207 
/*
 * AMD-specific hooks.
 *
 * With CONFIG_X86_MCE_AMD set, amd_filter_mce() is declared and
 * smca_extract_err_addr() is provided inline. Without it, the filter
 * stand-in returns false and the address helper does nothing.
 */
#ifdef CONFIG_X86_MCE_AMD
extern bool amd_filter_mce(struct mce *m);

/*
 * Trim m->addr down to its valid error-address bits on SMCA systems.
 *
 * Nothing is done unless mce_flags.smca is set. Otherwise the 6-bit LSB
 * field, giving the position of the lowest valid address bit, is read from
 *
 *  - m->status bits [29:24] when this CPU's entry for the bank has
 *    lsb_in_status set (MCA_CONFIG[McaLsbInStatusSupported]); m->addr is
 *    then masked to bits [56:lsb];
 *  - m->addr bits [61:56] otherwise; m->addr is then masked to
 *    bits [55:lsb].
 */
static __always_inline void smca_extract_err_addr(struct mce *m)
{
	u8 low_bit;

	if (!mce_flags.smca)
		return;

	if (this_cpu_ptr(mce_banks_array)[m->bank].lsb_in_status) {
		low_bit = (m->status >> 24) & 0x3f;
		m->addr &= GENMASK_ULL(56, low_bit);
	} else {
		low_bit = (m->addr >> 56) & 0x3f;
		m->addr &= GENMASK_ULL(55, low_bit);
	}
}

#else /* !CONFIG_X86_MCE_AMD */
static inline bool amd_filter_mce(struct mce *m)
{
	return false;
}

static inline void smca_extract_err_addr(struct mce *m)
{
}
#endif /* CONFIG_X86_MCE_AMD */
239 
240 #ifdef CONFIG_X86_ANCIENT_MCE
241 void intel_p5_mcheck_init(struct cpuinfo_x86 *c);
242 void winchip_mcheck_init(struct cpuinfo_x86 *c);
243 noinstr void pentium_machine_check(struct pt_regs *regs);
244 noinstr void winchip_machine_check(struct pt_regs *regs);
245 static inline void enable_p5_mce(void) { mce_p5_enabled = 1; }
246 #else
247 static __always_inline void intel_p5_mcheck_init(struct cpuinfo_x86 *c) {}
248 static __always_inline void winchip_mcheck_init(struct cpuinfo_x86 *c) {}
249 static __always_inline void enable_p5_mce(void) {}
250 static __always_inline void pentium_machine_check(struct pt_regs *regs) {}
251 static __always_inline void winchip_machine_check(struct pt_regs *regs) {}
252 #endif
253 
/*
 * Takes an MSR number and returns a u64; declared noinstr and defined
 * outside this header. NOTE(review): by its name, this reads the given MSR
 * and returns its value — confirm against the definition.
 */
noinstr u64 mce_rdmsrl(u32 msr);
255 
256 static __always_inline u32 mca_msr_reg(int bank, enum mca_msr reg)
257 {
258 	if (cpu_feature_enabled(X86_FEATURE_SMCA)) {
259 		switch (reg) {
260 		case MCA_CTL:	 return MSR_AMD64_SMCA_MCx_CTL(bank);
261 		case MCA_ADDR:	 return MSR_AMD64_SMCA_MCx_ADDR(bank);
262 		case MCA_MISC:	 return MSR_AMD64_SMCA_MCx_MISC(bank);
263 		case MCA_STATUS: return MSR_AMD64_SMCA_MCx_STATUS(bank);
264 		}
265 	}
266 
267 	switch (reg) {
268 	case MCA_CTL:	 return MSR_IA32_MCx_CTL(bank);
269 	case MCA_ADDR:	 return MSR_IA32_MCx_ADDR(bank);
270 	case MCA_MISC:	 return MSR_IA32_MCx_MISC(bank);
271 	case MCA_STATUS: return MSR_IA32_MCx_STATUS(bank);
272 	}
273 
274 	return 0;
275 }
276 
277 #endif /* __X86_MCE_INTERNAL_H__ */
278