blob: ea549a94361bd6119935170c35d72db2292cd2ed [file] [log] [blame]
Borislav Petkovb70ef012009-06-25 19:32:38 +02001#include <linux/module.h>
Borislav Petkov888ab8e2010-08-18 15:11:35 +02002#include <linux/slab.h>
3
Borislav Petkov47ca08a2010-09-27 15:30:39 +02004#include "mce_amd.h"
Doug Thompsonb52401ce2009-05-06 17:57:20 +02005
Borislav Petkov888ab8e2010-08-18 15:11:35 +02006static struct amd_decoder_ops *fam_ops;
7
Borislav Petkov2be64bf2010-09-17 19:11:47 +02008static u8 xec_mask = 0xf;
Borislav Petkov5ce88f62010-08-31 18:28:08 +02009
Borislav Petkov549d0422009-07-24 13:51:42 +020010static bool report_gart_errors;
Borislav Petkovb0b07a22011-08-24 18:44:22 +020011static void (*nb_bus_decoder)(int node_id, struct mce *m);
Borislav Petkov549d0422009-07-24 13:51:42 +020012
13void amd_report_gart_errors(bool v)
14{
15 report_gart_errors = v;
16}
17EXPORT_SYMBOL_GPL(amd_report_gart_errors);
18
Borislav Petkovb0b07a22011-08-24 18:44:22 +020019void amd_register_ecc_decoder(void (*f)(int, struct mce *))
Borislav Petkov549d0422009-07-24 13:51:42 +020020{
21 nb_bus_decoder = f;
22}
23EXPORT_SYMBOL_GPL(amd_register_ecc_decoder);
24
Borislav Petkovb0b07a22011-08-24 18:44:22 +020025void amd_unregister_ecc_decoder(void (*f)(int, struct mce *))
Borislav Petkov549d0422009-07-24 13:51:42 +020026{
27 if (nb_bus_decoder) {
28 WARN_ON(nb_bus_decoder != f);
29
30 nb_bus_decoder = NULL;
31 }
32}
33EXPORT_SYMBOL_GPL(amd_unregister_ecc_decoder);
34
/*
 * String representations of the different MCA-reported error types; see F3x48
 * or MSR0000_0411.
 */
Borislav Petkov63375832010-09-06 18:13:39 +020039
/* transaction type */
static const char * const tt_msgs[] = {
	[0] = "INSN",
	[1] = "DATA",
	[2] = "GEN",
	[3] = "RESV",
};

/* cache level */
static const char * const ll_msgs[] = {
	[0] = "RESV",
	[1] = "L1",
	[2] = "L2",
	[3] = "L3/GEN",
};

/* memory transaction type */
static const char * const rrrr_msgs[] = {
	[0] = "GEN",
	[1] = "RD",
	[2] = "WR",
	[3] = "DRD",
	[4] = "DWR",
	[5] = "IRD",
	[6] = "PRF",
	[7] = "EV",
	[8] = "SNP",
};
50
/* participating processor (exported for use outside this file) */
const char * const pp_msgs[] = {
	[0] = "SRC",
	[1] = "RES",
	[2] = "OBS",
	[3] = "GEN",
};
EXPORT_SYMBOL_GPL(pp_msgs);
Doug Thompsonb52401ce2009-05-06 17:57:20 +020054
/* request timeout */
static const char * const to_msgs[] = {
	[0] = "no timeout",
	[1] = "timed out",
};

/* memory or i/o */
static const char * const ii_msgs[] = {
	[0] = "MEM",
	[1] = "RESV",
	[2] = "IO",
	[3] = "GEN",
};

/* internal error type */
static const char * const uu_msgs[] = {
	[0] = "RESV",
	[1] = "RESV",
	[2] = "HWA",
	[3] = "RESV",
};
Jacob Shin980eec82012-12-18 15:06:11 -060063
/*
 * MC1 descriptions consumed by f15h_mc1_mce(). The table is dense while the
 * xec space is not, so the lookup subtracts an offset:
 *   xec 0x00..0x0a -> [xec]
 *   xec 0x0d       -> [xec - 2]
 *   xec 0x10..0x15 -> [xec - 4]
 */
static const char * const f15h_mc1_mce_desc[] = {
	[0]  = "UC during a demand linefill from L2",		/* xec = 0x0 */
	[1]  = "Parity error during data load from IC",
	[2]  = "Parity error for IC valid bit",
	[3]  = "Main tag parity error",
	[4]  = "Parity error in prediction queue",
	[5]  = "PFB data/address parity error",
	[6]  = "Parity error in the branch status reg",
	[7]  = "PFB promotion address error",
	[8]  = "Tag error during probe/victimization",
	[9]  = "Parity error for IC probe tag valid bit",
	[10] = "PFB non-cacheable bit parity error",		/* xec = 0xa */
	[11] = "PFB valid bit parity error",			/* xec = 0xd */
	[12] = "Microcode Patch Buffer",			/* xec = 0x10 */
	[13] = "uop queue",					/* xec = 0x11 */
	[14] = "insn buffer",
	[15] = "predecode buffer",
	[16] = "fetch address FIFO",
	[17] = "dispatch uop queue",				/* xec = 0x15 */
};
84
/*
 * MC2 memory-error descriptions consumed by f15h_mc2_mce():
 *   xec 0x04..0x0c -> [xec - 0x4]
 *   xec 0x10..0x14 -> [xec - 0x7]
 */
static const char * const f15h_mc2_mce_desc[] = {
	[0]  = "Fill ECC error on data fills",			/* xec = 0x4 */
	[1]  = "Fill parity error on insn fills",
	[2]  = "Prefetcher request FIFO parity error",
	[3]  = "PRQ address parity error",
	[4]  = "PRQ data parity error",
	[5]  = "WCC Tag ECC error",
	[6]  = "WCC Data ECC error",
	[7]  = "WCB Data parity error",
	[8]  = "VB Data ECC or parity error",			/* xec = 0xc */
	[9]  = "L2 Tag ECC error",				/* xec = 0x10 */
	[10] = "Hard L2 Tag ECC error",
	[11] = "Multiple hits on L2 tag",
	[12] = "XAB parity error",
	[13] = "PRB address parity error",			/* xec = 0x14 */
};
101
/*
 * MC4 descriptions consumed by decode_mc4_mce():
 *   xec 0x00..0x0e -> [xec]
 *   xec 0x1c..0x1f -> [xec - 13]
 */
static const char * const mc4_mce_desc[] = {
	[0]  = "DRAM ECC error detected on the NB",		/* xec = 0x0 */
	[1]  = "CRC error detected on HT link",
	[2]  = "Link-defined sync error packets detected on HT link",
	[3]  = "HT Master abort",
	[4]  = "HT Target abort",
	[5]  = "Invalid GART PTE entry during GART table walk",
	[6]  = "Unsupported atomic RMW received from an IO link",
	[7]  = "Watchdog timeout due to lack of progress",
	[8]  = "DRAM ECC error detected on the NB",		/* xec = 0x8 */
	[9]  = "SVM DMA Exclusion Vector error",
	[10] = "HT data error detected on link",
	[11] = "Protocol error (link, L3, probe filter)",
	[12] = "NB internal arrays parity error",
	[13] = "DRAM addr/ctl signals parity error",
	[14] = "IO link transmission error",			/* xec = 0xe */
	[15] = "L3 data cache ECC error",			/* xec = 0x1c */
	[16] = "L3 cache tag error",
	[17] = "L3 LRU parity bits error",
	[18] = "ECC Error in the Probe Filter directory",	/* xec = 0x1f */
};
123
/*
 * MC5 descriptions, indexed directly by xec (0x0..0xd) in decode_mc5_mce().
 * Entries 0x0 and 0xc are printed verbatim; the others get a
 * " parity error" suffix appended by the decoder.
 */
static const char * const mc5_mce_desc[] = {
	[0x0] = "CPU Watchdog timer expire",
	[0x1] = "Wakeup array dest tag",
	[0x2] = "AG payload array",
	[0x3] = "EX payload array",
	[0x4] = "IDRF array",
	[0x5] = "Retire dispatch queue",
	[0x6] = "Mapper checkpoint array",
	[0x7] = "Physical register file EX0 port",
	[0x8] = "Physical register file EX1 port",
	[0x9] = "Physical register file AG0 port",
	[0xa] = "Physical register file AG1 port",
	[0xb] = "Flag register file",
	[0xc] = "DE error occurred",
	[0xd] = "Retire status queue",
};
140
/*
 * MC6 descriptions. Array position is significant; the consumer is not
 * visible in this part of the file (presumably decode_mc6_mce() - confirm).
 */
static const char * const mc6_mce_desc[] = {
	[0] = "Hardware Assertion",
	[1] = "Free List",
	[2] = "Physical Register File",
	[3] = "Retire Queue",
	[4] = "Scheduler table",
	[5] = "Status Register File",
};
149
/* Scalable MCA error strings */

/*
 * SMCA "ls" bank descriptions. Array position is significant; the lookup code
 * is not visible in this part of the file (presumably indexed by the extended
 * error code - confirm against the SMCA decoder).
 */
static const char * const smca_ls_mce_desc[] = {
	[0]  = "Load queue parity",
	[1]  = "Store queue parity",
	[2]  = "Miss address buffer payload parity",
	[3]  = "L1 TLB parity",
	[4]  = "Reserved",
	[5]  = "DC tag error type 6",
	[6]  = "DC tag error type 1",
	[7]  = "Internal error type 1",
	[8]  = "Internal error type 2",
	[9]  = "Sys Read data error thread 0",
	[10] = "Sys read data error thread 1",
	[11] = "DC tag error type 2",
	/* Spelling fixed: this string used to read "comsumption". */
	[12] = "DC data error type 1 (poison consumption)",
	[13] = "DC data error type 2",
	[14] = "DC data error type 3",
	[15] = "DC tag error type 4",
	[16] = "L2 TLB parity",
	[17] = "PDC parity error",
	[18] = "DC tag error type 3",
	[19] = "DC tag error type 5",
	[20] = "L2 fill data error",
};
174
/* SMCA "if" bank descriptions; array position is significant. */
static const char * const smca_if_mce_desc[] = {
	[0]  = "microtag probe port parity error",
	[1]  = "IC microtag or full tag multi-hit error",
	[2]  = "IC full tag parity",
	[3]  = "IC data array parity",
	[4]  = "Decoupling queue phys addr parity error",
	[5]  = "L0 ITLB parity error",
	[6]  = "L1 ITLB parity error",
	[7]  = "L2 ITLB parity error",
	[8]  = "BPQ snoop parity on Thread 0",
	[9]  = "BPQ snoop parity on Thread 1",
	[10] = "L1 BTB multi-match error",
	[11] = "L2 BTB multi-match error",
	[12] = "L2 Cache Response Poison error",
	[13] = "System Read Data error",
};
191
/* SMCA "l2" bank descriptions; array position is significant. */
static const char * const smca_l2_mce_desc[] = {
	[0] = "L2M tag multi-way-hit error",
	[1] = "L2M tag ECC error",
	[2] = "L2M data ECC error",
	[3] = "HW assert",
};
198
/* SMCA "de" bank descriptions; array position is significant. */
static const char * const smca_de_mce_desc[] = {
	[0] = "uop cache tag parity error",
	[1] = "uop cache data parity error",
	[2] = "Insn buffer parity error",
	[3] = "uop queue parity error",
	[4] = "Insn dispatch queue parity error",
	[5] = "Fetch address FIFO parity",
	[6] = "Patch RAM data parity",
	[7] = "Patch RAM sequencer parity",
	[8] = "uop buffer parity",
};
210
/* SMCA "ex" bank descriptions; array position is significant. */
static const char * const smca_ex_mce_desc[] = {
	[0]  = "Watchdog timeout error",
	[1]  = "Phy register file parity",
	[2]  = "Flag register file parity",
	[3]  = "Immediate displacement register file parity",
	[4]  = "Address generator payload parity",
	[5]  = "EX payload parity",
	[6]  = "Checkpoint queue parity",
	[7]  = "Retire dispatch queue parity",
	[8]  = "Retire status queue parity error",
	[9]  = "Scheduling queue parity error",
	[10] = "Branch buffer queue parity error",
};
224
/* SMCA "fp" bank descriptions; array position is significant. */
static const char * const smca_fp_mce_desc[] = {
	[0] = "Physical register file parity",
	[1] = "Freelist parity error",
	[2] = "Schedule queue parity",
	[3] = "NSQ parity error",
	[4] = "Retire queue parity",
	[5] = "Status register file parity",
	[6] = "Hardware assertion",
};
234
/* SMCA "l3" bank descriptions; array position is significant. */
static const char * const smca_l3_mce_desc[] = {
	[0] = "Shadow tag macro ECC error",
	[1] = "Shadow tag macro multi-way-hit error",
	[2] = "L3M tag ECC error",
	[3] = "L3M tag multi-way-hit error",
	[4] = "L3M data ECC error",
	[5] = "XI parity, L3 fill done channel error",
	[6] = "L3 victim queue parity",
	[7] = "L3 HW assert",
};
245
/* SMCA "cs" bank descriptions; array position is significant. */
static const char * const smca_cs_mce_desc[] = {
	[0] = "Illegal request from transport layer",
	[1] = "Address violation",
	[2] = "Security violation",
	[3] = "Illegal response from transport layer",
	[4] = "Unexpected response",
	[5] = "Parity error on incoming request or probe response data",
	[6] = "Parity error on incoming read response data",
	[7] = "Atomic request parity",
	[8] = "ECC error on probe filter access",
};
257
/* SMCA "pie" bank descriptions; array position is significant. */
static const char * const smca_pie_mce_desc[] = {
	[0] = "HW assert",
	[1] = "Internal PIE register security violation",
	[2] = "Error on GMI link",
	[3] = "Poison data written to internal PIE register",
};
264
/* SMCA "umc" bank descriptions; array position is significant. */
static const char * const smca_umc_mce_desc[] = {
	[0] = "DRAM ECC error",
	[1] = "Data poison error on DRAM",
	[2] = "SDP parity error",
	[3] = "Advanced peripheral bus error",
	[4] = "Command/address parity error",
	[5] = "Write data CRC error",
};
273
/* Single-entry SMCA tables for the "pb", "psp" and "smu" banks. */
static const char * const smca_pb_mce_desc[] = {
	[0] = "Parameter Block RAM ECC error",
};

static const char * const smca_psp_mce_desc[] = {
	[0] = "PSP RAM ECC or parity error",
};

static const char * const smca_smu_mce_desc[] = {
	[0] = "SMU RAM ECC or parity error",
};
285
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200286static bool f12h_mc0_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200287{
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200288 bool ret = false;
289
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200290 if (MEM_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200291 u8 ll = LL(ec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200292 ret = true;
293
294 if (ll == LL_L2)
295 pr_cont("during L1 linefill from L2.\n");
296 else if (ll == LL_L1)
Borislav Petkov62452882010-09-22 16:08:37 +0200297 pr_cont("Data/Tag %s error.\n", R4_MSG(ec));
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200298 else
299 ret = false;
300 }
301 return ret;
302}
303
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200304static bool f10h_mc0_mce(u16 ec, u8 xec)
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200305{
Borislav Petkov62452882010-09-22 16:08:37 +0200306 if (R4(ec) == R4_GEN && LL(ec) == LL_L1) {
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200307 pr_cont("during data scrub.\n");
308 return true;
309 }
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200310 return f12h_mc0_mce(ec, xec);
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200311}
312
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200313static bool k8_mc0_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200314{
315 if (BUS_ERROR(ec)) {
316 pr_cont("during system linefill.\n");
317 return true;
318 }
319
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200320 return f10h_mc0_mce(ec, xec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200321}
322
Jacob Shin980eec82012-12-18 15:06:11 -0600323static bool cat_mc0_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200324{
Borislav Petkov62452882010-09-22 16:08:37 +0200325 u8 r4 = R4(ec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200326 bool ret = true;
327
328 if (MEM_ERROR(ec)) {
329
Borislav Petkov62452882010-09-22 16:08:37 +0200330 if (TT(ec) != TT_DATA || LL(ec) != LL_L1)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200331 return false;
332
333 switch (r4) {
334 case R4_DRD:
335 case R4_DWR:
336 pr_cont("Data/Tag parity error due to %s.\n",
337 (r4 == R4_DRD ? "load/hw prf" : "store"));
338 break;
339 case R4_EVICT:
340 pr_cont("Copyback parity error on a tag miss.\n");
341 break;
342 case R4_SNOOP:
343 pr_cont("Tag parity error during snoop.\n");
344 break;
345 default:
346 ret = false;
347 }
348 } else if (BUS_ERROR(ec)) {
349
Borislav Petkov62452882010-09-22 16:08:37 +0200350 if ((II(ec) != II_MEM && II(ec) != II_IO) || LL(ec) != LL_LG)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200351 return false;
352
353 pr_cont("System read data error on a ");
354
355 switch (r4) {
356 case R4_RD:
357 pr_cont("TLB reload.\n");
358 break;
359 case R4_DWR:
360 pr_cont("store.\n");
361 break;
362 case R4_DRD:
363 pr_cont("load.\n");
364 break;
365 default:
366 ret = false;
367 }
368 } else {
369 ret = false;
370 }
371
372 return ret;
373}
374
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200375static bool f15h_mc0_mce(u16 ec, u8 xec)
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200376{
377 bool ret = true;
378
379 if (MEM_ERROR(ec)) {
380
381 switch (xec) {
382 case 0x0:
383 pr_cont("Data Array access error.\n");
384 break;
385
386 case 0x1:
387 pr_cont("UC error during a linefill from L2/NB.\n");
388 break;
389
390 case 0x2:
391 case 0x11:
392 pr_cont("STQ access error.\n");
393 break;
394
395 case 0x3:
396 pr_cont("SCB access error.\n");
397 break;
398
399 case 0x10:
400 pr_cont("Tag error.\n");
401 break;
402
403 case 0x12:
404 pr_cont("LDQ access error.\n");
405 break;
406
407 default:
408 ret = false;
409 }
410 } else if (BUS_ERROR(ec)) {
411
412 if (!xec)
Borislav Petkov344f0a02011-11-15 17:10:58 +0100413 pr_cont("System Read Data Error.\n");
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200414 else
Borislav Petkov344f0a02011-11-15 17:10:58 +0100415 pr_cont(" Internal error condition type %d.\n", xec);
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200416 } else if (INT_ERROR(ec)) {
417 if (xec <= 0x1f)
418 pr_cont("Hardware Assert.\n");
419 else
420 ret = false;
421
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200422 } else
423 ret = false;
424
425 return ret;
426}
427
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200428static void decode_mc0_mce(struct mce *m)
Borislav Petkov51966242009-07-28 13:50:43 +0200429{
Borislav Petkov62452882010-09-22 16:08:37 +0200430 u16 ec = EC(m->status);
431 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov51966242009-07-28 13:50:43 +0200432
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200433 pr_emerg(HW_ERR "MC0 Error: ");
Borislav Petkov51966242009-07-28 13:50:43 +0200434
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200435 /* TLB error signatures are the same across families */
436 if (TLB_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200437 if (TT(ec) == TT_DATA) {
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200438 pr_cont("%s TLB %s.\n", LL_MSG(ec),
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200439 ((xec == 2) ? "locked miss"
440 : (xec ? "multimatch" : "parity")));
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200441 return;
442 }
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200443 } else if (fam_ops->mc0_mce(ec, xec))
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200444 ;
445 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200446 pr_emerg(HW_ERR "Corrupted MC0 MCE info?\n");
Borislav Petkov51966242009-07-28 13:50:43 +0200447}
448
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200449static bool k8_mc1_mce(u16 ec, u8 xec)
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200450{
Borislav Petkov62452882010-09-22 16:08:37 +0200451 u8 ll = LL(ec);
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200452 bool ret = true;
453
454 if (!MEM_ERROR(ec))
455 return false;
456
457 if (ll == 0x2)
458 pr_cont("during a linefill from L2.\n");
459 else if (ll == 0x1) {
Borislav Petkov62452882010-09-22 16:08:37 +0200460 switch (R4(ec)) {
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200461 case R4_IRD:
462 pr_cont("Parity error during data load.\n");
463 break;
464
465 case R4_EVICT:
466 pr_cont("Copyback Parity/Victim error.\n");
467 break;
468
469 case R4_SNOOP:
470 pr_cont("Tag Snoop error.\n");
471 break;
472
473 default:
474 ret = false;
475 break;
476 }
477 } else
478 ret = false;
479
480 return ret;
481}
482
Jacob Shin980eec82012-12-18 15:06:11 -0600483static bool cat_mc1_mce(u16 ec, u8 xec)
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200484{
Borislav Petkov62452882010-09-22 16:08:37 +0200485 u8 r4 = R4(ec);
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200486 bool ret = true;
487
Jacob Shin980eec82012-12-18 15:06:11 -0600488 if (!MEM_ERROR(ec))
489 return false;
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200490
Jacob Shin980eec82012-12-18 15:06:11 -0600491 if (TT(ec) != TT_INSTR)
492 return false;
493
494 if (r4 == R4_IRD)
495 pr_cont("Data/tag array parity error for a tag hit.\n");
496 else if (r4 == R4_SNOOP)
497 pr_cont("Tag error during snoop/victimization.\n");
498 else if (xec == 0x0)
499 pr_cont("Tag parity error from victim castout.\n");
500 else if (xec == 0x2)
501 pr_cont("Microcode patch RAM parity error.\n");
502 else
503 ret = false;
504
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200505 return ret;
506}
507
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200508static bool f15h_mc1_mce(u16 ec, u8 xec)
Borislav Petkov86039cd2010-11-08 15:03:35 +0100509{
510 bool ret = true;
511
512 if (!MEM_ERROR(ec))
513 return false;
514
515 switch (xec) {
516 case 0x0 ... 0xa:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200517 pr_cont("%s.\n", f15h_mc1_mce_desc[xec]);
Borislav Petkov86039cd2010-11-08 15:03:35 +0100518 break;
519
520 case 0xd:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200521 pr_cont("%s.\n", f15h_mc1_mce_desc[xec-2]);
Borislav Petkov86039cd2010-11-08 15:03:35 +0100522 break;
523
Borislav Petkov6c1173a2011-11-21 19:45:34 +0100524 case 0x10:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200525 pr_cont("%s.\n", f15h_mc1_mce_desc[xec-4]);
Borislav Petkov6c1173a2011-11-21 19:45:34 +0100526 break;
527
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200528 case 0x11 ... 0x15:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200529 pr_cont("Decoder %s parity error.\n", f15h_mc1_mce_desc[xec-4]);
Borislav Petkov86039cd2010-11-08 15:03:35 +0100530 break;
531
532 default:
533 ret = false;
534 }
535 return ret;
536}
537
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200538static void decode_mc1_mce(struct mce *m)
Borislav Petkovab5535e2009-07-28 14:06:26 +0200539{
Borislav Petkov62452882010-09-22 16:08:37 +0200540 u16 ec = EC(m->status);
541 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovab5535e2009-07-28 14:06:26 +0200542
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200543 pr_emerg(HW_ERR "MC1 Error: ");
Borislav Petkovab5535e2009-07-28 14:06:26 +0200544
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200545 if (TLB_ERROR(ec))
546 pr_cont("%s TLB %s.\n", LL_MSG(ec),
547 (xec ? "multimatch" : "parity error"));
548 else if (BUS_ERROR(ec)) {
Borislav Petkov525906b2010-10-15 15:27:02 +0200549 bool k8 = (boot_cpu_data.x86 == 0xf && (m->status & BIT_64(58)));
Borislav Petkovab5535e2009-07-28 14:06:26 +0200550
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200551 pr_cont("during %s.\n", (k8 ? "system linefill" : "NB data read"));
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200552 } else if (INT_ERROR(ec)) {
553 if (xec <= 0x3f)
554 pr_cont("Hardware Assert.\n");
555 else
556 goto wrong_mc1_mce;
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200557 } else if (fam_ops->mc1_mce(ec, xec))
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200558 ;
559 else
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200560 goto wrong_mc1_mce;
561
562 return;
563
564wrong_mc1_mce:
565 pr_emerg(HW_ERR "Corrupted MC1 MCE info?\n");
Borislav Petkovab5535e2009-07-28 14:06:26 +0200566}
567
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600568static bool k8_mc2_mce(u16 ec, u8 xec)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200569{
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600570 bool ret = true;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200571
572 if (xec == 0x1)
573 pr_cont(" in the write data buffers.\n");
574 else if (xec == 0x3)
575 pr_cont(" in the victim data buffers.\n");
576 else if (xec == 0x2 && MEM_ERROR(ec))
Borislav Petkov62452882010-09-22 16:08:37 +0200577 pr_cont(": %s error in the L2 cache tags.\n", R4_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200578 else if (xec == 0x0) {
579 if (TLB_ERROR(ec))
Borislav Petkov50872cc2014-11-22 13:41:01 +0100580 pr_cont("%s error in a Page Descriptor Cache or Guest TLB.\n",
581 TT_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200582 else if (BUS_ERROR(ec))
583 pr_cont(": %s/ECC error in data read from NB: %s.\n",
Borislav Petkov62452882010-09-22 16:08:37 +0200584 R4_MSG(ec), PP_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200585 else if (MEM_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200586 u8 r4 = R4(ec);
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200587
Borislav Petkov62452882010-09-22 16:08:37 +0200588 if (r4 >= 0x7)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200589 pr_cont(": %s error during data copyback.\n",
Borislav Petkov62452882010-09-22 16:08:37 +0200590 R4_MSG(ec));
591 else if (r4 <= 0x1)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200592 pr_cont(": %s parity/ECC error during data "
Borislav Petkov62452882010-09-22 16:08:37 +0200593 "access from L2.\n", R4_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200594 else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600595 ret = false;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200596 } else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600597 ret = false;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200598 } else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600599 ret = false;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200600
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600601 return ret;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200602}
603
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600604static bool f15h_mc2_mce(u16 ec, u8 xec)
Borislav Petkov70fdb492010-09-21 20:45:10 +0200605{
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600606 bool ret = true;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200607
608 if (TLB_ERROR(ec)) {
609 if (xec == 0x0)
610 pr_cont("Data parity TLB read error.\n");
611 else if (xec == 0x1)
612 pr_cont("Poison data provided for TLB fill.\n");
613 else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600614 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200615 } else if (BUS_ERROR(ec)) {
616 if (xec > 2)
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600617 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200618
619 pr_cont("Error during attempted NB data read.\n");
620 } else if (MEM_ERROR(ec)) {
621 switch (xec) {
622 case 0x4 ... 0xc:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200623 pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x4]);
Borislav Petkov70fdb492010-09-21 20:45:10 +0200624 break;
625
626 case 0x10 ... 0x14:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200627 pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x7]);
Borislav Petkov70fdb492010-09-21 20:45:10 +0200628 break;
629
630 default:
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600631 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200632 }
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200633 } else if (INT_ERROR(ec)) {
634 if (xec <= 0x3f)
635 pr_cont("Hardware Assert.\n");
636 else
637 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200638 }
639
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600640 return ret;
641}
Borislav Petkov70fdb492010-09-21 20:45:10 +0200642
Jacob Shin980eec82012-12-18 15:06:11 -0600643static bool f16h_mc2_mce(u16 ec, u8 xec)
644{
645 u8 r4 = R4(ec);
646
647 if (!MEM_ERROR(ec))
648 return false;
649
650 switch (xec) {
651 case 0x04 ... 0x05:
652 pr_cont("%cBUFF parity error.\n", (r4 == R4_RD) ? 'I' : 'O');
653 break;
654
655 case 0x09 ... 0x0b:
656 case 0x0d ... 0x0f:
657 pr_cont("ECC error in L2 tag (%s).\n",
658 ((r4 == R4_GEN) ? "BankReq" :
659 ((r4 == R4_SNOOP) ? "Prb" : "Fill")));
660 break;
661
662 case 0x10 ... 0x19:
663 case 0x1b:
664 pr_cont("ECC error in L2 data array (%s).\n",
665 (((r4 == R4_RD) && !(xec & 0x3)) ? "Hit" :
666 ((r4 == R4_GEN) ? "Attr" :
667 ((r4 == R4_EVICT) ? "Vict" : "Fill"))));
668 break;
669
670 case 0x1c ... 0x1d:
671 case 0x1f:
672 pr_cont("Parity error in L2 attribute bits (%s).\n",
673 ((r4 == R4_RD) ? "Hit" :
674 ((r4 == R4_GEN) ? "Attr" : "Fill")));
675 break;
676
677 default:
678 return false;
679 }
680
681 return true;
682}
683
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600684static void decode_mc2_mce(struct mce *m)
685{
686 u16 ec = EC(m->status);
687 u8 xec = XEC(m->status, xec_mask);
688
689 pr_emerg(HW_ERR "MC2 Error: ");
690
691 if (!fam_ops->mc2_mce(ec, xec))
692 pr_cont(HW_ERR "Corrupted MC2 MCE info?\n");
Borislav Petkov70fdb492010-09-21 20:45:10 +0200693}
694
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200695static void decode_mc3_mce(struct mce *m)
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200696{
Borislav Petkov62452882010-09-22 16:08:37 +0200697 u16 ec = EC(m->status);
698 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovded50622010-08-27 17:03:34 +0200699
Borislav Petkovb18434c2010-09-22 11:53:32 +0200700 if (boot_cpu_data.x86 >= 0x14) {
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200701 pr_emerg("You shouldn't be seeing MC3 MCE on this cpu family,"
Borislav Petkovded50622010-08-27 17:03:34 +0200702 " please report on LKML.\n");
703 return;
704 }
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200705
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200706 pr_emerg(HW_ERR "MC3 Error");
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200707
708 if (xec == 0x0) {
Borislav Petkov62452882010-09-22 16:08:37 +0200709 u8 r4 = R4(ec);
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200710
Borislav Petkovded50622010-08-27 17:03:34 +0200711 if (!BUS_ERROR(ec) || (r4 != R4_DRD && r4 != R4_DWR))
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200712 goto wrong_mc3_mce;
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200713
Borislav Petkov62452882010-09-22 16:08:37 +0200714 pr_cont(" during %s.\n", R4_MSG(ec));
Borislav Petkovded50622010-08-27 17:03:34 +0200715 } else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200716 goto wrong_mc3_mce;
Borislav Petkovded50622010-08-27 17:03:34 +0200717
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200718 return;
719
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200720 wrong_mc3_mce:
721 pr_emerg(HW_ERR "Corrupted MC3 MCE info?\n");
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200722}
723
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200724static void decode_mc4_mce(struct mce *m)
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200725{
Borislav Petkov68782672011-11-24 21:29:57 +0100726 struct cpuinfo_x86 *c = &boot_cpu_data;
727 int node_id = amd_get_nb_id(m->extcpu);
728 u16 ec = EC(m->status);
729 u8 xec = XEC(m->status, 0x1f);
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200730 u8 offset = 0;
731
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200732 pr_emerg(HW_ERR "MC4 Error (node %d): ", node_id);
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200733
Borislav Petkov68782672011-11-24 21:29:57 +0100734 switch (xec) {
735 case 0x0 ... 0xe:
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200736
Borislav Petkov68782672011-11-24 21:29:57 +0100737 /* special handling for DRAM ECCs */
738 if (xec == 0x0 || xec == 0x8) {
739 /* no ECCs on F11h */
740 if (c->x86 == 0x11)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200741 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100742
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200743 pr_cont("%s.\n", mc4_mce_desc[xec]);
Borislav Petkov68782672011-11-24 21:29:57 +0100744
745 if (nb_bus_decoder)
746 nb_bus_decoder(node_id, m);
747 return;
748 }
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200749 break;
750
751 case 0xf:
752 if (TLB_ERROR(ec))
753 pr_cont("GART Table Walk data error.\n");
754 else if (BUS_ERROR(ec))
755 pr_cont("DMA Exclusion Vector Table Walk error.\n");
756 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200757 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100758 return;
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200759
Borislav Petkov05cd6672010-09-22 15:06:24 +0200760 case 0x19:
Jacob Shin980eec82012-12-18 15:06:11 -0600761 if (boot_cpu_data.x86 == 0x15 || boot_cpu_data.x86 == 0x16)
Borislav Petkov05cd6672010-09-22 15:06:24 +0200762 pr_cont("Compute Unit Data Error.\n");
763 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200764 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100765 return;
Borislav Petkov05cd6672010-09-22 15:06:24 +0200766
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200767 case 0x1c ... 0x1f:
Borislav Petkov68782672011-11-24 21:29:57 +0100768 offset = 13;
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200769 break;
770
771 default:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200772 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100773 }
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200774
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200775 pr_cont("%s.\n", mc4_mce_desc[xec - offset]);
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200776 return;
777
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200778 wrong_mc4_mce:
779 pr_emerg(HW_ERR "Corrupted MC4 MCE info?\n");
Borislav Petkovd93cc222009-07-28 10:56:15 +0200780}
Borislav Petkovd93cc222009-07-28 10:56:15 +0200781
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200782static void decode_mc5_mce(struct mce *m)
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200783{
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200784 struct cpuinfo_x86 *c = &boot_cpu_data;
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200785 u16 ec = EC(m->status);
Borislav Petkov62452882010-09-22 16:08:37 +0200786 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200787
788 if (c->x86 == 0xf || c->x86 == 0x11)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200789 goto wrong_mc5_mce;
Borislav Petkovfe4ea262010-08-31 18:38:24 +0200790
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200791 pr_emerg(HW_ERR "MC5 Error: ");
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200792
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200793 if (INT_ERROR(ec)) {
794 if (xec <= 0x1f) {
795 pr_cont("Hardware Assert.\n");
796 return;
797 } else
798 goto wrong_mc5_mce;
799 }
800
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200801 if (xec == 0x0 || xec == 0xc)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200802 pr_cont("%s.\n", mc5_mce_desc[xec]);
Aravind Gopalakrishnanaad19e52013-06-05 15:50:03 -0500803 else if (xec <= 0xd)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200804 pr_cont("%s parity error.\n", mc5_mce_desc[xec]);
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200805 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200806 goto wrong_mc5_mce;
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200807
808 return;
Borislav Petkovfe4ea262010-08-31 18:38:24 +0200809
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200810 wrong_mc5_mce:
811 pr_emerg(HW_ERR "Corrupted MC5 MCE info?\n");
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200812}
813
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200814static void decode_mc6_mce(struct mce *m)
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200815{
Borislav Petkov62452882010-09-22 16:08:37 +0200816 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200817
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200818 pr_emerg(HW_ERR "MC6 Error: ");
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200819
Aravind Gopalakrishnanbc4febe2014-11-04 11:41:08 -0600820 if (xec > 0x5)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200821 goto wrong_mc6_mce;
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200822
Aravind Gopalakrishnanbc4febe2014-11-04 11:41:08 -0600823 pr_cont("%s parity error.\n", mc6_mce_desc[xec]);
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200824 return;
825
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200826 wrong_mc6_mce:
827 pr_emerg(HW_ERR "Corrupted MC6 MCE info?\n");
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200828}
829
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100830static void decode_f17h_core_errors(const char *ip_name, u8 xec,
831 unsigned int mca_type)
832{
833 const char * const *error_desc_array;
834 size_t len;
835
836 pr_emerg(HW_ERR "%s Error: ", ip_name);
837
838 switch (mca_type) {
839 case SMCA_LS:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200840 error_desc_array = smca_ls_mce_desc;
841 len = ARRAY_SIZE(smca_ls_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100842
843 if (xec == 0x4) {
844 pr_cont("Unrecognized LS MCA error code.\n");
845 return;
846 }
847 break;
848
849 case SMCA_IF:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200850 error_desc_array = smca_if_mce_desc;
851 len = ARRAY_SIZE(smca_if_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100852 break;
853
854 case SMCA_L2_CACHE:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200855 error_desc_array = smca_l2_mce_desc;
856 len = ARRAY_SIZE(smca_l2_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100857 break;
858
859 case SMCA_DE:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200860 error_desc_array = smca_de_mce_desc;
861 len = ARRAY_SIZE(smca_de_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100862 break;
863
864 case SMCA_EX:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200865 error_desc_array = smca_ex_mce_desc;
866 len = ARRAY_SIZE(smca_ex_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100867 break;
868
869 case SMCA_FP:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200870 error_desc_array = smca_fp_mce_desc;
871 len = ARRAY_SIZE(smca_fp_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100872 break;
873
874 case SMCA_L3_CACHE:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200875 error_desc_array = smca_l3_mce_desc;
876 len = ARRAY_SIZE(smca_l3_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100877 break;
878
879 default:
880 pr_cont("Corrupted MCA core error info.\n");
881 return;
882 }
883
884 if (xec > len) {
885 pr_cont("Unrecognized %s MCA bank error code.\n",
886 amd_core_mcablock_names[mca_type]);
887 return;
888 }
889
890 pr_cont("%s.\n", error_desc_array[xec]);
891}
892
893static void decode_df_errors(u8 xec, unsigned int mca_type)
894{
895 const char * const *error_desc_array;
896 size_t len;
897
898 pr_emerg(HW_ERR "Data Fabric Error: ");
899
900 switch (mca_type) {
901 case SMCA_CS:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200902 error_desc_array = smca_cs_mce_desc;
903 len = ARRAY_SIZE(smca_cs_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100904 break;
905
906 case SMCA_PIE:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200907 error_desc_array = smca_pie_mce_desc;
908 len = ARRAY_SIZE(smca_pie_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100909 break;
910
911 default:
912 pr_cont("Corrupted MCA Data Fabric info.\n");
913 return;
914 }
915
916 if (xec > len) {
917 pr_cont("Unrecognized %s MCA bank error code.\n",
918 amd_df_mcablock_names[mca_type]);
919 return;
920 }
921
922 pr_cont("%s.\n", error_desc_array[xec]);
923}
924
925/* Decode errors according to Scalable MCA specification */
926static void decode_smca_errors(struct mce *m)
927{
928 u32 addr = MSR_AMD64_SMCA_MCx_IPID(m->bank);
929 unsigned int hwid, mca_type, i;
930 u8 xec = XEC(m->status, xec_mask);
931 const char * const *error_desc_array;
932 const char *ip_name;
933 u32 low, high;
934 size_t len;
935
936 if (rdmsr_safe(addr, &low, &high)) {
Yazen Ghannamb300e872016-09-12 09:59:29 +0200937 pr_emerg(HW_ERR "Invalid IP block specified.\n");
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100938 return;
939 }
940
941 hwid = high & MCI_IPID_HWID;
942 mca_type = (high & MCI_IPID_MCATYPE) >> 16;
943
944 pr_emerg(HW_ERR "MC%d IPID value: 0x%08x%08x\n", m->bank, high, low);
945
946 /*
947 * Based on hwid and mca_type values, decode errors from respective IPs.
948 * Note: mca_type values make sense only in the context of an hwid.
949 */
950 for (i = 0; i < ARRAY_SIZE(amd_hwids); i++)
951 if (amd_hwids[i].hwid == hwid)
952 break;
953
954 switch (i) {
955 case SMCA_F17H_CORE:
956 ip_name = (mca_type == SMCA_L3_CACHE) ?
957 "L3 Cache" : "F17h Core";
958 return decode_f17h_core_errors(ip_name, xec, mca_type);
959 break;
960
961 case SMCA_DF:
962 return decode_df_errors(xec, mca_type);
963 break;
964
965 case SMCA_UMC:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200966 error_desc_array = smca_umc_mce_desc;
967 len = ARRAY_SIZE(smca_umc_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100968 break;
969
970 case SMCA_PB:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200971 error_desc_array = smca_pb_mce_desc;
972 len = ARRAY_SIZE(smca_pb_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100973 break;
974
975 case SMCA_PSP:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200976 error_desc_array = smca_psp_mce_desc;
977 len = ARRAY_SIZE(smca_psp_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100978 break;
979
980 case SMCA_SMU:
Yazen Ghannam856095b2016-09-12 09:59:33 +0200981 error_desc_array = smca_smu_mce_desc;
982 len = ARRAY_SIZE(smca_smu_mce_desc) - 1;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100983 break;
984
985 default:
986 pr_emerg(HW_ERR "HWID:%d does not match any existing IPs.\n", hwid);
987 return;
988 }
989
990 ip_name = amd_hwids[i].name;
991 pr_emerg(HW_ERR "%s Error: ", ip_name);
992
993 if (xec > len) {
994 pr_cont("Unrecognized %s MCA bank error code.\n", ip_name);
995 return;
996 }
997
998 pr_cont("%s.\n", error_desc_array[xec]);
999}
1000
Borislav Petkov63375832010-09-06 18:13:39 +02001001static inline void amd_decode_err_code(u16 ec)
Borislav Petkovd93cc222009-07-28 10:56:15 +02001002{
Jacob Shin980eec82012-12-18 15:06:11 -06001003 if (INT_ERROR(ec)) {
1004 pr_emerg(HW_ERR "internal: %s\n", UU_MSG(ec));
1005 return;
1006 }
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +02001007
1008 pr_emerg(HW_ERR "cache level: %s", LL_MSG(ec));
1009
1010 if (BUS_ERROR(ec))
1011 pr_cont(", mem/io: %s", II_MSG(ec));
1012 else
1013 pr_cont(", tx: %s", TT_MSG(ec));
1014
1015 if (MEM_ERROR(ec) || BUS_ERROR(ec)) {
1016 pr_cont(", mem-tx: %s", R4_MSG(ec));
1017
1018 if (BUS_ERROR(ec))
1019 pr_cont(", part-proc: %s (%s)", PP_MSG(ec), TO_MSG(ec));
1020 }
1021
1022 pr_cont("\n");
Borislav Petkov549d0422009-07-24 13:51:42 +02001023}
Borislav Petkov549d0422009-07-24 13:51:42 +02001024
Borislav Petkov5ce88f62010-08-31 18:28:08 +02001025/*
1026 * Filter out unwanted MCE signatures here.
1027 */
1028static bool amd_filter_mce(struct mce *m)
1029{
1030 u8 xec = (m->status >> 16) & 0x1f;
1031
1032 /*
1033 * NB GART TLB error reporting is disabled by default.
1034 */
1035 if (m->bank == 4 && xec == 0x5 && !report_gart_errors)
1036 return true;
1037
1038 return false;
1039}
1040
Borislav Petkovd5c67702012-09-14 20:25:37 +02001041static const char *decode_error_status(struct mce *m)
1042{
1043 if (m->status & MCI_STATUS_UC) {
1044 if (m->status & MCI_STATUS_PCC)
1045 return "System Fatal error.";
1046 if (m->mcgstatus & MCG_STATUS_RIPV)
1047 return "Uncorrected, software restartable error.";
1048 return "Uncorrected, software containable error.";
1049 }
1050
1051 if (m->status & MCI_STATUS_DEFERRED)
1052 return "Deferred error.";
1053
1054 return "Corrected error, no action required.";
1055}
1056
Borislav Petkov9cdeb402010-09-02 18:33:24 +02001057int amd_decode_mce(struct notifier_block *nb, unsigned long val, void *data)
Borislav Petkov549d0422009-07-24 13:51:42 +02001058{
Borislav Petkovfb253192009-10-07 13:20:38 +02001059 struct mce *m = (struct mce *)data;
Borislav Petkovf89f8382012-09-13 15:14:22 +02001060 struct cpuinfo_x86 *c = &cpu_data(m->extcpu);
Borislav Petkovb0b07a22011-08-24 18:44:22 +02001061 int ecc;
Borislav Petkov549d0422009-07-24 13:51:42 +02001062
Borislav Petkov5ce88f62010-08-31 18:28:08 +02001063 if (amd_filter_mce(m))
1064 return NOTIFY_STOP;
1065
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001066 pr_emerg(HW_ERR "%s\n", decode_error_status(m));
1067
1068 pr_emerg(HW_ERR "CPU:%d (%x:%x:%x) MC%d_STATUS[%s|%s|%s|%s|%s",
1069 m->extcpu,
1070 c->x86, c->x86_model, c->x86_mask,
1071 m->bank,
1072 ((m->status & MCI_STATUS_OVER) ? "Over" : "-"),
Aravind Gopalakrishnan99e1dfb2015-07-13 06:53:02 -05001073 ((m->status & MCI_STATUS_UC) ? "UE" :
1074 (m->status & MCI_STATUS_DEFERRED) ? "-" : "CE"),
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001075 ((m->status & MCI_STATUS_MISCV) ? "MiscV" : "-"),
1076 ((m->status & MCI_STATUS_PCC) ? "PCC" : "-"),
1077 ((m->status & MCI_STATUS_ADDRV) ? "AddrV" : "-"));
1078
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001079 if (c->x86 >= 0x15)
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001080 pr_cont("|%s|%s",
1081 ((m->status & MCI_STATUS_DEFERRED) ? "Deferred" : "-"),
1082 ((m->status & MCI_STATUS_POISON) ? "Poison" : "-"));
1083
Yazen Ghannama348ed82016-05-11 14:58:28 +02001084 if (boot_cpu_has(X86_FEATURE_SMCA)) {
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001085 u32 low, high;
1086 u32 addr = MSR_AMD64_SMCA_MCx_CONFIG(m->bank);
1087
Yazen Ghannamb300e872016-09-12 09:59:29 +02001088 pr_cont("|%s", ((m->status & MCI_STATUS_SYNDV) ? "SyndV" : "-"));
1089
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001090 if (!rdmsr_safe(addr, &low, &high) &&
1091 (low & MCI_CONFIG_MCAX))
1092 pr_cont("|%s", ((m->status & MCI_STATUS_TCC) ? "TCC" : "-"));
1093 }
1094
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001095 /* do the two bits[14:13] together */
1096 ecc = (m->status >> 45) & 0x3;
1097 if (ecc)
1098 pr_cont("|%sECC", ((ecc == 2) ? "C" : "U"));
1099
1100 pr_cont("]: 0x%016llx\n", m->status);
1101
1102 if (m->status & MCI_STATUS_ADDRV)
Yazen Ghannamb300e872016-09-12 09:59:29 +02001103 pr_emerg(HW_ERR "Error Addr: 0x%016llx", m->addr);
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001104
Yazen Ghannama348ed82016-05-11 14:58:28 +02001105 if (boot_cpu_has(X86_FEATURE_SMCA)) {
Yazen Ghannamb300e872016-09-12 09:59:29 +02001106 if (m->status & MCI_STATUS_SYNDV)
1107 pr_cont(", Syndrome: 0x%016llx", m->synd);
1108
1109 pr_cont("\n");
1110
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001111 decode_smca_errors(m);
1112 goto err_code;
Yazen Ghannamb300e872016-09-12 09:59:29 +02001113 } else
1114 pr_cont("\n");
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001115
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001116 if (!fam_ops)
1117 goto err_code;
1118
Borislav Petkov51966242009-07-28 13:50:43 +02001119 switch (m->bank) {
1120 case 0:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001121 decode_mc0_mce(m);
Borislav Petkov51966242009-07-28 13:50:43 +02001122 break;
Borislav Petkovd93cc222009-07-28 10:56:15 +02001123
Borislav Petkovab5535e2009-07-28 14:06:26 +02001124 case 1:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001125 decode_mc1_mce(m);
Borislav Petkovab5535e2009-07-28 14:06:26 +02001126 break;
1127
Borislav Petkov56cad2d2009-07-28 14:14:24 +02001128 case 2:
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001129 decode_mc2_mce(m);
Borislav Petkov56cad2d2009-07-28 14:14:24 +02001130 break;
1131
Borislav Petkovf9350ef2009-07-28 14:17:30 +02001132 case 3:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001133 decode_mc3_mce(m);
Borislav Petkovf9350ef2009-07-28 14:17:30 +02001134 break;
1135
Borislav Petkov51966242009-07-28 13:50:43 +02001136 case 4:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001137 decode_mc4_mce(m);
Borislav Petkov51966242009-07-28 13:50:43 +02001138 break;
1139
Borislav Petkov53bd5fe2009-07-28 14:20:46 +02001140 case 5:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001141 decode_mc5_mce(m);
Borislav Petkov53bd5fe2009-07-28 14:20:46 +02001142 break;
1143
Borislav Petkovb8f85c42010-09-22 15:37:58 +02001144 case 6:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001145 decode_mc6_mce(m);
Borislav Petkovb8f85c42010-09-22 15:37:58 +02001146 break;
1147
Borislav Petkov51966242009-07-28 13:50:43 +02001148 default:
1149 break;
Borislav Petkovb69b29d2009-07-27 16:21:14 +02001150 }
Borislav Petkov51966242009-07-28 13:50:43 +02001151
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001152 err_code:
Borislav Petkov51966242009-07-28 13:50:43 +02001153 amd_decode_err_code(m->status & 0xffff);
Borislav Petkovfb253192009-10-07 13:20:38 +02001154
1155 return NOTIFY_STOP;
Borislav Petkov549d0422009-07-24 13:51:42 +02001156}
Borislav Petkov9cdeb402010-09-02 18:33:24 +02001157EXPORT_SYMBOL_GPL(amd_decode_mce);
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001158
Borislav Petkovfb253192009-10-07 13:20:38 +02001159static struct notifier_block amd_mce_dec_nb = {
1160 .notifier_call = amd_decode_mce,
1161};
1162
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001163static int __init mce_amd_init(void)
1164{
Borislav Petkovbad11e02010-09-22 17:44:51 +02001165 struct cpuinfo_x86 *c = &boot_cpu_data;
1166
1167 if (c->x86_vendor != X86_VENDOR_AMD)
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001168 return -ENODEV;
Borislav Petkove045c292010-08-06 18:55:45 +02001169
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001170 fam_ops = kzalloc(sizeof(struct amd_decoder_ops), GFP_KERNEL);
1171 if (!fam_ops)
1172 return -ENOMEM;
1173
Borislav Petkovbad11e02010-09-22 17:44:51 +02001174 switch (c->x86) {
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001175 case 0xf:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001176 fam_ops->mc0_mce = k8_mc0_mce;
1177 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001178 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001179 break;
1180
1181 case 0x10:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001182 fam_ops->mc0_mce = f10h_mc0_mce;
1183 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001184 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001185 break;
1186
Borislav Petkovf0157b32010-10-05 19:07:16 +02001187 case 0x11:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001188 fam_ops->mc0_mce = k8_mc0_mce;
1189 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001190 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkovf0157b32010-10-05 19:07:16 +02001191 break;
1192
Borislav Petkov9be0bb12010-09-16 15:08:14 +02001193 case 0x12:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001194 fam_ops->mc0_mce = f12h_mc0_mce;
1195 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001196 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov9be0bb12010-09-16 15:08:14 +02001197 break;
1198
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001199 case 0x14:
Jacob Shin980eec82012-12-18 15:06:11 -06001200 fam_ops->mc0_mce = cat_mc0_mce;
1201 fam_ops->mc1_mce = cat_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001202 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001203 break;
1204
Borislav Petkov2be64bf2010-09-17 19:11:47 +02001205 case 0x15:
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +02001206 xec_mask = c->x86_model == 0x60 ? 0x3f : 0x1f;
1207
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001208 fam_ops->mc0_mce = f15h_mc0_mce;
1209 fam_ops->mc1_mce = f15h_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001210 fam_ops->mc2_mce = f15h_mc2_mce;
Borislav Petkov2be64bf2010-09-17 19:11:47 +02001211 break;
1212
Jacob Shin980eec82012-12-18 15:06:11 -06001213 case 0x16:
1214 xec_mask = 0x1f;
1215 fam_ops->mc0_mce = cat_mc0_mce;
1216 fam_ops->mc1_mce = cat_mc1_mce;
1217 fam_ops->mc2_mce = f16h_mc2_mce;
1218 break;
1219
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001220 case 0x17:
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001221 xec_mask = 0x3f;
Yazen Ghannama348ed82016-05-11 14:58:28 +02001222 if (!boot_cpu_has(X86_FEATURE_SMCA)) {
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001223 printk(KERN_WARNING "Decoding supported only on Scalable MCA processors.\n");
1224 goto err_out;
1225 }
1226 break;
1227
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001228 default:
Borislav Petkovec3e82d2012-04-04 14:21:02 +02001229 printk(KERN_WARNING "Huh? What family is it: 0x%x?!\n", c->x86);
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001230 goto err_out;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001231 }
1232
Borislav Petkov9530d602010-09-06 15:05:45 +02001233 pr_info("MCE: In-kernel MCE decoding enabled.\n");
1234
Borislav Petkov3653ada2011-12-04 15:12:09 +01001235 mce_register_decode_chain(&amd_mce_dec_nb);
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001236
1237 return 0;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001238
1239err_out:
1240 kfree(fam_ops);
1241 fam_ops = NULL;
1242 return -EINVAL;
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001243}
1244early_initcall(mce_amd_init);
Borislav Petkov0d18b2e2009-10-02 15:31:48 +02001245
#ifdef MODULE
/*
 * Module teardown: take the decoder off the MCE decode chain first, then
 * release the per-family ops it was using.
 */
static void __exit mce_amd_exit(void)
{
	mce_unregister_decode_chain(&amd_mce_dec_nb);
	kfree(fam_ops);
}
module_exit(mce_amd_exit);

MODULE_LICENSE("GPL");
MODULE_DESCRIPTION("AMD MCE decoder");
MODULE_ALIAS("edac-mce-amd");
#endif