blob: 49768c08ac0734345007a1faaae7eef70cd34f60 [file] [log] [blame]
Borislav Petkovb70ef012009-06-25 19:32:38 +02001#include <linux/module.h>
Borislav Petkov888ab8e2010-08-18 15:11:35 +02002#include <linux/slab.h>
3
Borislav Petkov47ca08a2010-09-27 15:30:39 +02004#include "mce_amd.h"
Doug Thompsonb52401ce2009-05-06 17:57:20 +02005
Borislav Petkov888ab8e2010-08-18 15:11:35 +02006static struct amd_decoder_ops *fam_ops;
7
Borislav Petkov2be64bf2010-09-17 19:11:47 +02008static u8 xec_mask = 0xf;
Borislav Petkov5ce88f62010-08-31 18:28:08 +02009
Borislav Petkov549d0422009-07-24 13:51:42 +020010static bool report_gart_errors;
Borislav Petkovb0b07a22011-08-24 18:44:22 +020011static void (*nb_bus_decoder)(int node_id, struct mce *m);
Borislav Petkov549d0422009-07-24 13:51:42 +020012
13void amd_report_gart_errors(bool v)
14{
15 report_gart_errors = v;
16}
17EXPORT_SYMBOL_GPL(amd_report_gart_errors);
18
Borislav Petkovb0b07a22011-08-24 18:44:22 +020019void amd_register_ecc_decoder(void (*f)(int, struct mce *))
Borislav Petkov549d0422009-07-24 13:51:42 +020020{
21 nb_bus_decoder = f;
22}
23EXPORT_SYMBOL_GPL(amd_register_ecc_decoder);
24
Borislav Petkovb0b07a22011-08-24 18:44:22 +020025void amd_unregister_ecc_decoder(void (*f)(int, struct mce *))
Borislav Petkov549d0422009-07-24 13:51:42 +020026{
27 if (nb_bus_decoder) {
28 WARN_ON(nb_bus_decoder != f);
29
30 nb_bus_decoder = NULL;
31 }
32}
33EXPORT_SYMBOL_GPL(amd_unregister_ecc_decoder);
34
Doug Thompsonb52401ce2009-05-06 17:57:20 +020035/*
36 * string representation for the different MCA reported error types, see F3x48
37 * or MSR0000_0411.
38 */
Borislav Petkov63375832010-09-06 18:13:39 +020039
40/* transaction type */
Borislav Petkov0f086692012-12-23 12:40:45 +010041static const char * const tt_msgs[] = { "INSN", "DATA", "GEN", "RESV" };
Doug Thompsonb52401ce2009-05-06 17:57:20 +020042
Borislav Petkov63375832010-09-06 18:13:39 +020043/* cache level */
Borislav Petkov0f086692012-12-23 12:40:45 +010044static const char * const ll_msgs[] = { "RESV", "L1", "L2", "L3/GEN" };
Doug Thompsonb52401ce2009-05-06 17:57:20 +020045
Borislav Petkov63375832010-09-06 18:13:39 +020046/* memory transaction type */
Borislav Petkov0f086692012-12-23 12:40:45 +010047static const char * const rrrr_msgs[] = {
Borislav Petkov63375832010-09-06 18:13:39 +020048 "GEN", "RD", "WR", "DRD", "DWR", "IRD", "PRF", "EV", "SNP"
Doug Thompsonb52401ce2009-05-06 17:57:20 +020049};
50
Borislav Petkov63375832010-09-06 18:13:39 +020051/* participating processor */
Borislav Petkovebe2aea2011-11-29 19:03:25 +010052const char * const pp_msgs[] = { "SRC", "RES", "OBS", "GEN" };
Borislav Petkovb70ef012009-06-25 19:32:38 +020053EXPORT_SYMBOL_GPL(pp_msgs);
Doug Thompsonb52401ce2009-05-06 17:57:20 +020054
Borislav Petkov63375832010-09-06 18:13:39 +020055/* request timeout */
Borislav Petkov0f086692012-12-23 12:40:45 +010056static const char * const to_msgs[] = { "no timeout", "timed out" };
Doug Thompsonb52401ce2009-05-06 17:57:20 +020057
Borislav Petkov63375832010-09-06 18:13:39 +020058/* memory or i/o */
Borislav Petkov0f086692012-12-23 12:40:45 +010059static const char * const ii_msgs[] = { "MEM", "RESV", "IO", "GEN" };
Doug Thompsonb52401ce2009-05-06 17:57:20 +020060
Jacob Shin980eec82012-12-18 15:06:11 -060061/* internal error type */
Borislav Petkov0f086692012-12-23 12:40:45 +010062static const char * const uu_msgs[] = { "RESV", "RESV", "HWA", "RESV" };
Jacob Shin980eec82012-12-18 15:06:11 -060063
Borislav Petkovf05c41a2012-09-11 18:57:43 +020064static const char * const f15h_mc1_mce_desc[] = {
Borislav Petkov86039cd2010-11-08 15:03:35 +010065 "UC during a demand linefill from L2",
66 "Parity error during data load from IC",
67 "Parity error for IC valid bit",
68 "Main tag parity error",
69 "Parity error in prediction queue",
70 "PFB data/address parity error",
71 "Parity error in the branch status reg",
72 "PFB promotion address error",
73 "Tag error during probe/victimization",
74 "Parity error for IC probe tag valid bit",
75 "PFB non-cacheable bit parity error",
76 "PFB valid bit parity error", /* xec = 0xd */
Borislav Petkov6c1173a2011-11-21 19:45:34 +010077 "Microcode Patch Buffer", /* xec = 010 */
Borislav Petkov86039cd2010-11-08 15:03:35 +010078 "uop queue",
79 "insn buffer",
80 "predecode buffer",
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +020081 "fetch address FIFO",
82 "dispatch uop queue"
Borislav Petkov86039cd2010-11-08 15:03:35 +010083};
84
Borislav Petkovf05c41a2012-09-11 18:57:43 +020085static const char * const f15h_mc2_mce_desc[] = {
Borislav Petkov70fdb492010-09-21 20:45:10 +020086 "Fill ECC error on data fills", /* xec = 0x4 */
87 "Fill parity error on insn fills",
88 "Prefetcher request FIFO parity error",
89 "PRQ address parity error",
90 "PRQ data parity error",
91 "WCC Tag ECC error",
92 "WCC Data ECC error",
93 "WCB Data parity error",
Borislav Petkovb64a99c2011-11-23 14:50:44 +010094 "VB Data ECC or parity error",
Borislav Petkov70fdb492010-09-21 20:45:10 +020095 "L2 Tag ECC error", /* xec = 0x10 */
96 "Hard L2 Tag ECC error",
97 "Multiple hits on L2 tag",
98 "XAB parity error",
99 "PRB address parity error"
100};
101
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200102static const char * const mc4_mce_desc[] = {
Borislav Petkov68782672011-11-24 21:29:57 +0100103 "DRAM ECC error detected on the NB",
104 "CRC error detected on HT link",
105 "Link-defined sync error packets detected on HT link",
106 "HT Master abort",
107 "HT Target abort",
108 "Invalid GART PTE entry during GART table walk",
109 "Unsupported atomic RMW received from an IO link",
110 "Watchdog timeout due to lack of progress",
111 "DRAM ECC error detected on the NB",
112 "SVM DMA Exclusion Vector error",
113 "HT data error detected on link",
114 "Protocol error (link, L3, probe filter)",
115 "NB internal arrays parity error",
116 "DRAM addr/ctl signals parity error",
117 "IO link transmission error",
118 "L3 data cache ECC error", /* xec = 0x1c */
119 "L3 cache tag error",
120 "L3 LRU parity bits error",
121 "ECC Error in the Probe Filter directory"
122};
123
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200124static const char * const mc5_mce_desc[] = {
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200125 "CPU Watchdog timer expire",
126 "Wakeup array dest tag",
127 "AG payload array",
128 "EX payload array",
129 "IDRF array",
130 "Retire dispatch queue",
131 "Mapper checkpoint array",
132 "Physical register file EX0 port",
133 "Physical register file EX1 port",
134 "Physical register file AG0 port",
135 "Physical register file AG1 port",
136 "Flag register file",
Aravind Gopalakrishnanaad19e52013-06-05 15:50:03 -0500137 "DE error occurred",
138 "Retire status queue"
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200139};
140
Aravind Gopalakrishnanbc4febe2014-11-04 11:41:08 -0600141static const char * const mc6_mce_desc[] = {
142 "Hardware Assertion",
143 "Free List",
144 "Physical Register File",
145 "Retire Queue",
146 "Scheduler table",
147 "Status Register File",
148};
149
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100150/* Scalable MCA error strings */
151static const char * const f17h_ls_mce_desc[] = {
152 "Load queue parity",
153 "Store queue parity",
154 "Miss address buffer payload parity",
155 "L1 TLB parity",
156 "", /* reserved */
157 "DC tag error type 6",
158 "DC tag error type 1",
159 "Internal error type 1",
160 "Internal error type 2",
161 "Sys Read data error thread 0",
162 "Sys read data error thread 1",
163 "DC tag error type 2",
164 "DC data error type 1 (poison comsumption)",
165 "DC data error type 2",
166 "DC data error type 3",
167 "DC tag error type 4",
168 "L2 TLB parity",
169 "PDC parity error",
170 "DC tag error type 3",
171 "DC tag error type 5",
172 "L2 fill data error",
173};
174
175static const char * const f17h_if_mce_desc[] = {
176 "microtag probe port parity error",
177 "IC microtag or full tag multi-hit error",
178 "IC full tag parity",
179 "IC data array parity",
180 "Decoupling queue phys addr parity error",
181 "L0 ITLB parity error",
182 "L1 ITLB parity error",
183 "L2 ITLB parity error",
184 "BPQ snoop parity on Thread 0",
185 "BPQ snoop parity on Thread 1",
186 "L1 BTB multi-match error",
187 "L2 BTB multi-match error",
188};
189
190static const char * const f17h_l2_mce_desc[] = {
191 "L2M tag multi-way-hit error",
192 "L2M tag ECC error",
193 "L2M data ECC error",
194 "HW assert",
195};
196
197static const char * const f17h_de_mce_desc[] = {
198 "uop cache tag parity error",
199 "uop cache data parity error",
200 "Insn buffer parity error",
201 "Insn dispatch queue parity error",
202 "Fetch address FIFO parity",
203 "Patch RAM data parity",
204 "Patch RAM sequencer parity",
205 "uop buffer parity"
206};
207
208static const char * const f17h_ex_mce_desc[] = {
209 "Watchdog timeout error",
210 "Phy register file parity",
211 "Flag register file parity",
212 "Immediate displacement register file parity",
213 "Address generator payload parity",
214 "EX payload parity",
215 "Checkpoint queue parity",
216 "Retire dispatch queue parity",
217};
218
219static const char * const f17h_fp_mce_desc[] = {
220 "Physical register file parity",
221 "Freelist parity error",
222 "Schedule queue parity",
223 "NSQ parity error",
224 "Retire queue parity",
225 "Status register file parity",
226};
227
228static const char * const f17h_l3_mce_desc[] = {
229 "Shadow tag macro ECC error",
230 "Shadow tag macro multi-way-hit error",
231 "L3M tag ECC error",
232 "L3M tag multi-way-hit error",
233 "L3M data ECC error",
234 "XI parity, L3 fill done channel error",
235 "L3 victim queue parity",
236 "L3 HW assert",
237};
238
239static const char * const f17h_cs_mce_desc[] = {
240 "Illegal request from transport layer",
241 "Address violation",
242 "Security violation",
243 "Illegal response from transport layer",
244 "Unexpected response",
245 "Parity error on incoming request or probe response data",
246 "Parity error on incoming read response data",
247 "Atomic request parity",
248 "ECC error on probe filter access",
249};
250
251static const char * const f17h_pie_mce_desc[] = {
252 "HW assert",
253 "Internal PIE register security violation",
254 "Error on GMI link",
255 "Poison data written to internal PIE register",
256};
257
258static const char * const f17h_umc_mce_desc[] = {
259 "DRAM ECC error",
260 "Data poison error on DRAM",
261 "SDP parity error",
262 "Advanced peripheral bus error",
263 "Command/address parity error",
264 "Write data CRC error",
265};
266
267static const char * const f17h_pb_mce_desc[] = {
268 "Parameter Block RAM ECC error",
269};
270
271static const char * const f17h_psp_mce_desc[] = {
272 "PSP RAM ECC or parity error",
273};
274
275static const char * const f17h_smu_mce_desc[] = {
276 "SMU RAM ECC or parity error",
277};
278
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200279static bool f12h_mc0_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200280{
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200281 bool ret = false;
282
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200283 if (MEM_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200284 u8 ll = LL(ec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200285 ret = true;
286
287 if (ll == LL_L2)
288 pr_cont("during L1 linefill from L2.\n");
289 else if (ll == LL_L1)
Borislav Petkov62452882010-09-22 16:08:37 +0200290 pr_cont("Data/Tag %s error.\n", R4_MSG(ec));
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200291 else
292 ret = false;
293 }
294 return ret;
295}
296
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200297static bool f10h_mc0_mce(u16 ec, u8 xec)
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200298{
Borislav Petkov62452882010-09-22 16:08:37 +0200299 if (R4(ec) == R4_GEN && LL(ec) == LL_L1) {
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200300 pr_cont("during data scrub.\n");
301 return true;
302 }
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200303 return f12h_mc0_mce(ec, xec);
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200304}
305
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200306static bool k8_mc0_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200307{
308 if (BUS_ERROR(ec)) {
309 pr_cont("during system linefill.\n");
310 return true;
311 }
312
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200313 return f10h_mc0_mce(ec, xec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200314}
315
Jacob Shin980eec82012-12-18 15:06:11 -0600316static bool cat_mc0_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200317{
Borislav Petkov62452882010-09-22 16:08:37 +0200318 u8 r4 = R4(ec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200319 bool ret = true;
320
321 if (MEM_ERROR(ec)) {
322
Borislav Petkov62452882010-09-22 16:08:37 +0200323 if (TT(ec) != TT_DATA || LL(ec) != LL_L1)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200324 return false;
325
326 switch (r4) {
327 case R4_DRD:
328 case R4_DWR:
329 pr_cont("Data/Tag parity error due to %s.\n",
330 (r4 == R4_DRD ? "load/hw prf" : "store"));
331 break;
332 case R4_EVICT:
333 pr_cont("Copyback parity error on a tag miss.\n");
334 break;
335 case R4_SNOOP:
336 pr_cont("Tag parity error during snoop.\n");
337 break;
338 default:
339 ret = false;
340 }
341 } else if (BUS_ERROR(ec)) {
342
Borislav Petkov62452882010-09-22 16:08:37 +0200343 if ((II(ec) != II_MEM && II(ec) != II_IO) || LL(ec) != LL_LG)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200344 return false;
345
346 pr_cont("System read data error on a ");
347
348 switch (r4) {
349 case R4_RD:
350 pr_cont("TLB reload.\n");
351 break;
352 case R4_DWR:
353 pr_cont("store.\n");
354 break;
355 case R4_DRD:
356 pr_cont("load.\n");
357 break;
358 default:
359 ret = false;
360 }
361 } else {
362 ret = false;
363 }
364
365 return ret;
366}
367
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200368static bool f15h_mc0_mce(u16 ec, u8 xec)
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200369{
370 bool ret = true;
371
372 if (MEM_ERROR(ec)) {
373
374 switch (xec) {
375 case 0x0:
376 pr_cont("Data Array access error.\n");
377 break;
378
379 case 0x1:
380 pr_cont("UC error during a linefill from L2/NB.\n");
381 break;
382
383 case 0x2:
384 case 0x11:
385 pr_cont("STQ access error.\n");
386 break;
387
388 case 0x3:
389 pr_cont("SCB access error.\n");
390 break;
391
392 case 0x10:
393 pr_cont("Tag error.\n");
394 break;
395
396 case 0x12:
397 pr_cont("LDQ access error.\n");
398 break;
399
400 default:
401 ret = false;
402 }
403 } else if (BUS_ERROR(ec)) {
404
405 if (!xec)
Borislav Petkov344f0a02011-11-15 17:10:58 +0100406 pr_cont("System Read Data Error.\n");
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200407 else
Borislav Petkov344f0a02011-11-15 17:10:58 +0100408 pr_cont(" Internal error condition type %d.\n", xec);
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200409 } else if (INT_ERROR(ec)) {
410 if (xec <= 0x1f)
411 pr_cont("Hardware Assert.\n");
412 else
413 ret = false;
414
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200415 } else
416 ret = false;
417
418 return ret;
419}
420
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200421static void decode_mc0_mce(struct mce *m)
Borislav Petkov51966242009-07-28 13:50:43 +0200422{
Borislav Petkov62452882010-09-22 16:08:37 +0200423 u16 ec = EC(m->status);
424 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov51966242009-07-28 13:50:43 +0200425
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200426 pr_emerg(HW_ERR "MC0 Error: ");
Borislav Petkov51966242009-07-28 13:50:43 +0200427
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200428 /* TLB error signatures are the same across families */
429 if (TLB_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200430 if (TT(ec) == TT_DATA) {
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200431 pr_cont("%s TLB %s.\n", LL_MSG(ec),
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200432 ((xec == 2) ? "locked miss"
433 : (xec ? "multimatch" : "parity")));
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200434 return;
435 }
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200436 } else if (fam_ops->mc0_mce(ec, xec))
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200437 ;
438 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200439 pr_emerg(HW_ERR "Corrupted MC0 MCE info?\n");
Borislav Petkov51966242009-07-28 13:50:43 +0200440}
441
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200442static bool k8_mc1_mce(u16 ec, u8 xec)
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200443{
Borislav Petkov62452882010-09-22 16:08:37 +0200444 u8 ll = LL(ec);
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200445 bool ret = true;
446
447 if (!MEM_ERROR(ec))
448 return false;
449
450 if (ll == 0x2)
451 pr_cont("during a linefill from L2.\n");
452 else if (ll == 0x1) {
Borislav Petkov62452882010-09-22 16:08:37 +0200453 switch (R4(ec)) {
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200454 case R4_IRD:
455 pr_cont("Parity error during data load.\n");
456 break;
457
458 case R4_EVICT:
459 pr_cont("Copyback Parity/Victim error.\n");
460 break;
461
462 case R4_SNOOP:
463 pr_cont("Tag Snoop error.\n");
464 break;
465
466 default:
467 ret = false;
468 break;
469 }
470 } else
471 ret = false;
472
473 return ret;
474}
475
Jacob Shin980eec82012-12-18 15:06:11 -0600476static bool cat_mc1_mce(u16 ec, u8 xec)
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200477{
Borislav Petkov62452882010-09-22 16:08:37 +0200478 u8 r4 = R4(ec);
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200479 bool ret = true;
480
Jacob Shin980eec82012-12-18 15:06:11 -0600481 if (!MEM_ERROR(ec))
482 return false;
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200483
Jacob Shin980eec82012-12-18 15:06:11 -0600484 if (TT(ec) != TT_INSTR)
485 return false;
486
487 if (r4 == R4_IRD)
488 pr_cont("Data/tag array parity error for a tag hit.\n");
489 else if (r4 == R4_SNOOP)
490 pr_cont("Tag error during snoop/victimization.\n");
491 else if (xec == 0x0)
492 pr_cont("Tag parity error from victim castout.\n");
493 else if (xec == 0x2)
494 pr_cont("Microcode patch RAM parity error.\n");
495 else
496 ret = false;
497
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200498 return ret;
499}
500
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200501static bool f15h_mc1_mce(u16 ec, u8 xec)
Borislav Petkov86039cd2010-11-08 15:03:35 +0100502{
503 bool ret = true;
504
505 if (!MEM_ERROR(ec))
506 return false;
507
508 switch (xec) {
509 case 0x0 ... 0xa:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200510 pr_cont("%s.\n", f15h_mc1_mce_desc[xec]);
Borislav Petkov86039cd2010-11-08 15:03:35 +0100511 break;
512
513 case 0xd:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200514 pr_cont("%s.\n", f15h_mc1_mce_desc[xec-2]);
Borislav Petkov86039cd2010-11-08 15:03:35 +0100515 break;
516
Borislav Petkov6c1173a2011-11-21 19:45:34 +0100517 case 0x10:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200518 pr_cont("%s.\n", f15h_mc1_mce_desc[xec-4]);
Borislav Petkov6c1173a2011-11-21 19:45:34 +0100519 break;
520
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200521 case 0x11 ... 0x15:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200522 pr_cont("Decoder %s parity error.\n", f15h_mc1_mce_desc[xec-4]);
Borislav Petkov86039cd2010-11-08 15:03:35 +0100523 break;
524
525 default:
526 ret = false;
527 }
528 return ret;
529}
530
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200531static void decode_mc1_mce(struct mce *m)
Borislav Petkovab5535e2009-07-28 14:06:26 +0200532{
Borislav Petkov62452882010-09-22 16:08:37 +0200533 u16 ec = EC(m->status);
534 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovab5535e2009-07-28 14:06:26 +0200535
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200536 pr_emerg(HW_ERR "MC1 Error: ");
Borislav Petkovab5535e2009-07-28 14:06:26 +0200537
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200538 if (TLB_ERROR(ec))
539 pr_cont("%s TLB %s.\n", LL_MSG(ec),
540 (xec ? "multimatch" : "parity error"));
541 else if (BUS_ERROR(ec)) {
Borislav Petkov525906b2010-10-15 15:27:02 +0200542 bool k8 = (boot_cpu_data.x86 == 0xf && (m->status & BIT_64(58)));
Borislav Petkovab5535e2009-07-28 14:06:26 +0200543
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200544 pr_cont("during %s.\n", (k8 ? "system linefill" : "NB data read"));
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200545 } else if (INT_ERROR(ec)) {
546 if (xec <= 0x3f)
547 pr_cont("Hardware Assert.\n");
548 else
549 goto wrong_mc1_mce;
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200550 } else if (fam_ops->mc1_mce(ec, xec))
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200551 ;
552 else
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200553 goto wrong_mc1_mce;
554
555 return;
556
557wrong_mc1_mce:
558 pr_emerg(HW_ERR "Corrupted MC1 MCE info?\n");
Borislav Petkovab5535e2009-07-28 14:06:26 +0200559}
560
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600561static bool k8_mc2_mce(u16 ec, u8 xec)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200562{
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600563 bool ret = true;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200564
565 if (xec == 0x1)
566 pr_cont(" in the write data buffers.\n");
567 else if (xec == 0x3)
568 pr_cont(" in the victim data buffers.\n");
569 else if (xec == 0x2 && MEM_ERROR(ec))
Borislav Petkov62452882010-09-22 16:08:37 +0200570 pr_cont(": %s error in the L2 cache tags.\n", R4_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200571 else if (xec == 0x0) {
572 if (TLB_ERROR(ec))
Borislav Petkov50872cc2014-11-22 13:41:01 +0100573 pr_cont("%s error in a Page Descriptor Cache or Guest TLB.\n",
574 TT_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200575 else if (BUS_ERROR(ec))
576 pr_cont(": %s/ECC error in data read from NB: %s.\n",
Borislav Petkov62452882010-09-22 16:08:37 +0200577 R4_MSG(ec), PP_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200578 else if (MEM_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200579 u8 r4 = R4(ec);
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200580
Borislav Petkov62452882010-09-22 16:08:37 +0200581 if (r4 >= 0x7)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200582 pr_cont(": %s error during data copyback.\n",
Borislav Petkov62452882010-09-22 16:08:37 +0200583 R4_MSG(ec));
584 else if (r4 <= 0x1)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200585 pr_cont(": %s parity/ECC error during data "
Borislav Petkov62452882010-09-22 16:08:37 +0200586 "access from L2.\n", R4_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200587 else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600588 ret = false;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200589 } else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600590 ret = false;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200591 } else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600592 ret = false;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200593
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600594 return ret;
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200595}
596
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600597static bool f15h_mc2_mce(u16 ec, u8 xec)
Borislav Petkov70fdb492010-09-21 20:45:10 +0200598{
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600599 bool ret = true;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200600
601 if (TLB_ERROR(ec)) {
602 if (xec == 0x0)
603 pr_cont("Data parity TLB read error.\n");
604 else if (xec == 0x1)
605 pr_cont("Poison data provided for TLB fill.\n");
606 else
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600607 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200608 } else if (BUS_ERROR(ec)) {
609 if (xec > 2)
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600610 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200611
612 pr_cont("Error during attempted NB data read.\n");
613 } else if (MEM_ERROR(ec)) {
614 switch (xec) {
615 case 0x4 ... 0xc:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200616 pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x4]);
Borislav Petkov70fdb492010-09-21 20:45:10 +0200617 break;
618
619 case 0x10 ... 0x14:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200620 pr_cont("%s.\n", f15h_mc2_mce_desc[xec - 0x7]);
Borislav Petkov70fdb492010-09-21 20:45:10 +0200621 break;
622
623 default:
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600624 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200625 }
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200626 } else if (INT_ERROR(ec)) {
627 if (xec <= 0x3f)
628 pr_cont("Hardware Assert.\n");
629 else
630 ret = false;
Borislav Petkov70fdb492010-09-21 20:45:10 +0200631 }
632
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600633 return ret;
634}
Borislav Petkov70fdb492010-09-21 20:45:10 +0200635
Jacob Shin980eec82012-12-18 15:06:11 -0600636static bool f16h_mc2_mce(u16 ec, u8 xec)
637{
638 u8 r4 = R4(ec);
639
640 if (!MEM_ERROR(ec))
641 return false;
642
643 switch (xec) {
644 case 0x04 ... 0x05:
645 pr_cont("%cBUFF parity error.\n", (r4 == R4_RD) ? 'I' : 'O');
646 break;
647
648 case 0x09 ... 0x0b:
649 case 0x0d ... 0x0f:
650 pr_cont("ECC error in L2 tag (%s).\n",
651 ((r4 == R4_GEN) ? "BankReq" :
652 ((r4 == R4_SNOOP) ? "Prb" : "Fill")));
653 break;
654
655 case 0x10 ... 0x19:
656 case 0x1b:
657 pr_cont("ECC error in L2 data array (%s).\n",
658 (((r4 == R4_RD) && !(xec & 0x3)) ? "Hit" :
659 ((r4 == R4_GEN) ? "Attr" :
660 ((r4 == R4_EVICT) ? "Vict" : "Fill"))));
661 break;
662
663 case 0x1c ... 0x1d:
664 case 0x1f:
665 pr_cont("Parity error in L2 attribute bits (%s).\n",
666 ((r4 == R4_RD) ? "Hit" :
667 ((r4 == R4_GEN) ? "Attr" : "Fill")));
668 break;
669
670 default:
671 return false;
672 }
673
674 return true;
675}
676
Jacob Shin4a73d3d2012-12-18 15:06:10 -0600677static void decode_mc2_mce(struct mce *m)
678{
679 u16 ec = EC(m->status);
680 u8 xec = XEC(m->status, xec_mask);
681
682 pr_emerg(HW_ERR "MC2 Error: ");
683
684 if (!fam_ops->mc2_mce(ec, xec))
685 pr_cont(HW_ERR "Corrupted MC2 MCE info?\n");
Borislav Petkov70fdb492010-09-21 20:45:10 +0200686}
687
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200688static void decode_mc3_mce(struct mce *m)
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200689{
Borislav Petkov62452882010-09-22 16:08:37 +0200690 u16 ec = EC(m->status);
691 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovded50622010-08-27 17:03:34 +0200692
Borislav Petkovb18434c2010-09-22 11:53:32 +0200693 if (boot_cpu_data.x86 >= 0x14) {
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200694 pr_emerg("You shouldn't be seeing MC3 MCE on this cpu family,"
Borislav Petkovded50622010-08-27 17:03:34 +0200695 " please report on LKML.\n");
696 return;
697 }
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200698
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200699 pr_emerg(HW_ERR "MC3 Error");
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200700
701 if (xec == 0x0) {
Borislav Petkov62452882010-09-22 16:08:37 +0200702 u8 r4 = R4(ec);
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200703
Borislav Petkovded50622010-08-27 17:03:34 +0200704 if (!BUS_ERROR(ec) || (r4 != R4_DRD && r4 != R4_DWR))
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200705 goto wrong_mc3_mce;
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200706
Borislav Petkov62452882010-09-22 16:08:37 +0200707 pr_cont(" during %s.\n", R4_MSG(ec));
Borislav Petkovded50622010-08-27 17:03:34 +0200708 } else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200709 goto wrong_mc3_mce;
Borislav Petkovded50622010-08-27 17:03:34 +0200710
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200711 return;
712
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200713 wrong_mc3_mce:
714 pr_emerg(HW_ERR "Corrupted MC3 MCE info?\n");
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200715}
716
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200717static void decode_mc4_mce(struct mce *m)
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200718{
Borislav Petkov68782672011-11-24 21:29:57 +0100719 struct cpuinfo_x86 *c = &boot_cpu_data;
720 int node_id = amd_get_nb_id(m->extcpu);
721 u16 ec = EC(m->status);
722 u8 xec = XEC(m->status, 0x1f);
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200723 u8 offset = 0;
724
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200725 pr_emerg(HW_ERR "MC4 Error (node %d): ", node_id);
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200726
Borislav Petkov68782672011-11-24 21:29:57 +0100727 switch (xec) {
728 case 0x0 ... 0xe:
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200729
Borislav Petkov68782672011-11-24 21:29:57 +0100730 /* special handling for DRAM ECCs */
731 if (xec == 0x0 || xec == 0x8) {
732 /* no ECCs on F11h */
733 if (c->x86 == 0x11)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200734 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100735
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200736 pr_cont("%s.\n", mc4_mce_desc[xec]);
Borislav Petkov68782672011-11-24 21:29:57 +0100737
738 if (nb_bus_decoder)
739 nb_bus_decoder(node_id, m);
740 return;
741 }
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200742 break;
743
744 case 0xf:
745 if (TLB_ERROR(ec))
746 pr_cont("GART Table Walk data error.\n");
747 else if (BUS_ERROR(ec))
748 pr_cont("DMA Exclusion Vector Table Walk error.\n");
749 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200750 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100751 return;
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200752
Borislav Petkov05cd6672010-09-22 15:06:24 +0200753 case 0x19:
Jacob Shin980eec82012-12-18 15:06:11 -0600754 if (boot_cpu_data.x86 == 0x15 || boot_cpu_data.x86 == 0x16)
Borislav Petkov05cd6672010-09-22 15:06:24 +0200755 pr_cont("Compute Unit Data Error.\n");
756 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200757 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100758 return;
Borislav Petkov05cd6672010-09-22 15:06:24 +0200759
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200760 case 0x1c ... 0x1f:
Borislav Petkov68782672011-11-24 21:29:57 +0100761 offset = 13;
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200762 break;
763
764 default:
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200765 goto wrong_mc4_mce;
Borislav Petkov68782672011-11-24 21:29:57 +0100766 }
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200767
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200768 pr_cont("%s.\n", mc4_mce_desc[xec - offset]);
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200769 return;
770
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200771 wrong_mc4_mce:
772 pr_emerg(HW_ERR "Corrupted MC4 MCE info?\n");
Borislav Petkovd93cc222009-07-28 10:56:15 +0200773}
Borislav Petkovd93cc222009-07-28 10:56:15 +0200774
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200775static void decode_mc5_mce(struct mce *m)
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200776{
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200777 struct cpuinfo_x86 *c = &boot_cpu_data;
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200778 u16 ec = EC(m->status);
Borislav Petkov62452882010-09-22 16:08:37 +0200779 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200780
781 if (c->x86 == 0xf || c->x86 == 0x11)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200782 goto wrong_mc5_mce;
Borislav Petkovfe4ea262010-08-31 18:38:24 +0200783
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200784 pr_emerg(HW_ERR "MC5 Error: ");
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200785
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +0200786 if (INT_ERROR(ec)) {
787 if (xec <= 0x1f) {
788 pr_cont("Hardware Assert.\n");
789 return;
790 } else
791 goto wrong_mc5_mce;
792 }
793
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200794 if (xec == 0x0 || xec == 0xc)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200795 pr_cont("%s.\n", mc5_mce_desc[xec]);
Aravind Gopalakrishnanaad19e52013-06-05 15:50:03 -0500796 else if (xec <= 0xd)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200797 pr_cont("%s parity error.\n", mc5_mce_desc[xec]);
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200798 else
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200799 goto wrong_mc5_mce;
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200800
801 return;
Borislav Petkovfe4ea262010-08-31 18:38:24 +0200802
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200803 wrong_mc5_mce:
804 pr_emerg(HW_ERR "Corrupted MC5 MCE info?\n");
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200805}
806
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200807static void decode_mc6_mce(struct mce *m)
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200808{
Borislav Petkov62452882010-09-22 16:08:37 +0200809 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200810
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200811 pr_emerg(HW_ERR "MC6 Error: ");
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200812
Aravind Gopalakrishnanbc4febe2014-11-04 11:41:08 -0600813 if (xec > 0x5)
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200814 goto wrong_mc6_mce;
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200815
Aravind Gopalakrishnanbc4febe2014-11-04 11:41:08 -0600816 pr_cont("%s parity error.\n", mc6_mce_desc[xec]);
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200817 return;
818
Borislav Petkovf05c41a2012-09-11 18:57:43 +0200819 wrong_mc6_mce:
820 pr_emerg(HW_ERR "Corrupted MC6 MCE info?\n");
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200821}
822
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +0100823static void decode_f17h_core_errors(const char *ip_name, u8 xec,
824 unsigned int mca_type)
825{
826 const char * const *error_desc_array;
827 size_t len;
828
829 pr_emerg(HW_ERR "%s Error: ", ip_name);
830
831 switch (mca_type) {
832 case SMCA_LS:
833 error_desc_array = f17h_ls_mce_desc;
834 len = ARRAY_SIZE(f17h_ls_mce_desc) - 1;
835
836 if (xec == 0x4) {
837 pr_cont("Unrecognized LS MCA error code.\n");
838 return;
839 }
840 break;
841
842 case SMCA_IF:
843 error_desc_array = f17h_if_mce_desc;
844 len = ARRAY_SIZE(f17h_if_mce_desc) - 1;
845 break;
846
847 case SMCA_L2_CACHE:
848 error_desc_array = f17h_l2_mce_desc;
849 len = ARRAY_SIZE(f17h_l2_mce_desc) - 1;
850 break;
851
852 case SMCA_DE:
853 error_desc_array = f17h_de_mce_desc;
854 len = ARRAY_SIZE(f17h_de_mce_desc) - 1;
855 break;
856
857 case SMCA_EX:
858 error_desc_array = f17h_ex_mce_desc;
859 len = ARRAY_SIZE(f17h_ex_mce_desc) - 1;
860 break;
861
862 case SMCA_FP:
863 error_desc_array = f17h_fp_mce_desc;
864 len = ARRAY_SIZE(f17h_fp_mce_desc) - 1;
865 break;
866
867 case SMCA_L3_CACHE:
868 error_desc_array = f17h_l3_mce_desc;
869 len = ARRAY_SIZE(f17h_l3_mce_desc) - 1;
870 break;
871
872 default:
873 pr_cont("Corrupted MCA core error info.\n");
874 return;
875 }
876
877 if (xec > len) {
878 pr_cont("Unrecognized %s MCA bank error code.\n",
879 amd_core_mcablock_names[mca_type]);
880 return;
881 }
882
883 pr_cont("%s.\n", error_desc_array[xec]);
884}
885
886static void decode_df_errors(u8 xec, unsigned int mca_type)
887{
888 const char * const *error_desc_array;
889 size_t len;
890
891 pr_emerg(HW_ERR "Data Fabric Error: ");
892
893 switch (mca_type) {
894 case SMCA_CS:
895 error_desc_array = f17h_cs_mce_desc;
896 len = ARRAY_SIZE(f17h_cs_mce_desc) - 1;
897 break;
898
899 case SMCA_PIE:
900 error_desc_array = f17h_pie_mce_desc;
901 len = ARRAY_SIZE(f17h_pie_mce_desc) - 1;
902 break;
903
904 default:
905 pr_cont("Corrupted MCA Data Fabric info.\n");
906 return;
907 }
908
909 if (xec > len) {
910 pr_cont("Unrecognized %s MCA bank error code.\n",
911 amd_df_mcablock_names[mca_type]);
912 return;
913 }
914
915 pr_cont("%s.\n", error_desc_array[xec]);
916}
917
918/* Decode errors according to Scalable MCA specification */
919static void decode_smca_errors(struct mce *m)
920{
921 u32 addr = MSR_AMD64_SMCA_MCx_IPID(m->bank);
922 unsigned int hwid, mca_type, i;
923 u8 xec = XEC(m->status, xec_mask);
924 const char * const *error_desc_array;
925 const char *ip_name;
926 u32 low, high;
927 size_t len;
928
929 if (rdmsr_safe(addr, &low, &high)) {
930 pr_emerg("Invalid IP block specified, error information is unreliable.\n");
931 return;
932 }
933
934 hwid = high & MCI_IPID_HWID;
935 mca_type = (high & MCI_IPID_MCATYPE) >> 16;
936
937 pr_emerg(HW_ERR "MC%d IPID value: 0x%08x%08x\n", m->bank, high, low);
938
939 /*
940 * Based on hwid and mca_type values, decode errors from respective IPs.
941 * Note: mca_type values make sense only in the context of an hwid.
942 */
943 for (i = 0; i < ARRAY_SIZE(amd_hwids); i++)
944 if (amd_hwids[i].hwid == hwid)
945 break;
946
947 switch (i) {
948 case SMCA_F17H_CORE:
949 ip_name = (mca_type == SMCA_L3_CACHE) ?
950 "L3 Cache" : "F17h Core";
951 return decode_f17h_core_errors(ip_name, xec, mca_type);
952 break;
953
954 case SMCA_DF:
955 return decode_df_errors(xec, mca_type);
956 break;
957
958 case SMCA_UMC:
959 error_desc_array = f17h_umc_mce_desc;
960 len = ARRAY_SIZE(f17h_umc_mce_desc) - 1;
961 break;
962
963 case SMCA_PB:
964 error_desc_array = f17h_pb_mce_desc;
965 len = ARRAY_SIZE(f17h_pb_mce_desc) - 1;
966 break;
967
968 case SMCA_PSP:
969 error_desc_array = f17h_psp_mce_desc;
970 len = ARRAY_SIZE(f17h_psp_mce_desc) - 1;
971 break;
972
973 case SMCA_SMU:
974 error_desc_array = f17h_smu_mce_desc;
975 len = ARRAY_SIZE(f17h_smu_mce_desc) - 1;
976 break;
977
978 default:
979 pr_emerg(HW_ERR "HWID:%d does not match any existing IPs.\n", hwid);
980 return;
981 }
982
983 ip_name = amd_hwids[i].name;
984 pr_emerg(HW_ERR "%s Error: ", ip_name);
985
986 if (xec > len) {
987 pr_cont("Unrecognized %s MCA bank error code.\n", ip_name);
988 return;
989 }
990
991 pr_cont("%s.\n", error_desc_array[xec]);
992}
993
Borislav Petkov63375832010-09-06 18:13:39 +0200994static inline void amd_decode_err_code(u16 ec)
Borislav Petkovd93cc222009-07-28 10:56:15 +0200995{
Jacob Shin980eec82012-12-18 15:06:11 -0600996 if (INT_ERROR(ec)) {
997 pr_emerg(HW_ERR "internal: %s\n", UU_MSG(ec));
998 return;
999 }
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +02001000
1001 pr_emerg(HW_ERR "cache level: %s", LL_MSG(ec));
1002
1003 if (BUS_ERROR(ec))
1004 pr_cont(", mem/io: %s", II_MSG(ec));
1005 else
1006 pr_cont(", tx: %s", TT_MSG(ec));
1007
1008 if (MEM_ERROR(ec) || BUS_ERROR(ec)) {
1009 pr_cont(", mem-tx: %s", R4_MSG(ec));
1010
1011 if (BUS_ERROR(ec))
1012 pr_cont(", part-proc: %s (%s)", PP_MSG(ec), TO_MSG(ec));
1013 }
1014
1015 pr_cont("\n");
Borislav Petkov549d0422009-07-24 13:51:42 +02001016}
Borislav Petkov549d0422009-07-24 13:51:42 +02001017
Borislav Petkov5ce88f62010-08-31 18:28:08 +02001018/*
1019 * Filter out unwanted MCE signatures here.
1020 */
1021static bool amd_filter_mce(struct mce *m)
1022{
1023 u8 xec = (m->status >> 16) & 0x1f;
1024
1025 /*
1026 * NB GART TLB error reporting is disabled by default.
1027 */
1028 if (m->bank == 4 && xec == 0x5 && !report_gart_errors)
1029 return true;
1030
1031 return false;
1032}
1033
Borislav Petkovd5c67702012-09-14 20:25:37 +02001034static const char *decode_error_status(struct mce *m)
1035{
1036 if (m->status & MCI_STATUS_UC) {
1037 if (m->status & MCI_STATUS_PCC)
1038 return "System Fatal error.";
1039 if (m->mcgstatus & MCG_STATUS_RIPV)
1040 return "Uncorrected, software restartable error.";
1041 return "Uncorrected, software containable error.";
1042 }
1043
1044 if (m->status & MCI_STATUS_DEFERRED)
1045 return "Deferred error.";
1046
1047 return "Corrected error, no action required.";
1048}
1049
Borislav Petkov9cdeb402010-09-02 18:33:24 +02001050int amd_decode_mce(struct notifier_block *nb, unsigned long val, void *data)
Borislav Petkov549d0422009-07-24 13:51:42 +02001051{
Borislav Petkovfb253192009-10-07 13:20:38 +02001052 struct mce *m = (struct mce *)data;
Borislav Petkovf89f8382012-09-13 15:14:22 +02001053 struct cpuinfo_x86 *c = &cpu_data(m->extcpu);
Borislav Petkovb0b07a22011-08-24 18:44:22 +02001054 int ecc;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001055 u32 ebx = cpuid_ebx(0x80000007);
Borislav Petkov549d0422009-07-24 13:51:42 +02001056
Borislav Petkov5ce88f62010-08-31 18:28:08 +02001057 if (amd_filter_mce(m))
1058 return NOTIFY_STOP;
1059
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001060 pr_emerg(HW_ERR "%s\n", decode_error_status(m));
1061
1062 pr_emerg(HW_ERR "CPU:%d (%x:%x:%x) MC%d_STATUS[%s|%s|%s|%s|%s",
1063 m->extcpu,
1064 c->x86, c->x86_model, c->x86_mask,
1065 m->bank,
1066 ((m->status & MCI_STATUS_OVER) ? "Over" : "-"),
Aravind Gopalakrishnan99e1dfb2015-07-13 06:53:02 -05001067 ((m->status & MCI_STATUS_UC) ? "UE" :
1068 (m->status & MCI_STATUS_DEFERRED) ? "-" : "CE"),
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001069 ((m->status & MCI_STATUS_MISCV) ? "MiscV" : "-"),
1070 ((m->status & MCI_STATUS_PCC) ? "PCC" : "-"),
1071 ((m->status & MCI_STATUS_ADDRV) ? "AddrV" : "-"));
1072
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001073 if (c->x86 >= 0x15)
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001074 pr_cont("|%s|%s",
1075 ((m->status & MCI_STATUS_DEFERRED) ? "Deferred" : "-"),
1076 ((m->status & MCI_STATUS_POISON) ? "Poison" : "-"));
1077
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001078 if (!!(ebx & BIT(3))) {
1079 u32 low, high;
1080 u32 addr = MSR_AMD64_SMCA_MCx_CONFIG(m->bank);
1081
1082 if (!rdmsr_safe(addr, &low, &high) &&
1083 (low & MCI_CONFIG_MCAX))
1084 pr_cont("|%s", ((m->status & MCI_STATUS_TCC) ? "TCC" : "-"));
1085 }
1086
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001087 /* do the two bits[14:13] together */
1088 ecc = (m->status >> 45) & 0x3;
1089 if (ecc)
1090 pr_cont("|%sECC", ((ecc == 2) ? "C" : "U"));
1091
1092 pr_cont("]: 0x%016llx\n", m->status);
1093
1094 if (m->status & MCI_STATUS_ADDRV)
Borislav Petkov50872cc2014-11-22 13:41:01 +01001095 pr_emerg(HW_ERR "MC%d Error Address: 0x%016llx\n", m->bank, m->addr);
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001096
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001097 if (!!(ebx & BIT(3))) {
1098 decode_smca_errors(m);
1099 goto err_code;
1100 }
1101
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001102 if (!fam_ops)
1103 goto err_code;
1104
Borislav Petkov51966242009-07-28 13:50:43 +02001105 switch (m->bank) {
1106 case 0:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001107 decode_mc0_mce(m);
Borislav Petkov51966242009-07-28 13:50:43 +02001108 break;
Borislav Petkovd93cc222009-07-28 10:56:15 +02001109
Borislav Petkovab5535e2009-07-28 14:06:26 +02001110 case 1:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001111 decode_mc1_mce(m);
Borislav Petkovab5535e2009-07-28 14:06:26 +02001112 break;
1113
Borislav Petkov56cad2d2009-07-28 14:14:24 +02001114 case 2:
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001115 decode_mc2_mce(m);
Borislav Petkov56cad2d2009-07-28 14:14:24 +02001116 break;
1117
Borislav Petkovf9350ef2009-07-28 14:17:30 +02001118 case 3:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001119 decode_mc3_mce(m);
Borislav Petkovf9350ef2009-07-28 14:17:30 +02001120 break;
1121
Borislav Petkov51966242009-07-28 13:50:43 +02001122 case 4:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001123 decode_mc4_mce(m);
Borislav Petkov51966242009-07-28 13:50:43 +02001124 break;
1125
Borislav Petkov53bd5fe2009-07-28 14:20:46 +02001126 case 5:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001127 decode_mc5_mce(m);
Borislav Petkov53bd5fe2009-07-28 14:20:46 +02001128 break;
1129
Borislav Petkovb8f85c42010-09-22 15:37:58 +02001130 case 6:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001131 decode_mc6_mce(m);
Borislav Petkovb8f85c42010-09-22 15:37:58 +02001132 break;
1133
Borislav Petkov51966242009-07-28 13:50:43 +02001134 default:
1135 break;
Borislav Petkovb69b29d2009-07-27 16:21:14 +02001136 }
Borislav Petkov51966242009-07-28 13:50:43 +02001137
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001138 err_code:
Borislav Petkov51966242009-07-28 13:50:43 +02001139 amd_decode_err_code(m->status & 0xffff);
Borislav Petkovfb253192009-10-07 13:20:38 +02001140
1141 return NOTIFY_STOP;
Borislav Petkov549d0422009-07-24 13:51:42 +02001142}
Borislav Petkov9cdeb402010-09-02 18:33:24 +02001143EXPORT_SYMBOL_GPL(amd_decode_mce);
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001144
Borislav Petkovfb253192009-10-07 13:20:38 +02001145static struct notifier_block amd_mce_dec_nb = {
1146 .notifier_call = amd_decode_mce,
1147};
1148
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001149static int __init mce_amd_init(void)
1150{
Borislav Petkovbad11e02010-09-22 17:44:51 +02001151 struct cpuinfo_x86 *c = &boot_cpu_data;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001152 u32 ebx;
Borislav Petkovbad11e02010-09-22 17:44:51 +02001153
1154 if (c->x86_vendor != X86_VENDOR_AMD)
Borislav Petkovfd0f5fff2014-02-17 20:51:52 +01001155 return -ENODEV;
Borislav Petkove045c292010-08-06 18:55:45 +02001156
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001157 fam_ops = kzalloc(sizeof(struct amd_decoder_ops), GFP_KERNEL);
1158 if (!fam_ops)
1159 return -ENOMEM;
1160
Borislav Petkovbad11e02010-09-22 17:44:51 +02001161 switch (c->x86) {
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001162 case 0xf:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001163 fam_ops->mc0_mce = k8_mc0_mce;
1164 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001165 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001166 break;
1167
1168 case 0x10:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001169 fam_ops->mc0_mce = f10h_mc0_mce;
1170 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001171 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001172 break;
1173
Borislav Petkovf0157b32010-10-05 19:07:16 +02001174 case 0x11:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001175 fam_ops->mc0_mce = k8_mc0_mce;
1176 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001177 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkovf0157b32010-10-05 19:07:16 +02001178 break;
1179
Borislav Petkov9be0bb12010-09-16 15:08:14 +02001180 case 0x12:
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001181 fam_ops->mc0_mce = f12h_mc0_mce;
1182 fam_ops->mc1_mce = k8_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001183 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov9be0bb12010-09-16 15:08:14 +02001184 break;
1185
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001186 case 0x14:
Jacob Shin980eec82012-12-18 15:06:11 -06001187 fam_ops->mc0_mce = cat_mc0_mce;
1188 fam_ops->mc1_mce = cat_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001189 fam_ops->mc2_mce = k8_mc2_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001190 break;
1191
Borislav Petkov2be64bf2010-09-17 19:11:47 +02001192 case 0x15:
Aravind Gopalakrishnaneba4bfb2014-07-14 16:58:19 +02001193 xec_mask = c->x86_model == 0x60 ? 0x3f : 0x1f;
1194
Borislav Petkovf05c41a2012-09-11 18:57:43 +02001195 fam_ops->mc0_mce = f15h_mc0_mce;
1196 fam_ops->mc1_mce = f15h_mc1_mce;
Jacob Shin4a73d3d2012-12-18 15:06:10 -06001197 fam_ops->mc2_mce = f15h_mc2_mce;
Borislav Petkov2be64bf2010-09-17 19:11:47 +02001198 break;
1199
Jacob Shin980eec82012-12-18 15:06:11 -06001200 case 0x16:
1201 xec_mask = 0x1f;
1202 fam_ops->mc0_mce = cat_mc0_mce;
1203 fam_ops->mc1_mce = cat_mc1_mce;
1204 fam_ops->mc2_mce = f16h_mc2_mce;
1205 break;
1206
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001207 case 0x17:
1208 ebx = cpuid_ebx(0x80000007);
1209 xec_mask = 0x3f;
1210 if (!(ebx & BIT(3))) {
1211 printk(KERN_WARNING "Decoding supported only on Scalable MCA processors.\n");
1212 goto err_out;
1213 }
1214 break;
1215
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001216 default:
Borislav Petkovec3e82d2012-04-04 14:21:02 +02001217 printk(KERN_WARNING "Huh? What family is it: 0x%x?!\n", c->x86);
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001218 goto err_out;
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001219 }
1220
Borislav Petkov9530d602010-09-06 15:05:45 +02001221 pr_info("MCE: In-kernel MCE decoding enabled.\n");
1222
Borislav Petkov3653ada2011-12-04 15:12:09 +01001223 mce_register_decode_chain(&amd_mce_dec_nb);
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001224
1225 return 0;
Aravind Gopalakrishnanbe0aec22016-03-07 14:02:18 +01001226
1227err_out:
1228 kfree(fam_ops);
1229 fam_ops = NULL;
1230 return -EINVAL;
Ingo Molnarf436f8b2009-10-01 16:14:32 +02001231}
1232early_initcall(mce_amd_init);
Borislav Petkov0d18b2e2009-10-02 15:31:48 +02001233
1234#ifdef MODULE
1235static void __exit mce_amd_exit(void)
1236{
Borislav Petkov3653ada2011-12-04 15:12:09 +01001237 mce_unregister_decode_chain(&amd_mce_dec_nb);
Borislav Petkov888ab8e2010-08-18 15:11:35 +02001238 kfree(fam_ops);
Borislav Petkov0d18b2e2009-10-02 15:31:48 +02001239}
1240
1241MODULE_DESCRIPTION("AMD MCE decoder");
1242MODULE_ALIAS("edac-mce-amd");
1243MODULE_LICENSE("GPL");
1244module_exit(mce_amd_exit);
1245#endif