blob: b81c5da542c024cef2aa0a511f9da81377e62724 [file] [log] [blame]
Borislav Petkovb70ef012009-06-25 19:32:38 +02001#include <linux/module.h>
Borislav Petkov888ab8e2010-08-18 15:11:35 +02002#include <linux/slab.h>
3
Borislav Petkov47ca08a2010-09-27 15:30:39 +02004#include "mce_amd.h"
Doug Thompsonb52401ce2009-05-06 17:57:20 +02005
Borislav Petkov888ab8e2010-08-18 15:11:35 +02006static struct amd_decoder_ops *fam_ops;
7
Borislav Petkov2be64bf2010-09-17 19:11:47 +02008static u8 xec_mask = 0xf;
Borislav Petkov5ce88f62010-08-31 18:28:08 +02009static u8 nb_err_cpumask = 0xf;
10
Borislav Petkov549d0422009-07-24 13:51:42 +020011static bool report_gart_errors;
Borislav Petkov7cfd4a82010-09-01 14:45:20 +020012static void (*nb_bus_decoder)(int node_id, struct mce *m, u32 nbcfg);
Borislav Petkov549d0422009-07-24 13:51:42 +020013
14void amd_report_gart_errors(bool v)
15{
16 report_gart_errors = v;
17}
18EXPORT_SYMBOL_GPL(amd_report_gart_errors);
19
Borislav Petkov7cfd4a82010-09-01 14:45:20 +020020void amd_register_ecc_decoder(void (*f)(int, struct mce *, u32))
Borislav Petkov549d0422009-07-24 13:51:42 +020021{
22 nb_bus_decoder = f;
23}
24EXPORT_SYMBOL_GPL(amd_register_ecc_decoder);
25
Borislav Petkov7cfd4a82010-09-01 14:45:20 +020026void amd_unregister_ecc_decoder(void (*f)(int, struct mce *, u32))
Borislav Petkov549d0422009-07-24 13:51:42 +020027{
28 if (nb_bus_decoder) {
29 WARN_ON(nb_bus_decoder != f);
30
31 nb_bus_decoder = NULL;
32 }
33}
34EXPORT_SYMBOL_GPL(amd_unregister_ecc_decoder);
35
/*
 * String representations of the individual fields of an MCA error code,
 * see F3x48 or MSR0000_0411.
 */

/* transaction type */
const char *tt_msgs[] = {
	"INSN", "DATA", "GEN", "RESV"
};
EXPORT_SYMBOL_GPL(tt_msgs);

/* cache level */
const char *ll_msgs[] = {
	"RESV", "L1", "L2", "L3/GEN"
};
EXPORT_SYMBOL_GPL(ll_msgs);

/* memory transaction type (nine entries only) */
const char *rrrr_msgs[] = {
	"GEN", "RD", "WR", "DRD", "DWR", "IRD", "PRF", "EV", "SNP"
};
EXPORT_SYMBOL_GPL(rrrr_msgs);

/* participating processor */
const char *pp_msgs[] = {
	"SRC", "RES", "OBS", "GEN"
};
EXPORT_SYMBOL_GPL(pp_msgs);

/* request timeout */
const char *to_msgs[] = {
	"no timeout", "timed out"
};
EXPORT_SYMBOL_GPL(to_msgs);

/* memory or i/o */
const char *ii_msgs[] = {
	"MEM", "RESV", "IO", "GEN"
};
EXPORT_SYMBOL_GPL(ii_msgs);
Doug Thompsonb52401ce2009-05-06 17:57:20 +020066
/*
 * Northbridge error descriptions printed by f10h_nb_mce().
 *
 * The table is packed: f10h_nb_mce() subtracts a per-range offset from
 * the extended error code to index it (xec 0xa-0xc -> 0-2, 0xe -> 3,
 * 0x1c-0x1f -> 4-7).
 *
 * Both the strings and the pointer slots are const, matching the other
 * static description tables in this file.
 */
static const char * const f10h_nb_mce_desc[] = {
	"HT link data error",				/* xec = 0xa */
	"Protocol error (link, L3, probe filter, etc.)",
	"Parity error in NB-internal arrays",
	"Link Retry due to IO link transmission error",	/* xec = 0xe */
	"L3 ECC data cache error",			/* xec = 0x1c */
	"ECC error in L3 cache tag",
	"L3 LRU parity bits error",
	"ECC Error in the Probe Filter directory"
};
Borislav Petkov549d0422009-07-24 13:51:42 +020077
/*
 * Family 15h instruction cache error descriptions, indexed by
 * f15h_ic_mce(): xec 0x0-0xa map directly, xec 0xd maps to slot 11 and
 * xec 0x10-0x14 map to slots 12-16.
 */
static const char * const f15h_ic_mce_desc[] = {
	[0]  = "UC during a demand linefill from L2",	/* xec = 0x0 */
	[1]  = "Parity error during data load from IC",
	[2]  = "Parity error for IC valid bit",
	[3]  = "Main tag parity error",
	[4]  = "Parity error in prediction queue",
	[5]  = "PFB data/address parity error",
	[6]  = "Parity error in the branch status reg",
	[7]  = "PFB promotion address error",
	[8]  = "Tag error during probe/victimization",
	[9]  = "Parity error for IC probe tag valid bit",
	[10] = "PFB non-cacheable bit parity error",	/* xec = 0xa */
	[11] = "PFB valid bit parity error",		/* xec = 0xd */
	[12] = "patch RAM",				/* xec = 0x10 */
	[13] = "uop queue",
	[14] = "insn buffer",
	[15] = "predecode buffer",
	[16] = "fetch address FIFO"			/* xec = 0x14 */
};
97
/*
 * Family 15h combined unit error descriptions, indexed by
 * amd_decode_cu_mce(): xec 0x4-0xc map to slots 0-8 and xec 0x10-0x14
 * map to slots 9-13.
 */
static const char * const f15h_cu_mce_desc[] = {
	[0]  = "Fill ECC error on data fills",		/* xec = 0x4 */
	[1]  = "Fill parity error on insn fills",
	[2]  = "Prefetcher request FIFO parity error",
	[3]  = "PRQ address parity error",
	[4]  = "PRQ data parity error",
	[5]  = "WCC Tag ECC error",
	[6]  = "WCC Data ECC error",
	[7]  = "WCB Data parity error",
	[8]  = "VB Data/ECC error",			/* xec = 0xc */
	[9]  = "L2 Tag ECC error",			/* xec = 0x10 */
	[10] = "Hard L2 Tag ECC error",
	[11] = "Multiple hits on L2 tag",
	[12] = "XAB parity error",
	[13] = "PRB address parity error"		/* xec = 0x14 */
};
114
/*
 * Descriptions used by amd_decode_fr_mce(), indexed directly by the
 * extended error code (0x0 - 0xc).
 */
static const char * const fr_ex_mce_desc[] = {
	[0x0] = "CPU Watchdog timer expire",
	[0x1] = "Wakeup array dest tag",
	[0x2] = "AG payload array",
	[0x3] = "EX payload array",
	[0x4] = "IDRF array",
	[0x5] = "Retire dispatch queue",
	[0x6] = "Mapper checkpoint array",
	[0x7] = "Physical register file EX0 port",
	[0x8] = "Physical register file EX1 port",
	[0x9] = "Physical register file AG0 port",
	[0xa] = "Physical register file AG1 port",
	[0xb] = "Flag register file",
	[0xc] = "DE correctable error could not be corrected"
};
130
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200131static bool f12h_dc_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200132{
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200133 bool ret = false;
134
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200135 if (MEM_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200136 u8 ll = LL(ec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200137 ret = true;
138
139 if (ll == LL_L2)
140 pr_cont("during L1 linefill from L2.\n");
141 else if (ll == LL_L1)
Borislav Petkov62452882010-09-22 16:08:37 +0200142 pr_cont("Data/Tag %s error.\n", R4_MSG(ec));
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200143 else
144 ret = false;
145 }
146 return ret;
147}
148
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200149static bool f10h_dc_mce(u16 ec, u8 xec)
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200150{
Borislav Petkov62452882010-09-22 16:08:37 +0200151 if (R4(ec) == R4_GEN && LL(ec) == LL_L1) {
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200152 pr_cont("during data scrub.\n");
153 return true;
154 }
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200155 return f12h_dc_mce(ec, xec);
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200156}
157
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200158static bool k8_dc_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200159{
160 if (BUS_ERROR(ec)) {
161 pr_cont("during system linefill.\n");
162 return true;
163 }
164
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200165 return f10h_dc_mce(ec, xec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200166}
167
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200168static bool f14h_dc_mce(u16 ec, u8 xec)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200169{
Borislav Petkov62452882010-09-22 16:08:37 +0200170 u8 r4 = R4(ec);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200171 bool ret = true;
172
173 if (MEM_ERROR(ec)) {
174
Borislav Petkov62452882010-09-22 16:08:37 +0200175 if (TT(ec) != TT_DATA || LL(ec) != LL_L1)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200176 return false;
177
178 switch (r4) {
179 case R4_DRD:
180 case R4_DWR:
181 pr_cont("Data/Tag parity error due to %s.\n",
182 (r4 == R4_DRD ? "load/hw prf" : "store"));
183 break;
184 case R4_EVICT:
185 pr_cont("Copyback parity error on a tag miss.\n");
186 break;
187 case R4_SNOOP:
188 pr_cont("Tag parity error during snoop.\n");
189 break;
190 default:
191 ret = false;
192 }
193 } else if (BUS_ERROR(ec)) {
194
Borislav Petkov62452882010-09-22 16:08:37 +0200195 if ((II(ec) != II_MEM && II(ec) != II_IO) || LL(ec) != LL_LG)
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200196 return false;
197
198 pr_cont("System read data error on a ");
199
200 switch (r4) {
201 case R4_RD:
202 pr_cont("TLB reload.\n");
203 break;
204 case R4_DWR:
205 pr_cont("store.\n");
206 break;
207 case R4_DRD:
208 pr_cont("load.\n");
209 break;
210 default:
211 ret = false;
212 }
213 } else {
214 ret = false;
215 }
216
217 return ret;
218}
219
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200220static bool f15h_dc_mce(u16 ec, u8 xec)
221{
222 bool ret = true;
223
224 if (MEM_ERROR(ec)) {
225
226 switch (xec) {
227 case 0x0:
228 pr_cont("Data Array access error.\n");
229 break;
230
231 case 0x1:
232 pr_cont("UC error during a linefill from L2/NB.\n");
233 break;
234
235 case 0x2:
236 case 0x11:
237 pr_cont("STQ access error.\n");
238 break;
239
240 case 0x3:
241 pr_cont("SCB access error.\n");
242 break;
243
244 case 0x10:
245 pr_cont("Tag error.\n");
246 break;
247
248 case 0x12:
249 pr_cont("LDQ access error.\n");
250 break;
251
252 default:
253 ret = false;
254 }
255 } else if (BUS_ERROR(ec)) {
256
257 if (!xec)
258 pr_cont("during system linefill.\n");
259 else
260 pr_cont(" Internal %s condition.\n",
261 ((xec == 1) ? "livelock" : "deadlock"));
262 } else
263 ret = false;
264
265 return ret;
266}
267
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200268static void amd_decode_dc_mce(struct mce *m)
Borislav Petkov51966242009-07-28 13:50:43 +0200269{
Borislav Petkov62452882010-09-22 16:08:37 +0200270 u16 ec = EC(m->status);
271 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov51966242009-07-28 13:50:43 +0200272
Borislav Petkovc9f281f2010-08-18 18:21:42 +0200273 pr_emerg(HW_ERR "Data Cache Error: ");
Borislav Petkov51966242009-07-28 13:50:43 +0200274
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200275 /* TLB error signatures are the same across families */
276 if (TLB_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200277 if (TT(ec) == TT_DATA) {
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200278 pr_cont("%s TLB %s.\n", LL_MSG(ec),
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200279 ((xec == 2) ? "locked miss"
280 : (xec ? "multimatch" : "parity")));
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200281 return;
282 }
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200283 } else if (fam_ops->dc_mce(ec, xec))
284 ;
285 else
286 pr_emerg(HW_ERR "Corrupted DC MCE info?\n");
Borislav Petkov51966242009-07-28 13:50:43 +0200287}
288
Borislav Petkov86039cd2010-11-08 15:03:35 +0100289static bool k8_ic_mce(u16 ec, u8 xec)
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200290{
Borislav Petkov62452882010-09-22 16:08:37 +0200291 u8 ll = LL(ec);
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200292 bool ret = true;
293
294 if (!MEM_ERROR(ec))
295 return false;
296
297 if (ll == 0x2)
298 pr_cont("during a linefill from L2.\n");
299 else if (ll == 0x1) {
Borislav Petkov62452882010-09-22 16:08:37 +0200300 switch (R4(ec)) {
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200301 case R4_IRD:
302 pr_cont("Parity error during data load.\n");
303 break;
304
305 case R4_EVICT:
306 pr_cont("Copyback Parity/Victim error.\n");
307 break;
308
309 case R4_SNOOP:
310 pr_cont("Tag Snoop error.\n");
311 break;
312
313 default:
314 ret = false;
315 break;
316 }
317 } else
318 ret = false;
319
320 return ret;
321}
322
Borislav Petkov86039cd2010-11-08 15:03:35 +0100323static bool f14h_ic_mce(u16 ec, u8 xec)
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200324{
Borislav Petkov62452882010-09-22 16:08:37 +0200325 u8 r4 = R4(ec);
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200326 bool ret = true;
327
328 if (MEM_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200329 if (TT(ec) != 0 || LL(ec) != 1)
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200330 ret = false;
331
332 if (r4 == R4_IRD)
333 pr_cont("Data/tag array parity error for a tag hit.\n");
334 else if (r4 == R4_SNOOP)
335 pr_cont("Tag error during snoop/victimization.\n");
336 else
337 ret = false;
338 }
339 return ret;
340}
341
Borislav Petkov86039cd2010-11-08 15:03:35 +0100342static bool f15h_ic_mce(u16 ec, u8 xec)
343{
344 bool ret = true;
345
346 if (!MEM_ERROR(ec))
347 return false;
348
349 switch (xec) {
350 case 0x0 ... 0xa:
351 pr_cont("%s.\n", f15h_ic_mce_desc[xec]);
352 break;
353
354 case 0xd:
355 pr_cont("%s.\n", f15h_ic_mce_desc[xec-2]);
356 break;
357
358 case 0x10 ... 0x14:
359 pr_cont("Decoder %s parity error.\n", f15h_ic_mce_desc[xec-4]);
360 break;
361
362 default:
363 ret = false;
364 }
365 return ret;
366}
367
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200368static void amd_decode_ic_mce(struct mce *m)
Borislav Petkovab5535e2009-07-28 14:06:26 +0200369{
Borislav Petkov62452882010-09-22 16:08:37 +0200370 u16 ec = EC(m->status);
371 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovab5535e2009-07-28 14:06:26 +0200372
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200373 pr_emerg(HW_ERR "Instruction Cache Error: ");
Borislav Petkovab5535e2009-07-28 14:06:26 +0200374
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200375 if (TLB_ERROR(ec))
376 pr_cont("%s TLB %s.\n", LL_MSG(ec),
377 (xec ? "multimatch" : "parity error"));
378 else if (BUS_ERROR(ec)) {
Borislav Petkov525906b2010-10-15 15:27:02 +0200379 bool k8 = (boot_cpu_data.x86 == 0xf && (m->status & BIT_64(58)));
Borislav Petkovab5535e2009-07-28 14:06:26 +0200380
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200381 pr_cont("during %s.\n", (k8 ? "system linefill" : "NB data read"));
Borislav Petkov86039cd2010-11-08 15:03:35 +0100382 } else if (fam_ops->ic_mce(ec, xec))
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200383 ;
384 else
385 pr_emerg(HW_ERR "Corrupted IC MCE info?\n");
Borislav Petkovab5535e2009-07-28 14:06:26 +0200386}
387
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200388static void amd_decode_bu_mce(struct mce *m)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200389{
Borislav Petkov62452882010-09-22 16:08:37 +0200390 u16 ec = EC(m->status);
391 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200392
Borislav Petkovc9f281f2010-08-18 18:21:42 +0200393 pr_emerg(HW_ERR "Bus Unit Error");
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200394
395 if (xec == 0x1)
396 pr_cont(" in the write data buffers.\n");
397 else if (xec == 0x3)
398 pr_cont(" in the victim data buffers.\n");
399 else if (xec == 0x2 && MEM_ERROR(ec))
Borislav Petkov62452882010-09-22 16:08:37 +0200400 pr_cont(": %s error in the L2 cache tags.\n", R4_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200401 else if (xec == 0x0) {
402 if (TLB_ERROR(ec))
403 pr_cont(": %s error in a Page Descriptor Cache or "
404 "Guest TLB.\n", TT_MSG(ec));
405 else if (BUS_ERROR(ec))
406 pr_cont(": %s/ECC error in data read from NB: %s.\n",
Borislav Petkov62452882010-09-22 16:08:37 +0200407 R4_MSG(ec), PP_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200408 else if (MEM_ERROR(ec)) {
Borislav Petkov62452882010-09-22 16:08:37 +0200409 u8 r4 = R4(ec);
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200410
Borislav Petkov62452882010-09-22 16:08:37 +0200411 if (r4 >= 0x7)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200412 pr_cont(": %s error during data copyback.\n",
Borislav Petkov62452882010-09-22 16:08:37 +0200413 R4_MSG(ec));
414 else if (r4 <= 0x1)
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200415 pr_cont(": %s parity/ECC error during data "
Borislav Petkov62452882010-09-22 16:08:37 +0200416 "access from L2.\n", R4_MSG(ec));
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200417 else
418 goto wrong_bu_mce;
419 } else
420 goto wrong_bu_mce;
421 } else
422 goto wrong_bu_mce;
423
424 return;
425
426wrong_bu_mce:
Borislav Petkovc9f281f2010-08-18 18:21:42 +0200427 pr_emerg(HW_ERR "Corrupted BU MCE info?\n");
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200428}
429
Borislav Petkov70fdb492010-09-21 20:45:10 +0200430static void amd_decode_cu_mce(struct mce *m)
431{
Borislav Petkov62452882010-09-22 16:08:37 +0200432 u16 ec = EC(m->status);
433 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov70fdb492010-09-21 20:45:10 +0200434
435 pr_emerg(HW_ERR "Combined Unit Error: ");
436
437 if (TLB_ERROR(ec)) {
438 if (xec == 0x0)
439 pr_cont("Data parity TLB read error.\n");
440 else if (xec == 0x1)
441 pr_cont("Poison data provided for TLB fill.\n");
442 else
443 goto wrong_cu_mce;
444 } else if (BUS_ERROR(ec)) {
445 if (xec > 2)
446 goto wrong_cu_mce;
447
448 pr_cont("Error during attempted NB data read.\n");
449 } else if (MEM_ERROR(ec)) {
450 switch (xec) {
451 case 0x4 ... 0xc:
452 pr_cont("%s.\n", f15h_cu_mce_desc[xec - 0x4]);
453 break;
454
455 case 0x10 ... 0x14:
456 pr_cont("%s.\n", f15h_cu_mce_desc[xec - 0x7]);
457 break;
458
459 default:
460 goto wrong_cu_mce;
461 }
462 }
463
464 return;
465
466wrong_cu_mce:
467 pr_emerg(HW_ERR "Corrupted CU MCE info?\n");
468}
469
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200470static void amd_decode_ls_mce(struct mce *m)
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200471{
Borislav Petkov62452882010-09-22 16:08:37 +0200472 u16 ec = EC(m->status);
473 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovded50622010-08-27 17:03:34 +0200474
Borislav Petkovb18434c2010-09-22 11:53:32 +0200475 if (boot_cpu_data.x86 >= 0x14) {
Borislav Petkovded50622010-08-27 17:03:34 +0200476 pr_emerg("You shouldn't be seeing an LS MCE on this cpu family,"
477 " please report on LKML.\n");
478 return;
479 }
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200480
Borislav Petkovc9f281f2010-08-18 18:21:42 +0200481 pr_emerg(HW_ERR "Load Store Error");
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200482
483 if (xec == 0x0) {
Borislav Petkov62452882010-09-22 16:08:37 +0200484 u8 r4 = R4(ec);
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200485
Borislav Petkovded50622010-08-27 17:03:34 +0200486 if (!BUS_ERROR(ec) || (r4 != R4_DRD && r4 != R4_DWR))
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200487 goto wrong_ls_mce;
488
Borislav Petkov62452882010-09-22 16:08:37 +0200489 pr_cont(" during %s.\n", R4_MSG(ec));
Borislav Petkovded50622010-08-27 17:03:34 +0200490 } else
491 goto wrong_ls_mce;
492
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200493 return;
494
495wrong_ls_mce:
Borislav Petkovc9f281f2010-08-18 18:21:42 +0200496 pr_emerg(HW_ERR "Corrupted LS MCE info?\n");
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200497}
498
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200499static bool k8_nb_mce(u16 ec, u8 xec)
500{
501 bool ret = true;
502
503 switch (xec) {
504 case 0x1:
505 pr_cont("CRC error detected on HT link.\n");
506 break;
507
508 case 0x5:
509 pr_cont("Invalid GART PTE entry during GART table walk.\n");
510 break;
511
512 case 0x6:
513 pr_cont("Unsupported atomic RMW received from an IO link.\n");
514 break;
515
516 case 0x0:
517 case 0x8:
Borislav Petkovf0157b32010-10-05 19:07:16 +0200518 if (boot_cpu_data.x86 == 0x11)
519 return false;
520
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200521 pr_cont("DRAM ECC error detected on the NB.\n");
522 break;
523
524 case 0xd:
525 pr_cont("Parity error on the DRAM addr/ctl signals.\n");
526 break;
527
528 default:
529 ret = false;
530 break;
531 }
532
533 return ret;
534}
535
536static bool f10h_nb_mce(u16 ec, u8 xec)
537{
538 bool ret = true;
539 u8 offset = 0;
540
541 if (k8_nb_mce(ec, xec))
542 return true;
543
544 switch(xec) {
545 case 0xa ... 0xc:
546 offset = 10;
547 break;
548
549 case 0xe:
550 offset = 11;
551 break;
552
553 case 0xf:
554 if (TLB_ERROR(ec))
555 pr_cont("GART Table Walk data error.\n");
556 else if (BUS_ERROR(ec))
557 pr_cont("DMA Exclusion Vector Table Walk error.\n");
558 else
559 ret = false;
560
561 goto out;
562 break;
563
Borislav Petkov05cd6672010-09-22 15:06:24 +0200564 case 0x19:
565 if (boot_cpu_data.x86 == 0x15)
566 pr_cont("Compute Unit Data Error.\n");
567 else
568 ret = false;
569
570 goto out;
571 break;
572
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200573 case 0x1c ... 0x1f:
574 offset = 24;
575 break;
576
577 default:
578 ret = false;
579
580 goto out;
581 break;
582 }
583
584 pr_cont("%s.\n", f10h_nb_mce_desc[xec - offset]);
585
586out:
587 return ret;
588}
589
Borislav Petkovcb9d5ec2010-09-16 17:36:12 +0200590static bool nb_noop_mce(u16 ec, u8 xec)
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200591{
592 return false;
593}
594
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200595void amd_decode_nb_mce(int node_id, struct mce *m, u32 nbcfg)
Borislav Petkov549d0422009-07-24 13:51:42 +0200596{
Borislav Petkovdf71a052011-01-19 18:15:10 +0100597 struct cpuinfo_x86 *c = &boot_cpu_data;
Borislav Petkov62452882010-09-22 16:08:37 +0200598 u16 ec = EC(m->status);
599 u8 xec = XEC(m->status, 0x1f);
Borislav Petkov549d0422009-07-24 13:51:42 +0200600
Borislav Petkov295d8cd2011-08-24 17:47:11 +0200601 pr_emerg(HW_ERR "Northbridge Error (node %d): ", node_id);
Borislav Petkov6d5db462010-11-25 15:40:27 +0100602
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200603 switch (xec) {
604 case 0x2:
605 pr_cont("Sync error (sync packets on HT link detected).\n");
606 return;
Borislav Petkovd93cc222009-07-28 10:56:15 +0200607
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200608 case 0x3:
609 pr_cont("HT Master abort.\n");
610 return;
611
612 case 0x4:
613 pr_cont("HT Target abort.\n");
614 return;
615
616 case 0x7:
617 pr_cont("NB Watchdog timeout.\n");
618 return;
619
620 case 0x9:
621 pr_cont("SVM DMA Exclusion Vector error.\n");
622 return;
623
624 default:
625 break;
626 }
627
628 if (!fam_ops->nb_mce(ec, xec))
629 goto wrong_nb_mce;
630
Borislav Petkovdf71a052011-01-19 18:15:10 +0100631 if (c->x86 == 0xf || c->x86 == 0x10 || c->x86 == 0x15)
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200632 if ((xec == 0x8 || xec == 0x0) && nb_bus_decoder)
633 nb_bus_decoder(node_id, m, nbcfg);
634
635 return;
636
637wrong_nb_mce:
638 pr_emerg(HW_ERR "Corrupted NB MCE info?\n");
Borislav Petkovd93cc222009-07-28 10:56:15 +0200639}
640EXPORT_SYMBOL_GPL(amd_decode_nb_mce);
641
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200642static void amd_decode_fr_mce(struct mce *m)
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200643{
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200644 struct cpuinfo_x86 *c = &boot_cpu_data;
Borislav Petkov62452882010-09-22 16:08:37 +0200645 u8 xec = XEC(m->status, xec_mask);
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200646
647 if (c->x86 == 0xf || c->x86 == 0x11)
Borislav Petkovfe4ea262010-08-31 18:38:24 +0200648 goto wrong_fr_mce;
649
Borislav Petkov8259a7e2010-09-22 15:28:59 +0200650 if (c->x86 != 0x15 && xec != 0x0)
651 goto wrong_fr_mce;
652
653 pr_emerg(HW_ERR "%s Error: ",
654 (c->x86 == 0x15 ? "Execution Unit" : "FIROB"));
655
656 if (xec == 0x0 || xec == 0xc)
657 pr_cont("%s.\n", fr_ex_mce_desc[xec]);
658 else if (xec < 0xd)
659 pr_cont("%s parity error.\n", fr_ex_mce_desc[xec]);
660 else
661 goto wrong_fr_mce;
662
663 return;
Borislav Petkovfe4ea262010-08-31 18:38:24 +0200664
665wrong_fr_mce:
666 pr_emerg(HW_ERR "Corrupted FR MCE info?\n");
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200667}
668
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200669static void amd_decode_fp_mce(struct mce *m)
670{
Borislav Petkov62452882010-09-22 16:08:37 +0200671 u8 xec = XEC(m->status, xec_mask);
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200672
673 pr_emerg(HW_ERR "Floating Point Unit Error: ");
674
675 switch (xec) {
676 case 0x1:
677 pr_cont("Free List");
678 break;
679
680 case 0x2:
681 pr_cont("Physical Register File");
682 break;
683
684 case 0x3:
685 pr_cont("Retire Queue");
686 break;
687
688 case 0x4:
689 pr_cont("Scheduler table");
690 break;
691
692 case 0x5:
693 pr_cont("Status Register File");
694 break;
695
696 default:
697 goto wrong_fp_mce;
698 break;
699 }
700
701 pr_cont(" parity error.\n");
702
703 return;
704
705wrong_fp_mce:
706 pr_emerg(HW_ERR "Corrupted FP MCE info?\n");
707}
708
Borislav Petkov63375832010-09-06 18:13:39 +0200709static inline void amd_decode_err_code(u16 ec)
Borislav Petkovd93cc222009-07-28 10:56:15 +0200710{
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +0200711
712 pr_emerg(HW_ERR "cache level: %s", LL_MSG(ec));
713
714 if (BUS_ERROR(ec))
715 pr_cont(", mem/io: %s", II_MSG(ec));
716 else
717 pr_cont(", tx: %s", TT_MSG(ec));
718
719 if (MEM_ERROR(ec) || BUS_ERROR(ec)) {
720 pr_cont(", mem-tx: %s", R4_MSG(ec));
721
722 if (BUS_ERROR(ec))
723 pr_cont(", part-proc: %s (%s)", PP_MSG(ec), TO_MSG(ec));
724 }
725
726 pr_cont("\n");
Borislav Petkov549d0422009-07-24 13:51:42 +0200727}
Borislav Petkov549d0422009-07-24 13:51:42 +0200728
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200729/*
730 * Filter out unwanted MCE signatures here.
731 */
732static bool amd_filter_mce(struct mce *m)
733{
734 u8 xec = (m->status >> 16) & 0x1f;
735
736 /*
737 * NB GART TLB error reporting is disabled by default.
738 */
739 if (m->bank == 4 && xec == 0x5 && !report_gart_errors)
740 return true;
741
742 return false;
743}
744
Borislav Petkov9cdeb402010-09-02 18:33:24 +0200745int amd_decode_mce(struct notifier_block *nb, unsigned long val, void *data)
Borislav Petkov549d0422009-07-24 13:51:42 +0200746{
Borislav Petkovfb253192009-10-07 13:20:38 +0200747 struct mce *m = (struct mce *)data;
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +0200748 struct cpuinfo_x86 *c = &boot_cpu_data;
Borislav Petkovb69b29d2009-07-27 16:21:14 +0200749 int node, ecc;
Borislav Petkov549d0422009-07-24 13:51:42 +0200750
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200751 if (amd_filter_mce(m))
752 return NOTIFY_STOP;
753
Borislav Petkov086be782011-09-30 16:34:44 +0200754 pr_emerg(HW_ERR "CPU:%d\tMC%d_STATUS[%s|%s|%s|%s|%s",
Borislav Petkovbff7b812011-08-04 19:25:24 +0200755 m->extcpu, m->bank,
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +0200756 ((m->status & MCI_STATUS_OVER) ? "Over" : "-"),
757 ((m->status & MCI_STATUS_UC) ? "UE" : "CE"),
758 ((m->status & MCI_STATUS_MISCV) ? "MiscV" : "-"),
759 ((m->status & MCI_STATUS_PCC) ? "PCC" : "-"),
760 ((m->status & MCI_STATUS_ADDRV) ? "AddrV" : "-"));
Borislav Petkov549d0422009-07-24 13:51:42 +0200761
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +0200762 if (c->x86 == 0x15)
763 pr_cont("|%s|%s",
Randy Dunlap50adbbd2010-11-13 11:44:26 -0500764 ((m->status & BIT_64(44)) ? "Deferred" : "-"),
765 ((m->status & BIT_64(43)) ? "Poison" : "-"));
Borislav Petkov549d0422009-07-24 13:51:42 +0200766
Borislav Petkovb69b29d2009-07-27 16:21:14 +0200767 /* do the two bits[14:13] together */
Borislav Petkov35d824b2010-04-30 15:19:02 +0200768 ecc = (m->status >> 45) & 0x3;
Borislav Petkovb69b29d2009-07-27 16:21:14 +0200769 if (ecc)
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +0200770 pr_cont("|%sECC", ((ecc == 2) ? "C" : "U"));
Borislav Petkovb69b29d2009-07-27 16:21:14 +0200771
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +0200772 pr_cont("]: 0x%016llx\n", m->status);
773
Borislav Petkov086be782011-09-30 16:34:44 +0200774 if (m->status & MCI_STATUS_ADDRV)
775 pr_emerg(HW_ERR "\tMC%d_ADDR: 0x%016llx\n", m->bank, m->addr);
Borislav Petkovb69b29d2009-07-27 16:21:14 +0200776
Borislav Petkov51966242009-07-28 13:50:43 +0200777 switch (m->bank) {
778 case 0:
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200779 amd_decode_dc_mce(m);
Borislav Petkov51966242009-07-28 13:50:43 +0200780 break;
Borislav Petkovd93cc222009-07-28 10:56:15 +0200781
Borislav Petkovab5535e2009-07-28 14:06:26 +0200782 case 1:
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200783 amd_decode_ic_mce(m);
Borislav Petkovab5535e2009-07-28 14:06:26 +0200784 break;
785
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200786 case 2:
Borislav Petkovfa7ae8c2010-09-22 17:42:27 +0200787 if (c->x86 == 0x15)
Borislav Petkov70fdb492010-09-21 20:45:10 +0200788 amd_decode_cu_mce(m);
789 else
790 amd_decode_bu_mce(m);
Borislav Petkov56cad2d2009-07-28 14:14:24 +0200791 break;
792
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200793 case 3:
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200794 amd_decode_ls_mce(m);
Borislav Petkovf9350ef2009-07-28 14:17:30 +0200795 break;
796
Borislav Petkov51966242009-07-28 13:50:43 +0200797 case 4:
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200798 node = amd_get_nb_id(m->extcpu);
799 amd_decode_nb_mce(node, m, 0);
Borislav Petkov51966242009-07-28 13:50:43 +0200800 break;
801
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200802 case 5:
Borislav Petkov7cfd4a82010-09-01 14:45:20 +0200803 amd_decode_fr_mce(m);
Borislav Petkov53bd5fe2009-07-28 14:20:46 +0200804 break;
805
Borislav Petkovb8f85c42010-09-22 15:37:58 +0200806 case 6:
807 amd_decode_fp_mce(m);
808 break;
809
Borislav Petkov51966242009-07-28 13:50:43 +0200810 default:
811 break;
Borislav Petkovb69b29d2009-07-27 16:21:14 +0200812 }
Borislav Petkov51966242009-07-28 13:50:43 +0200813
814 amd_decode_err_code(m->status & 0xffff);
Borislav Petkovfb253192009-10-07 13:20:38 +0200815
816 return NOTIFY_STOP;
Borislav Petkov549d0422009-07-24 13:51:42 +0200817}
Borislav Petkov9cdeb402010-09-02 18:33:24 +0200818EXPORT_SYMBOL_GPL(amd_decode_mce);
Ingo Molnarf436f8b2009-10-01 16:14:32 +0200819
Borislav Petkovfb253192009-10-07 13:20:38 +0200820static struct notifier_block amd_mce_dec_nb = {
821 .notifier_call = amd_decode_mce,
822};
823
Ingo Molnarf436f8b2009-10-01 16:14:32 +0200824static int __init mce_amd_init(void)
825{
Borislav Petkovbad11e02010-09-22 17:44:51 +0200826 struct cpuinfo_x86 *c = &boot_cpu_data;
827
828 if (c->x86_vendor != X86_VENDOR_AMD)
Borislav Petkove045c292010-08-06 18:55:45 +0200829 return 0;
830
Borislav Petkovbad11e02010-09-22 17:44:51 +0200831 if ((c->x86 < 0xf || c->x86 > 0x12) &&
832 (c->x86 != 0x14 || c->x86_model > 0xf) &&
833 (c->x86 != 0x15 || c->x86_model > 0xf))
Borislav Petkove045c292010-08-06 18:55:45 +0200834 return 0;
835
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200836 fam_ops = kzalloc(sizeof(struct amd_decoder_ops), GFP_KERNEL);
837 if (!fam_ops)
838 return -ENOMEM;
839
Borislav Petkovbad11e02010-09-22 17:44:51 +0200840 switch (c->x86) {
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200841 case 0xf:
842 fam_ops->dc_mce = k8_dc_mce;
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200843 fam_ops->ic_mce = k8_ic_mce;
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200844 fam_ops->nb_mce = k8_nb_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200845 break;
846
847 case 0x10:
848 fam_ops->dc_mce = f10h_dc_mce;
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200849 fam_ops->ic_mce = k8_ic_mce;
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200850 fam_ops->nb_mce = f10h_nb_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200851 break;
852
Borislav Petkovf0157b32010-10-05 19:07:16 +0200853 case 0x11:
854 fam_ops->dc_mce = k8_dc_mce;
855 fam_ops->ic_mce = k8_ic_mce;
856 fam_ops->nb_mce = f10h_nb_mce;
857 break;
858
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200859 case 0x12:
860 fam_ops->dc_mce = f12h_dc_mce;
Borislav Petkove7281eb2010-09-16 16:45:22 +0200861 fam_ops->ic_mce = k8_ic_mce;
Borislav Petkovcb9d5ec2010-09-16 17:36:12 +0200862 fam_ops->nb_mce = nb_noop_mce;
Borislav Petkov9be0bb12010-09-16 15:08:14 +0200863 break;
864
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200865 case 0x14:
Borislav Petkov5ce88f62010-08-31 18:28:08 +0200866 nb_err_cpumask = 0x3;
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200867 fam_ops->dc_mce = f14h_dc_mce;
Borislav Petkovdd53bce2010-08-26 19:05:49 +0200868 fam_ops->ic_mce = f14h_ic_mce;
Borislav Petkovcb9d5ec2010-09-16 17:36:12 +0200869 fam_ops->nb_mce = nb_noop_mce;
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200870 break;
871
Borislav Petkov2be64bf2010-09-17 19:11:47 +0200872 case 0x15:
873 xec_mask = 0x1f;
Borislav Petkov25a4f8b2010-09-17 19:22:34 +0200874 fam_ops->dc_mce = f15h_dc_mce;
Borislav Petkov86039cd2010-11-08 15:03:35 +0100875 fam_ops->ic_mce = f15h_ic_mce;
Borislav Petkov05cd6672010-09-22 15:06:24 +0200876 fam_ops->nb_mce = f10h_nb_mce;
Borislav Petkov2be64bf2010-09-17 19:11:47 +0200877 break;
878
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200879 default:
Borislav Petkovbad11e02010-09-22 17:44:51 +0200880 printk(KERN_WARNING "Huh? What family is that: %d?!\n", c->x86);
Borislav Petkov888ab8e2010-08-18 15:11:35 +0200881 kfree(fam_ops);
882 return -EINVAL;
883 }
884
Borislav Petkov9530d602010-09-06 15:05:45 +0200885 pr_info("MCE: In-kernel MCE decoding enabled.\n");
886
Borislav Petkove045c292010-08-06 18:55:45 +0200887 atomic_notifier_chain_register(&x86_mce_decoder_chain, &amd_mce_dec_nb);
Ingo Molnarf436f8b2009-10-01 16:14:32 +0200888
889 return 0;
890}
891early_initcall(mce_amd_init);
Borislav Petkov0d18b2e2009-10-02 15:31:48 +0200892
#ifdef MODULE
/*
 * Module teardown: detach the decoder from x86_mce_decoder_chain first,
 * then release the per-family callback table.
 */
static void __exit mce_amd_exit(void)
{
	atomic_notifier_chain_unregister(&x86_mce_decoder_chain, &amd_mce_dec_nb);
	kfree(fam_ops);
}

MODULE_DESCRIPTION("AMD MCE decoder");
MODULE_ALIAS("edac-mce-amd");
MODULE_LICENSE("GPL");
module_exit(mce_amd_exit);
#endif