blob: b10b45cc787082569f060e12b7906f02beb1b3d7 [file] [log] [blame]
Alan Coxda9bb1d2006-01-18 17:44:13 -08001/*
2 * edac_mc kernel module
Doug Thompson49c0dab72006-07-10 04:45:19 -07003 * (C) 2005, 2006 Linux Networx (http://lnxi.com)
Alan Coxda9bb1d2006-01-18 17:44:13 -08004 * This file may be distributed under the terms of the
5 * GNU General Public License.
6 *
7 * Written by Thayne Harbaugh
8 * Based on work by Dan Hollis <goemon at anime dot net> and others.
9 * http://www.anime.net/~goemon/linux-ecc/
10 *
11 * Modified by Dave Peterson and Doug Thompson
12 *
13 */
14
Alan Coxda9bb1d2006-01-18 17:44:13 -080015#include <linux/module.h>
16#include <linux/proc_fs.h>
17#include <linux/kernel.h>
18#include <linux/types.h>
19#include <linux/smp.h>
20#include <linux/init.h>
21#include <linux/sysctl.h>
22#include <linux/highmem.h>
23#include <linux/timer.h>
24#include <linux/slab.h>
25#include <linux/jiffies.h>
26#include <linux/spinlock.h>
27#include <linux/list.h>
28#include <linux/sysdev.h>
29#include <linux/ctype.h>
Dave Jiangc0d12172007-07-19 01:49:46 -070030#include <linux/edac.h>
Alan Coxda9bb1d2006-01-18 17:44:13 -080031#include <asm/uaccess.h>
32#include <asm/page.h>
33#include <asm/edac.h>
Douglas Thompson20bcb7a2007-07-19 01:49:47 -070034#include "edac_core.h"
Douglas Thompson7c9281d2007-07-19 01:49:33 -070035#include "edac_module.h"
Alan Coxda9bb1d2006-01-18 17:44:13 -080036
Alan Coxda9bb1d2006-01-18 17:44:13 -080037/* lock to memory controller's control array */
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -070038static DEFINE_MUTEX(mem_ctls_mutex);
Robert P. J. Dayff6ac2a2008-04-29 01:03:17 -070039static LIST_HEAD(mc_devices);
Alan Coxda9bb1d2006-01-18 17:44:13 -080040
Alan Coxda9bb1d2006-01-18 17:44:13 -080041#ifdef CONFIG_EDAC_DEBUG
42
Adrian Bunk2da1c112007-07-19 01:49:32 -070043static void edac_mc_dump_channel(struct channel_info *chan)
Alan Coxda9bb1d2006-01-18 17:44:13 -080044{
45 debugf4("\tchannel = %p\n", chan);
46 debugf4("\tchannel->chan_idx = %d\n", chan->chan_idx);
47 debugf4("\tchannel->ce_count = %d\n", chan->ce_count);
48 debugf4("\tchannel->label = '%s'\n", chan->label);
49 debugf4("\tchannel->csrow = %p\n\n", chan->csrow);
50}
51
Adrian Bunk2da1c112007-07-19 01:49:32 -070052static void edac_mc_dump_csrow(struct csrow_info *csrow)
Alan Coxda9bb1d2006-01-18 17:44:13 -080053{
54 debugf4("\tcsrow = %p\n", csrow);
55 debugf4("\tcsrow->csrow_idx = %d\n", csrow->csrow_idx);
Douglas Thompson079708b2007-07-19 01:49:58 -070056 debugf4("\tcsrow->first_page = 0x%lx\n", csrow->first_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -080057 debugf4("\tcsrow->last_page = 0x%lx\n", csrow->last_page);
58 debugf4("\tcsrow->page_mask = 0x%lx\n", csrow->page_mask);
59 debugf4("\tcsrow->nr_pages = 0x%x\n", csrow->nr_pages);
Douglas Thompson079708b2007-07-19 01:49:58 -070060 debugf4("\tcsrow->nr_channels = %d\n", csrow->nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -080061 debugf4("\tcsrow->channels = %p\n", csrow->channels);
62 debugf4("\tcsrow->mci = %p\n\n", csrow->mci);
63}
64
Adrian Bunk2da1c112007-07-19 01:49:32 -070065static void edac_mc_dump_mci(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -080066{
67 debugf3("\tmci = %p\n", mci);
68 debugf3("\tmci->mtype_cap = %lx\n", mci->mtype_cap);
69 debugf3("\tmci->edac_ctl_cap = %lx\n", mci->edac_ctl_cap);
70 debugf3("\tmci->edac_cap = %lx\n", mci->edac_cap);
71 debugf4("\tmci->edac_check = %p\n", mci->edac_check);
72 debugf3("\tmci->nr_csrows = %d, csrows = %p\n",
73 mci->nr_csrows, mci->csrows);
Doug Thompson37f04582006-06-30 01:56:07 -070074 debugf3("\tdev = %p\n", mci->dev);
Douglas Thompson079708b2007-07-19 01:49:58 -070075 debugf3("\tmod_name:ctl_name = %s:%s\n", mci->mod_name, mci->ctl_name);
Alan Coxda9bb1d2006-01-18 17:44:13 -080076 debugf3("\tpvt_info = %p\n\n", mci->pvt_info);
77}
78
/*
 * Human-readable names for memory types, one string per entry.
 * The order of the entries must be kept in sync with enum mem_type.
 */
const char *edac_mem_types[] = {
	"Empty csrow",
	"Reserved csrow type",
	"Unknown csrow type",
	"Fast page mode RAM",
	"Extended data out RAM",
	"Burst Extended data out RAM",
	"Single data rate SDRAM",
	"Registered single data rate SDRAM",
	"Double data rate SDRAM",
	"Registered Double data rate SDRAM",
	"Rambus DRAM",
	"Unbuffered DDR2 RAM",
	"Fully buffered DDR2",
	"Registered DDR2 RAM",
	"Rambus XDR",
	"Unbuffered DDR3 RAM",
	"Registered DDR3 RAM",
};
EXPORT_SYMBOL_GPL(edac_mem_types);
102
Douglas Thompson079708b2007-07-19 01:49:58 -0700103#endif /* CONFIG_EDAC_DEBUG */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800104
/**
 * edac_align_ptr - round a pointer up so an item of a given size can live there
 * @ptr:  possibly unaligned address at which an item X is to be placed
 * @size: sizeof(X)
 *
 * The required alignment is derived from @size: items larger than a long
 * get the alignment of a "long long", items larger than an int that of a
 * long, and so on down to single bytes, which need no alignment at all.
 * This assumes that "long long" has the most stringent alignment the
 * compiler provides by default.
 *
 * The decision whether to adjust is made on the ADDRESS held in @ptr, not
 * on @size: an item whose size is a multiple of its alignment can still sit
 * at a misaligned address, and an item of odd size can already be aligned.
 *
 * If @size is a constant, the compiler can reduce the selection of the
 * alignment to a constant.
 *
 * Returns @ptr itself when it is already suitably aligned, otherwise the
 * next higher address that is a multiple of the chosen alignment.
 */
void *edac_align_ptr(void *ptr, unsigned size)
{
	unsigned long addr = (unsigned long)ptr;
	unsigned align, r;

	if (size > sizeof(long))
		align = sizeof(long long);
	else if (size > sizeof(int))
		align = sizeof(long);
	else if (size > sizeof(short))
		align = sizeof(int);
	else if (size > sizeof(char))
		align = sizeof(short);
	else
		return ptr;

	/* distance of the address past the previous alignment boundary */
	r = addr % align;

	if (r == 0)
		return ptr;

	return (void *)(addr + align - r);
}
138
Alan Coxda9bb1d2006-01-18 17:44:13 -0800139/**
140 * edac_mc_alloc: Allocate a struct mem_ctl_info structure
141 * @size_pvt: size of private storage needed
142 * @nr_csrows: Number of CWROWS needed for this MC
143 * @nr_chans: Number of channels for the MC
144 *
145 * Everything is kmalloc'ed as one big chunk - more efficient.
146 * Only can be used if all structures have the same lifetime - otherwise
147 * you have to allocate and initialize your own structures.
148 *
149 * Use edac_mc_free() to free mc structures allocated by this function.
150 *
151 * Returns:
152 * NULL allocation failed
153 * struct mem_ctl_info pointer
154 */
155struct mem_ctl_info *edac_mc_alloc(unsigned sz_pvt, unsigned nr_csrows,
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700156 unsigned nr_chans, int edac_index)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800157{
158 struct mem_ctl_info *mci;
159 struct csrow_info *csi, *csrow;
160 struct channel_info *chi, *chp, *chan;
161 void *pvt;
162 unsigned size;
163 int row, chn;
Doug Thompson8096cfa2007-07-19 01:50:27 -0700164 int err;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800165
166 /* Figure out the offsets of the various items from the start of an mc
167 * structure. We want the alignment of each item to be at least as
168 * stringent as what the compiler would provide if we could simply
169 * hardcode everything into a single struct.
170 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700171 mci = (struct mem_ctl_info *)0;
Douglas Thompson7391c6d2007-07-19 01:50:21 -0700172 csi = edac_align_ptr(&mci[1], sizeof(*csi));
173 chi = edac_align_ptr(&csi[nr_csrows], sizeof(*chi));
Douglas Thompsone27e3da2007-07-19 01:49:36 -0700174 pvt = edac_align_ptr(&chi[nr_chans * nr_csrows], sz_pvt);
Douglas Thompson079708b2007-07-19 01:49:58 -0700175 size = ((unsigned long)pvt) + sz_pvt;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800176
Doug Thompson8096cfa2007-07-19 01:50:27 -0700177 mci = kzalloc(size, GFP_KERNEL);
178 if (mci == NULL)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800179 return NULL;
180
181 /* Adjust pointers so they point within the memory we just allocated
182 * rather than an imaginary chunk of memory located at address 0.
183 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700184 csi = (struct csrow_info *)(((char *)mci) + ((unsigned long)csi));
185 chi = (struct channel_info *)(((char *)mci) + ((unsigned long)chi));
186 pvt = sz_pvt ? (((char *)mci) + ((unsigned long)pvt)) : NULL;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800187
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700188 /* setup index and various internal pointers */
189 mci->mc_idx = edac_index;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800190 mci->csrows = csi;
191 mci->pvt_info = pvt;
192 mci->nr_csrows = nr_csrows;
193
194 for (row = 0; row < nr_csrows; row++) {
195 csrow = &csi[row];
196 csrow->csrow_idx = row;
197 csrow->mci = mci;
198 csrow->nr_channels = nr_chans;
199 chp = &chi[row * nr_chans];
200 csrow->channels = chp;
201
202 for (chn = 0; chn < nr_chans; chn++) {
203 chan = &chp[chn];
204 chan->chan_idx = chn;
205 chan->csrow = csrow;
206 }
207 }
208
Dave Jiang81d87cb2007-07-19 01:49:52 -0700209 mci->op_state = OP_ALLOC;
Mauro Carvalho Chehab6fe11082010-08-12 00:30:25 -0300210 INIT_LIST_HEAD(&mci->grp_kobj_list);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700211
Doug Thompson8096cfa2007-07-19 01:50:27 -0700212 /*
213 * Initialize the 'root' kobj for the edac_mc controller
214 */
215 err = edac_mc_register_sysfs_main_kobj(mci);
216 if (err) {
217 kfree(mci);
218 return NULL;
219 }
220
221 /* at this point, the root kobj is valid, and in order to
222 * 'free' the object, then the function:
223 * edac_mc_unregister_sysfs_main_kobj() must be called
224 * which will perform kobj unregistration and the actual free
225 * will occur during the kobject callback operation
226 */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800227 return mci;
228}
Dave Peterson91105402006-03-26 01:38:55 -0800229EXPORT_SYMBOL_GPL(edac_mc_alloc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800230
/**
 * edac_mc_free: 'Free' a previously allocated 'mci' structure
 * @mci: pointer to a struct mem_ctl_info structure
 *
 * Nothing is released here directly; the work is handed to
 * edac_mc_unregister_sysfs_main_kobj().
 */
void edac_mc_free(struct mem_ctl_info *mci)
{
	edac_mc_unregister_sysfs_main_kobj(mci);
}
EXPORT_SYMBOL_GPL(edac_mc_free);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800241
Doug Thompsonbce19682007-07-26 10:41:14 -0700242
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300243/**
Doug Thompsonbce19682007-07-26 10:41:14 -0700244 * find_mci_by_dev
245 *
246 * scan list of controllers looking for the one that manages
247 * the 'dev' device
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300248 * @dev: pointer to a struct device related with the MCI
Doug Thompsonbce19682007-07-26 10:41:14 -0700249 */
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300250struct mem_ctl_info *find_mci_by_dev(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800251{
252 struct mem_ctl_info *mci;
253 struct list_head *item;
254
Dave Peterson537fba22006-03-26 01:38:40 -0800255 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800256
257 list_for_each(item, &mc_devices) {
258 mci = list_entry(item, struct mem_ctl_info, link);
259
Doug Thompson37f04582006-06-30 01:56:07 -0700260 if (mci->dev == dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800261 return mci;
262 }
263
264 return NULL;
265}
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300266EXPORT_SYMBOL_GPL(find_mci_by_dev);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800267
Dave Jiang81d87cb2007-07-19 01:49:52 -0700268/*
269 * handler for EDAC to check if NMI type handler has asserted interrupt
270 */
271static int edac_mc_assert_error_check_and_clear(void)
272{
Dave Jiang66ee2f92007-07-19 01:49:54 -0700273 int old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700274
Douglas Thompson079708b2007-07-19 01:49:58 -0700275 if (edac_op_state == EDAC_OPSTATE_POLL)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700276 return 1;
277
Dave Jiang66ee2f92007-07-19 01:49:54 -0700278 old_state = edac_err_assert;
279 edac_err_assert = 0;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700280
Dave Jiang66ee2f92007-07-19 01:49:54 -0700281 return old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700282}
283
284/*
285 * edac_mc_workq_function
286 * performs the operation scheduled by a workq request
287 */
Dave Jiang81d87cb2007-07-19 01:49:52 -0700288static void edac_mc_workq_function(struct work_struct *work_req)
289{
Jean Delvarefbeb4382009-04-13 14:40:21 -0700290 struct delayed_work *d_work = to_delayed_work(work_req);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700291 struct mem_ctl_info *mci = to_edac_mem_ctl_work(d_work);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700292
293 mutex_lock(&mem_ctls_mutex);
294
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700295 /* if this control struct has movd to offline state, we are done */
296 if (mci->op_state == OP_OFFLINE) {
297 mutex_unlock(&mem_ctls_mutex);
298 return;
299 }
300
Dave Jiang81d87cb2007-07-19 01:49:52 -0700301 /* Only poll controllers that are running polled and have a check */
302 if (edac_mc_assert_error_check_and_clear() && (mci->edac_check != NULL))
303 mci->edac_check(mci);
304
Dave Jiang81d87cb2007-07-19 01:49:52 -0700305 mutex_unlock(&mem_ctls_mutex);
306
307 /* Reschedule */
Dave Jiang4de78c62007-07-19 01:49:54 -0700308 queue_delayed_work(edac_workqueue, &mci->work,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700309 msecs_to_jiffies(edac_mc_get_poll_msec()));
Dave Jiang81d87cb2007-07-19 01:49:52 -0700310}
311
312/*
313 * edac_mc_workq_setup
314 * initialize a workq item for this mci
315 * passing in the new delay period in msec
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700316 *
317 * locking model:
318 *
319 * called with the mem_ctls_mutex held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700320 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700321static void edac_mc_workq_setup(struct mem_ctl_info *mci, unsigned msec)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700322{
323 debugf0("%s()\n", __func__);
324
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700325 /* if this instance is not in the POLL state, then simply return */
326 if (mci->op_state != OP_RUNNING_POLL)
327 return;
328
Dave Jiang81d87cb2007-07-19 01:49:52 -0700329 INIT_DELAYED_WORK(&mci->work, edac_mc_workq_function);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700330 queue_delayed_work(edac_workqueue, &mci->work, msecs_to_jiffies(msec));
331}
332
333/*
334 * edac_mc_workq_teardown
335 * stop the workq processing on this mci
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700336 *
337 * locking model:
338 *
339 * called WITHOUT lock held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700340 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700341static void edac_mc_workq_teardown(struct mem_ctl_info *mci)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700342{
343 int status;
344
Borislav Petkov00740c52010-09-26 12:42:23 +0200345 if (mci->op_state != OP_RUNNING_POLL)
346 return;
347
Doug Thompsonbce19682007-07-26 10:41:14 -0700348 status = cancel_delayed_work(&mci->work);
349 if (status == 0) {
350 debugf0("%s() not canceled, flush the queue\n",
351 __func__);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700352
Doug Thompsonbce19682007-07-26 10:41:14 -0700353 /* workq instance might be running, wait for it */
354 flush_workqueue(edac_workqueue);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700355 }
356}
357
358/*
Doug Thompsonbce19682007-07-26 10:41:14 -0700359 * edac_mc_reset_delay_period(unsigned long value)
360 *
361 * user space has updated our poll period value, need to
362 * reset our workq delays
Dave Jiang81d87cb2007-07-19 01:49:52 -0700363 */
Doug Thompsonbce19682007-07-26 10:41:14 -0700364void edac_mc_reset_delay_period(int value)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700365{
Doug Thompsonbce19682007-07-26 10:41:14 -0700366 struct mem_ctl_info *mci;
367 struct list_head *item;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700368
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700369 mutex_lock(&mem_ctls_mutex);
370
Doug Thompsonbce19682007-07-26 10:41:14 -0700371 /* scan the list and turn off all workq timers, doing so under lock
372 */
373 list_for_each(item, &mc_devices) {
374 mci = list_entry(item, struct mem_ctl_info, link);
375
376 if (mci->op_state == OP_RUNNING_POLL)
377 cancel_delayed_work(&mci->work);
378 }
379
380 mutex_unlock(&mem_ctls_mutex);
381
382
383 /* re-walk the list, and reset the poll delay */
384 mutex_lock(&mem_ctls_mutex);
385
386 list_for_each(item, &mc_devices) {
387 mci = list_entry(item, struct mem_ctl_info, link);
388
389 edac_mc_workq_setup(mci, (unsigned long) value);
390 }
Dave Jiang81d87cb2007-07-19 01:49:52 -0700391
392 mutex_unlock(&mem_ctls_mutex);
393}
394
Doug Thompsonbce19682007-07-26 10:41:14 -0700395
396
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700397/* Return 0 on success, 1 on failure.
398 * Before calling this function, caller must
399 * assign a unique value to mci->mc_idx.
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700400 *
401 * locking model:
402 *
403 * called with the mem_ctls_mutex lock held
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700404 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700405static int add_mc_to_global_list(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800406{
407 struct list_head *item, *insert_before;
408 struct mem_ctl_info *p;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800409
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700410 insert_before = &mc_devices;
411
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700412 p = find_mci_by_dev(mci->dev);
413 if (unlikely(p != NULL))
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700414 goto fail0;
415
416 list_for_each(item, &mc_devices) {
417 p = list_entry(item, struct mem_ctl_info, link);
418
419 if (p->mc_idx >= mci->mc_idx) {
420 if (unlikely(p->mc_idx == mci->mc_idx))
421 goto fail1;
422
423 insert_before = item;
424 break;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800425 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800426 }
427
428 list_add_tail_rcu(&mci->link, insert_before);
Dave Jiangc0d12172007-07-19 01:49:46 -0700429 atomic_inc(&edac_handlers);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800430 return 0;
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700431
Douglas Thompson052dfb42007-07-19 01:50:13 -0700432fail0:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700433 edac_printk(KERN_WARNING, EDAC_MC,
Kay Sievers281efb12009-01-06 14:42:57 -0800434 "%s (%s) %s %s already assigned %d\n", dev_name(p->dev),
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000435 edac_dev_name(mci), p->mod_name, p->ctl_name, p->mc_idx);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700436 return 1;
437
Douglas Thompson052dfb42007-07-19 01:50:13 -0700438fail1:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700439 edac_printk(KERN_WARNING, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700440 "bug in low-level driver: attempt to assign\n"
441 " duplicate mc_idx %d in %s()\n", p->mc_idx, __func__);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700442 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800443}
444
Dave Petersone7ecd892006-03-26 01:38:52 -0800445static void complete_mc_list_del(struct rcu_head *head)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800446{
447 struct mem_ctl_info *mci;
448
449 mci = container_of(head, struct mem_ctl_info, rcu);
450 INIT_LIST_HEAD(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800451}
452
Dave Petersone7ecd892006-03-26 01:38:52 -0800453static void del_mc_from_global_list(struct mem_ctl_info *mci)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800454{
Dave Jiangc0d12172007-07-19 01:49:46 -0700455 atomic_dec(&edac_handlers);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800456 list_del_rcu(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800457 call_rcu(&mci->rcu, complete_mc_list_del);
Jesper Dangaard Brouer458e5ff2009-09-23 15:57:29 -0700458 rcu_barrier();
Dave Petersona1d03fc2006-03-26 01:38:46 -0800459}
460
Alan Coxda9bb1d2006-01-18 17:44:13 -0800461/**
Douglas Thompson5da08312007-07-19 01:49:31 -0700462 * edac_mc_find: Search for a mem_ctl_info structure whose index is 'idx'.
463 *
464 * If found, return a pointer to the structure.
465 * Else return NULL.
466 *
467 * Caller must hold mem_ctls_mutex.
468 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700469struct mem_ctl_info *edac_mc_find(int idx)
Douglas Thompson5da08312007-07-19 01:49:31 -0700470{
471 struct list_head *item;
472 struct mem_ctl_info *mci;
473
474 list_for_each(item, &mc_devices) {
475 mci = list_entry(item, struct mem_ctl_info, link);
476
477 if (mci->mc_idx >= idx) {
478 if (mci->mc_idx == idx)
479 return mci;
480
481 break;
482 }
483 }
484
485 return NULL;
486}
487EXPORT_SYMBOL(edac_mc_find);
488
489/**
Dave Peterson472678e2006-03-26 01:38:49 -0800490 * edac_mc_add_mc: Insert the 'mci' structure into the mci global list and
491 * create sysfs entries associated with mci structure
Alan Coxda9bb1d2006-01-18 17:44:13 -0800492 * @mci: pointer to the mci structure to be added to the list
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700493 * @mc_idx: A unique numeric identifier to be assigned to the 'mci' structure.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800494 *
495 * Return:
496 * 0 Success
497 * !0 Failure
498 */
499
500/* FIXME - should a warning be printed if no error detection? correction? */
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700501int edac_mc_add_mc(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800502{
Dave Peterson537fba22006-03-26 01:38:40 -0800503 debugf0("%s()\n", __func__);
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700504
Alan Coxda9bb1d2006-01-18 17:44:13 -0800505#ifdef CONFIG_EDAC_DEBUG
506 if (edac_debug_level >= 3)
507 edac_mc_dump_mci(mci);
Dave Petersone7ecd892006-03-26 01:38:52 -0800508
Alan Coxda9bb1d2006-01-18 17:44:13 -0800509 if (edac_debug_level >= 4) {
510 int i;
511
512 for (i = 0; i < mci->nr_csrows; i++) {
513 int j;
Dave Petersone7ecd892006-03-26 01:38:52 -0800514
Alan Coxda9bb1d2006-01-18 17:44:13 -0800515 edac_mc_dump_csrow(&mci->csrows[i]);
516 for (j = 0; j < mci->csrows[i].nr_channels; j++)
Douglas Thompson079708b2007-07-19 01:49:58 -0700517 edac_mc_dump_channel(&mci->csrows[i].
Douglas Thompson052dfb42007-07-19 01:50:13 -0700518 channels[j]);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800519 }
520 }
521#endif
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700522 mutex_lock(&mem_ctls_mutex);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800523
524 if (add_mc_to_global_list(mci))
Dave Peterson028a7b62006-03-26 01:38:47 -0800525 goto fail0;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800526
527 /* set load time so that error rate can be tracked */
528 mci->start_time = jiffies;
529
eric wollesen9794f332007-02-12 00:53:08 -0800530 if (edac_create_sysfs_mci_device(mci)) {
531 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700532 "failed to create sysfs device\n");
eric wollesen9794f332007-02-12 00:53:08 -0800533 goto fail1;
534 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800535
Dave Jiang81d87cb2007-07-19 01:49:52 -0700536 /* If there IS a check routine, then we are running POLLED */
537 if (mci->edac_check != NULL) {
538 /* This instance is NOW RUNNING */
539 mci->op_state = OP_RUNNING_POLL;
540
541 edac_mc_workq_setup(mci, edac_mc_get_poll_msec());
542 } else {
543 mci->op_state = OP_RUNNING_INTERRUPT;
544 }
545
Alan Coxda9bb1d2006-01-18 17:44:13 -0800546 /* Report action taken */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700547 edac_mc_printk(mci, KERN_INFO, "Giving out device to '%s' '%s':"
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000548 " DEV %s\n", mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Alan Coxda9bb1d2006-01-18 17:44:13 -0800549
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700550 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800551 return 0;
552
Douglas Thompson052dfb42007-07-19 01:50:13 -0700553fail1:
Dave Peterson028a7b62006-03-26 01:38:47 -0800554 del_mc_from_global_list(mci);
555
Douglas Thompson052dfb42007-07-19 01:50:13 -0700556fail0:
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700557 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800558 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800559}
Dave Peterson91105402006-03-26 01:38:55 -0800560EXPORT_SYMBOL_GPL(edac_mc_add_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800561
Alan Coxda9bb1d2006-01-18 17:44:13 -0800562/**
Dave Peterson472678e2006-03-26 01:38:49 -0800563 * edac_mc_del_mc: Remove sysfs entries for specified mci structure and
564 * remove mci structure from global list
Doug Thompson37f04582006-06-30 01:56:07 -0700565 * @pdev: Pointer to 'struct device' representing mci structure to remove.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800566 *
Dave Peterson18dbc332006-03-26 01:38:50 -0800567 * Return pointer to removed mci structure, or NULL if device not found.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800568 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700569struct mem_ctl_info *edac_mc_del_mc(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800570{
Dave Peterson18dbc332006-03-26 01:38:50 -0800571 struct mem_ctl_info *mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800572
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700573 debugf0("%s()\n", __func__);
574
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700575 mutex_lock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800576
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700577 /* find the requested mci struct in the global list */
578 mci = find_mci_by_dev(dev);
579 if (mci == NULL) {
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700580 mutex_unlock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800581 return NULL;
582 }
583
Dave Jiang81d87cb2007-07-19 01:49:52 -0700584 /* marking MCI offline */
585 mci->op_state = OP_OFFLINE;
586
Alan Coxda9bb1d2006-01-18 17:44:13 -0800587 del_mc_from_global_list(mci);
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700588 mutex_unlock(&mem_ctls_mutex);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700589
590 /* flush workq processes and remove sysfs */
591 edac_mc_workq_teardown(mci);
592 edac_remove_sysfs_mci_device(mci);
593
Dave Peterson537fba22006-03-26 01:38:40 -0800594 edac_printk(KERN_INFO, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700595 "Removed device %d for %s %s: DEV %s\n", mci->mc_idx,
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000596 mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700597
Dave Peterson18dbc332006-03-26 01:38:50 -0800598 return mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800599}
Dave Peterson91105402006-03-26 01:38:55 -0800600EXPORT_SYMBOL_GPL(edac_mc_del_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800601
Adrian Bunk2da1c112007-07-19 01:49:32 -0700602static void edac_mc_scrub_block(unsigned long page, unsigned long offset,
603 u32 size)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800604{
605 struct page *pg;
606 void *virt_addr;
607 unsigned long flags = 0;
608
Dave Peterson537fba22006-03-26 01:38:40 -0800609 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800610
611 /* ECC error page was not in our memory. Ignore it. */
Douglas Thompson079708b2007-07-19 01:49:58 -0700612 if (!pfn_valid(page))
Alan Coxda9bb1d2006-01-18 17:44:13 -0800613 return;
614
615 /* Find the actual page structure then map it and fix */
616 pg = pfn_to_page(page);
617
618 if (PageHighMem(pg))
619 local_irq_save(flags);
620
621 virt_addr = kmap_atomic(pg, KM_BOUNCE_READ);
622
623 /* Perform architecture specific atomic scrub operation */
624 atomic_scrub(virt_addr + offset, size);
625
626 /* Unmap and complete */
627 kunmap_atomic(virt_addr, KM_BOUNCE_READ);
628
629 if (PageHighMem(pg))
630 local_irq_restore(flags);
631}
632
Alan Coxda9bb1d2006-01-18 17:44:13 -0800633/* FIXME - should return -1 */
Dave Petersone7ecd892006-03-26 01:38:52 -0800634int edac_mc_find_csrow_by_page(struct mem_ctl_info *mci, unsigned long page)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800635{
636 struct csrow_info *csrows = mci->csrows;
637 int row, i;
638
Dave Peterson537fba22006-03-26 01:38:40 -0800639 debugf1("MC%d: %s(): 0x%lx\n", mci->mc_idx, __func__, page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800640 row = -1;
641
642 for (i = 0; i < mci->nr_csrows; i++) {
643 struct csrow_info *csrow = &csrows[i];
644
645 if (csrow->nr_pages == 0)
646 continue;
647
Dave Peterson537fba22006-03-26 01:38:40 -0800648 debugf3("MC%d: %s(): first(0x%lx) page(0x%lx) last(0x%lx) "
649 "mask(0x%lx)\n", mci->mc_idx, __func__,
650 csrow->first_page, page, csrow->last_page,
651 csrow->page_mask);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800652
653 if ((page >= csrow->first_page) &&
654 (page <= csrow->last_page) &&
655 ((page & csrow->page_mask) ==
656 (csrow->first_page & csrow->page_mask))) {
657 row = i;
658 break;
659 }
660 }
661
662 if (row == -1)
Dave Peterson537fba22006-03-26 01:38:40 -0800663 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700664 "could not look up page error address %lx\n",
665 (unsigned long)page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800666
667 return row;
668}
Dave Peterson91105402006-03-26 01:38:55 -0800669EXPORT_SYMBOL_GPL(edac_mc_find_csrow_by_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800670
Alan Coxda9bb1d2006-01-18 17:44:13 -0800671/* FIXME - setable log (warning/emerg) levels */
672/* FIXME - integrate with evlog: http://evlog.sourceforge.net/ */
673void edac_mc_handle_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700674 unsigned long page_frame_number,
675 unsigned long offset_in_page, unsigned long syndrome,
676 int row, int channel, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800677{
678 unsigned long remapped_page;
679
Dave Peterson537fba22006-03-26 01:38:40 -0800680 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800681
682 /* FIXME - maybe make panic on INTERNAL ERROR an option */
683 if (row >= mci->nr_csrows || row < 0) {
684 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800685 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700686 "INTERNAL ERROR: row out of range "
687 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800688 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
689 return;
690 }
Dave Petersone7ecd892006-03-26 01:38:52 -0800691
Alan Coxda9bb1d2006-01-18 17:44:13 -0800692 if (channel >= mci->csrows[row].nr_channels || channel < 0) {
693 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800694 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700695 "INTERNAL ERROR: channel out of range "
696 "(%d >= %d)\n", channel,
697 mci->csrows[row].nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800698 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
699 return;
700 }
701
Dave Jiang4de78c62007-07-19 01:49:54 -0700702 if (edac_mc_get_log_ce())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800703 /* FIXME - put in DIMM location */
Dave Peterson537fba22006-03-26 01:38:40 -0800704 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700705 "CE page 0x%lx, offset 0x%lx, grain %d, syndrome "
706 "0x%lx, row %d, channel %d, label \"%s\": %s\n",
707 page_frame_number, offset_in_page,
708 mci->csrows[row].grain, syndrome, row, channel,
709 mci->csrows[row].channels[channel].label, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800710
711 mci->ce_count++;
712 mci->csrows[row].ce_count++;
713 mci->csrows[row].channels[channel].ce_count++;
714
715 if (mci->scrub_mode & SCRUB_SW_SRC) {
716 /*
717 * Some MC's can remap memory so that it is still available
718 * at a different address when PCI devices map into memory.
719 * MC's that can't do this lose the memory where PCI devices
720 * are mapped. This mapping is MC dependant and so we call
721 * back into the MC driver for it to map the MC page to
722 * a physical (CPU) page which can then be mapped to a virtual
723 * page - which can then be scrubbed.
724 */
725 remapped_page = mci->ctl_page_to_phys ?
Douglas Thompson052dfb42007-07-19 01:50:13 -0700726 mci->ctl_page_to_phys(mci, page_frame_number) :
727 page_frame_number;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800728
729 edac_mc_scrub_block(remapped_page, offset_in_page,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700730 mci->csrows[row].grain);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800731 }
732}
Dave Peterson91105402006-03-26 01:38:55 -0800733EXPORT_SYMBOL_GPL(edac_mc_handle_ce);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800734
Dave Petersone7ecd892006-03-26 01:38:52 -0800735void edac_mc_handle_ce_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800736{
Dave Jiang4de78c62007-07-19 01:49:54 -0700737 if (edac_mc_get_log_ce())
Dave Peterson537fba22006-03-26 01:38:40 -0800738 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700739 "CE - no information available: %s\n", msg);
Dave Petersone7ecd892006-03-26 01:38:52 -0800740
Alan Coxda9bb1d2006-01-18 17:44:13 -0800741 mci->ce_noinfo_count++;
742 mci->ce_count++;
743}
Dave Peterson91105402006-03-26 01:38:55 -0800744EXPORT_SYMBOL_GPL(edac_mc_handle_ce_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800745
Alan Coxda9bb1d2006-01-18 17:44:13 -0800746void edac_mc_handle_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700747 unsigned long page_frame_number,
748 unsigned long offset_in_page, int row, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800749{
750 int len = EDAC_MC_LABEL_LEN * 4;
751 char labels[len + 1];
752 char *pos = labels;
753 int chan;
754 int chars;
755
Dave Peterson537fba22006-03-26 01:38:40 -0800756 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800757
758 /* FIXME - maybe make panic on INTERNAL ERROR an option */
759 if (row >= mci->nr_csrows || row < 0) {
760 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800761 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700762 "INTERNAL ERROR: row out of range "
763 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800764 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
765 return;
766 }
767
768 chars = snprintf(pos, len + 1, "%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700769 mci->csrows[row].channels[0].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800770 len -= chars;
771 pos += chars;
Dave Petersone7ecd892006-03-26 01:38:52 -0800772
Alan Coxda9bb1d2006-01-18 17:44:13 -0800773 for (chan = 1; (chan < mci->csrows[row].nr_channels) && (len > 0);
Douglas Thompson052dfb42007-07-19 01:50:13 -0700774 chan++) {
Alan Coxda9bb1d2006-01-18 17:44:13 -0800775 chars = snprintf(pos, len + 1, ":%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700776 mci->csrows[row].channels[chan].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800777 len -= chars;
778 pos += chars;
779 }
780
Dave Jiang4de78c62007-07-19 01:49:54 -0700781 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800782 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700783 "UE page 0x%lx, offset 0x%lx, grain %d, row %d, "
784 "labels \"%s\": %s\n", page_frame_number,
785 offset_in_page, mci->csrows[row].grain, row,
786 labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800787
Dave Jiang4de78c62007-07-19 01:49:54 -0700788 if (edac_mc_get_panic_on_ue())
Dave Petersone7ecd892006-03-26 01:38:52 -0800789 panic("EDAC MC%d: UE page 0x%lx, offset 0x%lx, grain %d, "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700790 "row %d, labels \"%s\": %s\n", mci->mc_idx,
791 page_frame_number, offset_in_page,
792 mci->csrows[row].grain, row, labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800793
794 mci->ue_count++;
795 mci->csrows[row].ue_count++;
796}
Dave Peterson91105402006-03-26 01:38:55 -0800797EXPORT_SYMBOL_GPL(edac_mc_handle_ue);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800798
Dave Petersone7ecd892006-03-26 01:38:52 -0800799void edac_mc_handle_ue_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800800{
Dave Jiang4de78c62007-07-19 01:49:54 -0700801 if (edac_mc_get_panic_on_ue())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800802 panic("EDAC MC%d: Uncorrected Error", mci->mc_idx);
803
Dave Jiang4de78c62007-07-19 01:49:54 -0700804 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800805 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700806 "UE - no information available: %s\n", msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800807 mci->ue_noinfo_count++;
808 mci->ue_count++;
809}
Douglas Thompson079708b2007-07-19 01:49:58 -0700810EXPORT_SYMBOL_GPL(edac_mc_handle_ue_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800811
eric wollesen9794f332007-02-12 00:53:08 -0800812/*************************************************************
813 * On Fully Buffered DIMM modules, this help function is
814 * called to process UE events
815 */
816void edac_mc_handle_fbd_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700817 unsigned int csrow,
818 unsigned int channela,
819 unsigned int channelb, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800820{
821 int len = EDAC_MC_LABEL_LEN * 4;
822 char labels[len + 1];
823 char *pos = labels;
824 int chars;
825
826 if (csrow >= mci->nr_csrows) {
827 /* something is wrong */
828 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700829 "INTERNAL ERROR: row out of range (%d >= %d)\n",
830 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800831 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
832 return;
833 }
834
835 if (channela >= mci->csrows[csrow].nr_channels) {
836 /* something is wrong */
837 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700838 "INTERNAL ERROR: channel-a out of range "
839 "(%d >= %d)\n",
840 channela, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800841 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
842 return;
843 }
844
845 if (channelb >= mci->csrows[csrow].nr_channels) {
846 /* something is wrong */
847 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700848 "INTERNAL ERROR: channel-b out of range "
849 "(%d >= %d)\n",
850 channelb, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800851 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
852 return;
853 }
854
855 mci->ue_count++;
856 mci->csrows[csrow].ue_count++;
857
858 /* Generate the DIMM labels from the specified channels */
859 chars = snprintf(pos, len + 1, "%s",
860 mci->csrows[csrow].channels[channela].label);
Douglas Thompson079708b2007-07-19 01:49:58 -0700861 len -= chars;
862 pos += chars;
eric wollesen9794f332007-02-12 00:53:08 -0800863 chars = snprintf(pos, len + 1, "-%s",
864 mci->csrows[csrow].channels[channelb].label);
865
Dave Jiang4de78c62007-07-19 01:49:54 -0700866 if (edac_mc_get_log_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800867 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700868 "UE row %d, channel-a= %d channel-b= %d "
869 "labels \"%s\": %s\n", csrow, channela, channelb,
870 labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800871
Dave Jiang4de78c62007-07-19 01:49:54 -0700872 if (edac_mc_get_panic_on_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800873 panic("UE row %d, channel-a= %d channel-b= %d "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700874 "labels \"%s\": %s\n", csrow, channela,
875 channelb, labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800876}
877EXPORT_SYMBOL(edac_mc_handle_fbd_ue);
878
879/*************************************************************
880 * On Fully Buffered DIMM modules, this help function is
881 * called to process CE events
882 */
883void edac_mc_handle_fbd_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700884 unsigned int csrow, unsigned int channel, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800885{
886
887 /* Ensure boundary values */
888 if (csrow >= mci->nr_csrows) {
889 /* something is wrong */
890 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700891 "INTERNAL ERROR: row out of range (%d >= %d)\n",
892 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800893 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
894 return;
895 }
896 if (channel >= mci->csrows[csrow].nr_channels) {
897 /* something is wrong */
898 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700899 "INTERNAL ERROR: channel out of range (%d >= %d)\n",
900 channel, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800901 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
902 return;
903 }
904
Dave Jiang4de78c62007-07-19 01:49:54 -0700905 if (edac_mc_get_log_ce())
eric wollesen9794f332007-02-12 00:53:08 -0800906 /* FIXME - put in DIMM location */
907 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700908 "CE row %d, channel %d, label \"%s\": %s\n",
909 csrow, channel,
910 mci->csrows[csrow].channels[channel].label, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800911
912 mci->ce_count++;
913 mci->csrows[csrow].ce_count++;
914 mci->csrows[csrow].channels[channel].ce_count++;
915}
Douglas Thompson079708b2007-07-19 01:49:58 -0700916EXPORT_SYMBOL(edac_mc_handle_fbd_ce);