blob: 072aa81b4a708905bdde09c1f03a889d2946c94a [file] [log] [blame]
Alan Coxda9bb1d2006-01-18 17:44:13 -08001/*
2 * edac_mc kernel module
Doug Thompson49c0dab72006-07-10 04:45:19 -07003 * (C) 2005, 2006 Linux Networx (http://lnxi.com)
Alan Coxda9bb1d2006-01-18 17:44:13 -08004 * This file may be distributed under the terms of the
5 * GNU General Public License.
6 *
7 * Written by Thayne Harbaugh
8 * Based on work by Dan Hollis <goemon at anime dot net> and others.
9 * http://www.anime.net/~goemon/linux-ecc/
10 *
11 * Modified by Dave Peterson and Doug Thompson
12 *
13 */
14
Alan Coxda9bb1d2006-01-18 17:44:13 -080015#include <linux/module.h>
16#include <linux/proc_fs.h>
17#include <linux/kernel.h>
18#include <linux/types.h>
19#include <linux/smp.h>
20#include <linux/init.h>
21#include <linux/sysctl.h>
22#include <linux/highmem.h>
23#include <linux/timer.h>
24#include <linux/slab.h>
25#include <linux/jiffies.h>
26#include <linux/spinlock.h>
27#include <linux/list.h>
Alan Coxda9bb1d2006-01-18 17:44:13 -080028#include <linux/ctype.h>
Dave Jiangc0d12172007-07-19 01:49:46 -070029#include <linux/edac.h>
Alan Coxda9bb1d2006-01-18 17:44:13 -080030#include <asm/uaccess.h>
31#include <asm/page.h>
32#include <asm/edac.h>
Douglas Thompson20bcb7a2007-07-19 01:49:47 -070033#include "edac_core.h"
Douglas Thompson7c9281d2007-07-19 01:49:33 -070034#include "edac_module.h"
Alan Coxda9bb1d2006-01-18 17:44:13 -080035
/*
 * mem_ctls_mutex is taken around updates of the mc_devices list and by the
 * polling work function while it runs a controller's check routine.
 */
static DEFINE_MUTEX(mem_ctls_mutex);

/* registered memory controllers, kept sorted by ascending mci->mc_idx */
static LIST_HEAD(mc_devices);
Alan Coxda9bb1d2006-01-18 17:44:13 -080039
Alan Coxda9bb1d2006-01-18 17:44:13 -080040#ifdef CONFIG_EDAC_DEBUG
41
Mauro Carvalho Chehaba4b4be32012-01-27 10:26:13 -030042static void edac_mc_dump_channel(struct rank_info *chan)
Alan Coxda9bb1d2006-01-18 17:44:13 -080043{
44 debugf4("\tchannel = %p\n", chan);
45 debugf4("\tchannel->chan_idx = %d\n", chan->chan_idx);
Alan Coxda9bb1d2006-01-18 17:44:13 -080046 debugf4("\tchannel->csrow = %p\n\n", chan->csrow);
Mauro Carvalho Chehaba895bf82012-01-28 09:09:38 -030047 debugf4("\tdimm->ce_count = %d\n", chan->dimm->ce_count);
48 debugf4("\tdimm->label = '%s'\n", chan->dimm->label);
49 debugf4("\tdimm->nr_pages = 0x%x\n", chan->dimm->nr_pages);
Alan Coxda9bb1d2006-01-18 17:44:13 -080050}
51
Adrian Bunk2da1c112007-07-19 01:49:32 -070052static void edac_mc_dump_csrow(struct csrow_info *csrow)
Alan Coxda9bb1d2006-01-18 17:44:13 -080053{
54 debugf4("\tcsrow = %p\n", csrow);
55 debugf4("\tcsrow->csrow_idx = %d\n", csrow->csrow_idx);
Douglas Thompson079708b2007-07-19 01:49:58 -070056 debugf4("\tcsrow->first_page = 0x%lx\n", csrow->first_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -080057 debugf4("\tcsrow->last_page = 0x%lx\n", csrow->last_page);
58 debugf4("\tcsrow->page_mask = 0x%lx\n", csrow->page_mask);
Douglas Thompson079708b2007-07-19 01:49:58 -070059 debugf4("\tcsrow->nr_channels = %d\n", csrow->nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -080060 debugf4("\tcsrow->channels = %p\n", csrow->channels);
61 debugf4("\tcsrow->mci = %p\n\n", csrow->mci);
62}
63
Adrian Bunk2da1c112007-07-19 01:49:32 -070064static void edac_mc_dump_mci(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -080065{
66 debugf3("\tmci = %p\n", mci);
67 debugf3("\tmci->mtype_cap = %lx\n", mci->mtype_cap);
68 debugf3("\tmci->edac_ctl_cap = %lx\n", mci->edac_ctl_cap);
69 debugf3("\tmci->edac_cap = %lx\n", mci->edac_cap);
70 debugf4("\tmci->edac_check = %p\n", mci->edac_check);
71 debugf3("\tmci->nr_csrows = %d, csrows = %p\n",
72 mci->nr_csrows, mci->csrows);
Doug Thompson37f04582006-06-30 01:56:07 -070073 debugf3("\tdev = %p\n", mci->dev);
Douglas Thompson079708b2007-07-19 01:49:58 -070074 debugf3("\tmod_name:ctl_name = %s:%s\n", mci->mod_name, mci->ctl_name);
Alan Coxda9bb1d2006-01-18 17:44:13 -080075 debugf3("\tpvt_info = %p\n\n", mci->pvt_info);
76}
77
Borislav Petkov24f9a7f2010-10-07 18:29:15 +020078#endif /* CONFIG_EDAC_DEBUG */
79
/*
 * Printable names of the memory types.
 *
 * The entries must stay in the same order as the values of enum mem_type:
 * keep both in sync when adding a new type.
 */
const char *edac_mem_types[] = {
	"Empty csrow",
	"Reserved csrow type",
	"Unknown csrow type",

	/* asynchronous DRAM */
	"Fast page mode RAM",
	"Extended data out RAM",
	"Burst Extended data out RAM",

	/* SDR / DDR SDRAM and Rambus */
	"Single data rate SDRAM",
	"Registered single data rate SDRAM",
	"Double data rate SDRAM",
	"Registered Double data rate SDRAM",
	"Rambus DRAM",

	/* DDR2 and XDR */
	"Unbuffered DDR2 RAM",
	"Fully buffered DDR2",
	"Registered DDR2 RAM",
	"Rambus XDR",

	/* DDR3 */
	"Unbuffered DDR3 RAM",
	"Registered DDR3 RAM",
};
102EXPORT_SYMBOL_GPL(edac_mem_types);
103
/*
 * edac_align_ptr
 *
 * 'ptr' points to a possibly unaligned item X such that sizeof(X) is 'size'.
 * Round 'ptr' up so that its alignment is at least as stringent as what the
 * compiler would provide for X and return the aligned result.
 *
 * @ptr:  candidate address of the item; may also be a plain offset that
 *        was cast to a pointer
 * @size: sizeof() the item that is going to live at the returned address
 *
 * Returns 'ptr' unchanged when it already satisfies the alignment chosen for
 * 'size' (single byte items never need any), otherwise the next higher
 * address that does.
 */
void *edac_align_ptr(void *ptr, unsigned size)
{
	unsigned long addr = (unsigned long)ptr;
	unsigned align, r;

	/* Here we assume that the alignment of a "long long" is the most
	 * stringent alignment that the compiler will ever provide by default.
	 * As far as I know, this is a reasonable assumption.
	 */
	if (size > sizeof(long))
		align = sizeof(long long);
	else if (size > sizeof(int))
		align = sizeof(long);
	else if (size > sizeof(short))
		align = sizeof(int);
	else if (size > sizeof(char))
		align = sizeof(short);
	else
		return ptr;

	/*
	 * The amount of padding depends on where 'ptr' currently sits, not
	 * on the size of the item: derive the remainder from the address.
	 */
	r = addr % align;
	if (r == 0)
		return ptr;

	return (void *)(addr + align - r);
}
137
Alan Coxda9bb1d2006-01-18 17:44:13 -0800138/**
139 * edac_mc_alloc: Allocate a struct mem_ctl_info structure
140 * @size_pvt: size of private storage needed
141 * @nr_csrows: Number of CWROWS needed for this MC
142 * @nr_chans: Number of channels for the MC
143 *
144 * Everything is kmalloc'ed as one big chunk - more efficient.
145 * Only can be used if all structures have the same lifetime - otherwise
146 * you have to allocate and initialize your own structures.
147 *
148 * Use edac_mc_free() to free mc structures allocated by this function.
149 *
150 * Returns:
151 * NULL allocation failed
152 * struct mem_ctl_info pointer
153 */
154struct mem_ctl_info *edac_mc_alloc(unsigned sz_pvt, unsigned nr_csrows,
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700155 unsigned nr_chans, int edac_index)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800156{
157 struct mem_ctl_info *mci;
158 struct csrow_info *csi, *csrow;
Mauro Carvalho Chehaba4b4be32012-01-27 10:26:13 -0300159 struct rank_info *chi, *chp, *chan;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300160 struct dimm_info *dimm;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800161 void *pvt;
162 unsigned size;
163 int row, chn;
Doug Thompson8096cfa2007-07-19 01:50:27 -0700164 int err;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800165
166 /* Figure out the offsets of the various items from the start of an mc
167 * structure. We want the alignment of each item to be at least as
168 * stringent as what the compiler would provide if we could simply
169 * hardcode everything into a single struct.
170 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700171 mci = (struct mem_ctl_info *)0;
Douglas Thompson7391c6d2007-07-19 01:50:21 -0700172 csi = edac_align_ptr(&mci[1], sizeof(*csi));
173 chi = edac_align_ptr(&csi[nr_csrows], sizeof(*chi));
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300174 dimm = edac_align_ptr(&chi[nr_chans * nr_csrows], sizeof(*dimm));
175 pvt = edac_align_ptr(&dimm[nr_chans * nr_csrows], sz_pvt);
Douglas Thompson079708b2007-07-19 01:49:58 -0700176 size = ((unsigned long)pvt) + sz_pvt;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800177
Doug Thompson8096cfa2007-07-19 01:50:27 -0700178 mci = kzalloc(size, GFP_KERNEL);
179 if (mci == NULL)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800180 return NULL;
181
182 /* Adjust pointers so they point within the memory we just allocated
183 * rather than an imaginary chunk of memory located at address 0.
184 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700185 csi = (struct csrow_info *)(((char *)mci) + ((unsigned long)csi));
Mauro Carvalho Chehaba4b4be32012-01-27 10:26:13 -0300186 chi = (struct rank_info *)(((char *)mci) + ((unsigned long)chi));
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300187 dimm = (struct dimm_info *)(((char *)mci) + ((unsigned long)dimm));
Douglas Thompson079708b2007-07-19 01:49:58 -0700188 pvt = sz_pvt ? (((char *)mci) + ((unsigned long)pvt)) : NULL;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800189
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700190 /* setup index and various internal pointers */
191 mci->mc_idx = edac_index;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800192 mci->csrows = csi;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300193 mci->dimms = dimm;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800194 mci->pvt_info = pvt;
195 mci->nr_csrows = nr_csrows;
196
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300197 /*
198 * For now, assumes that a per-csrow arrangement for dimms.
199 * This will be latter changed.
200 */
201 dimm = mci->dimms;
202
Alan Coxda9bb1d2006-01-18 17:44:13 -0800203 for (row = 0; row < nr_csrows; row++) {
204 csrow = &csi[row];
205 csrow->csrow_idx = row;
206 csrow->mci = mci;
207 csrow->nr_channels = nr_chans;
208 chp = &chi[row * nr_chans];
209 csrow->channels = chp;
210
211 for (chn = 0; chn < nr_chans; chn++) {
212 chan = &chp[chn];
213 chan->chan_idx = chn;
214 chan->csrow = csrow;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300215
216 mci->csrows[row].channels[chn].dimm = dimm;
217 dimm->csrow = row;
218 dimm->csrow_channel = chn;
219 dimm++;
220 mci->nr_dimms++;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800221 }
222 }
223
Dave Jiang81d87cb2007-07-19 01:49:52 -0700224 mci->op_state = OP_ALLOC;
Mauro Carvalho Chehab6fe11082010-08-12 00:30:25 -0300225 INIT_LIST_HEAD(&mci->grp_kobj_list);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700226
Doug Thompson8096cfa2007-07-19 01:50:27 -0700227 /*
228 * Initialize the 'root' kobj for the edac_mc controller
229 */
230 err = edac_mc_register_sysfs_main_kobj(mci);
231 if (err) {
232 kfree(mci);
233 return NULL;
234 }
235
236 /* at this point, the root kobj is valid, and in order to
237 * 'free' the object, then the function:
238 * edac_mc_unregister_sysfs_main_kobj() must be called
239 * which will perform kobj unregistration and the actual free
240 * will occur during the kobject callback operation
241 */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800242 return mci;
243}
Dave Peterson91105402006-03-26 01:38:55 -0800244EXPORT_SYMBOL_GPL(edac_mc_alloc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800245
/**
 * edac_mc_free: release a 'mci' structure obtained from edac_mc_alloc()
 * @mci: pointer to a struct mem_ctl_info structure
 *
 * Unregisters the controller's main sysfs kobject and then frees the
 * memory of the mci instance.
 */
void edac_mc_free(struct mem_ctl_info *mci)
{
	debugf1("%s()\n", __func__);

	/* the sysfs 'root' kobj goes first, then the memory behind it */
	edac_mc_unregister_sysfs_main_kobj(mci);
	kfree(mci);
}
Dave Peterson91105402006-03-26 01:38:55 -0800260EXPORT_SYMBOL_GPL(edac_mc_free);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800261
Doug Thompsonbce19682007-07-26 10:41:14 -0700262
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300263/**
Doug Thompsonbce19682007-07-26 10:41:14 -0700264 * find_mci_by_dev
265 *
266 * scan list of controllers looking for the one that manages
267 * the 'dev' device
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300268 * @dev: pointer to a struct device related with the MCI
Doug Thompsonbce19682007-07-26 10:41:14 -0700269 */
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300270struct mem_ctl_info *find_mci_by_dev(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800271{
272 struct mem_ctl_info *mci;
273 struct list_head *item;
274
Dave Peterson537fba22006-03-26 01:38:40 -0800275 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800276
277 list_for_each(item, &mc_devices) {
278 mci = list_entry(item, struct mem_ctl_info, link);
279
Doug Thompson37f04582006-06-30 01:56:07 -0700280 if (mci->dev == dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800281 return mci;
282 }
283
284 return NULL;
285}
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300286EXPORT_SYMBOL_GPL(find_mci_by_dev);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800287
Dave Jiang81d87cb2007-07-19 01:49:52 -0700288/*
289 * handler for EDAC to check if NMI type handler has asserted interrupt
290 */
291static int edac_mc_assert_error_check_and_clear(void)
292{
Dave Jiang66ee2f92007-07-19 01:49:54 -0700293 int old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700294
Douglas Thompson079708b2007-07-19 01:49:58 -0700295 if (edac_op_state == EDAC_OPSTATE_POLL)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700296 return 1;
297
Dave Jiang66ee2f92007-07-19 01:49:54 -0700298 old_state = edac_err_assert;
299 edac_err_assert = 0;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700300
Dave Jiang66ee2f92007-07-19 01:49:54 -0700301 return old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700302}
303
304/*
305 * edac_mc_workq_function
306 * performs the operation scheduled by a workq request
307 */
Dave Jiang81d87cb2007-07-19 01:49:52 -0700308static void edac_mc_workq_function(struct work_struct *work_req)
309{
Jean Delvarefbeb4382009-04-13 14:40:21 -0700310 struct delayed_work *d_work = to_delayed_work(work_req);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700311 struct mem_ctl_info *mci = to_edac_mem_ctl_work(d_work);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700312
313 mutex_lock(&mem_ctls_mutex);
314
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700315 /* if this control struct has movd to offline state, we are done */
316 if (mci->op_state == OP_OFFLINE) {
317 mutex_unlock(&mem_ctls_mutex);
318 return;
319 }
320
Dave Jiang81d87cb2007-07-19 01:49:52 -0700321 /* Only poll controllers that are running polled and have a check */
322 if (edac_mc_assert_error_check_and_clear() && (mci->edac_check != NULL))
323 mci->edac_check(mci);
324
Dave Jiang81d87cb2007-07-19 01:49:52 -0700325 mutex_unlock(&mem_ctls_mutex);
326
327 /* Reschedule */
Dave Jiang4de78c62007-07-19 01:49:54 -0700328 queue_delayed_work(edac_workqueue, &mci->work,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700329 msecs_to_jiffies(edac_mc_get_poll_msec()));
Dave Jiang81d87cb2007-07-19 01:49:52 -0700330}
331
332/*
333 * edac_mc_workq_setup
334 * initialize a workq item for this mci
335 * passing in the new delay period in msec
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700336 *
337 * locking model:
338 *
339 * called with the mem_ctls_mutex held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700340 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700341static void edac_mc_workq_setup(struct mem_ctl_info *mci, unsigned msec)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700342{
343 debugf0("%s()\n", __func__);
344
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700345 /* if this instance is not in the POLL state, then simply return */
346 if (mci->op_state != OP_RUNNING_POLL)
347 return;
348
Dave Jiang81d87cb2007-07-19 01:49:52 -0700349 INIT_DELAYED_WORK(&mci->work, edac_mc_workq_function);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700350 queue_delayed_work(edac_workqueue, &mci->work, msecs_to_jiffies(msec));
351}
352
353/*
354 * edac_mc_workq_teardown
355 * stop the workq processing on this mci
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700356 *
357 * locking model:
358 *
359 * called WITHOUT lock held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700360 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700361static void edac_mc_workq_teardown(struct mem_ctl_info *mci)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700362{
363 int status;
364
Borislav Petkov00740c52010-09-26 12:42:23 +0200365 if (mci->op_state != OP_RUNNING_POLL)
366 return;
367
Doug Thompsonbce19682007-07-26 10:41:14 -0700368 status = cancel_delayed_work(&mci->work);
369 if (status == 0) {
370 debugf0("%s() not canceled, flush the queue\n",
371 __func__);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700372
Doug Thompsonbce19682007-07-26 10:41:14 -0700373 /* workq instance might be running, wait for it */
374 flush_workqueue(edac_workqueue);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700375 }
376}
377
378/*
Doug Thompsonbce19682007-07-26 10:41:14 -0700379 * edac_mc_reset_delay_period(unsigned long value)
380 *
381 * user space has updated our poll period value, need to
382 * reset our workq delays
Dave Jiang81d87cb2007-07-19 01:49:52 -0700383 */
Doug Thompsonbce19682007-07-26 10:41:14 -0700384void edac_mc_reset_delay_period(int value)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700385{
Doug Thompsonbce19682007-07-26 10:41:14 -0700386 struct mem_ctl_info *mci;
387 struct list_head *item;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700388
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700389 mutex_lock(&mem_ctls_mutex);
390
Doug Thompsonbce19682007-07-26 10:41:14 -0700391 /* scan the list and turn off all workq timers, doing so under lock
392 */
393 list_for_each(item, &mc_devices) {
394 mci = list_entry(item, struct mem_ctl_info, link);
395
396 if (mci->op_state == OP_RUNNING_POLL)
397 cancel_delayed_work(&mci->work);
398 }
399
400 mutex_unlock(&mem_ctls_mutex);
401
402
403 /* re-walk the list, and reset the poll delay */
404 mutex_lock(&mem_ctls_mutex);
405
406 list_for_each(item, &mc_devices) {
407 mci = list_entry(item, struct mem_ctl_info, link);
408
409 edac_mc_workq_setup(mci, (unsigned long) value);
410 }
Dave Jiang81d87cb2007-07-19 01:49:52 -0700411
412 mutex_unlock(&mem_ctls_mutex);
413}
414
Doug Thompsonbce19682007-07-26 10:41:14 -0700415
416
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700417/* Return 0 on success, 1 on failure.
418 * Before calling this function, caller must
419 * assign a unique value to mci->mc_idx.
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700420 *
421 * locking model:
422 *
423 * called with the mem_ctls_mutex lock held
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700424 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700425static int add_mc_to_global_list(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800426{
427 struct list_head *item, *insert_before;
428 struct mem_ctl_info *p;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800429
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700430 insert_before = &mc_devices;
431
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700432 p = find_mci_by_dev(mci->dev);
433 if (unlikely(p != NULL))
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700434 goto fail0;
435
436 list_for_each(item, &mc_devices) {
437 p = list_entry(item, struct mem_ctl_info, link);
438
439 if (p->mc_idx >= mci->mc_idx) {
440 if (unlikely(p->mc_idx == mci->mc_idx))
441 goto fail1;
442
443 insert_before = item;
444 break;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800445 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800446 }
447
448 list_add_tail_rcu(&mci->link, insert_before);
Dave Jiangc0d12172007-07-19 01:49:46 -0700449 atomic_inc(&edac_handlers);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800450 return 0;
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700451
Douglas Thompson052dfb42007-07-19 01:50:13 -0700452fail0:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700453 edac_printk(KERN_WARNING, EDAC_MC,
Kay Sievers281efb12009-01-06 14:42:57 -0800454 "%s (%s) %s %s already assigned %d\n", dev_name(p->dev),
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000455 edac_dev_name(mci), p->mod_name, p->ctl_name, p->mc_idx);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700456 return 1;
457
Douglas Thompson052dfb42007-07-19 01:50:13 -0700458fail1:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700459 edac_printk(KERN_WARNING, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700460 "bug in low-level driver: attempt to assign\n"
461 " duplicate mc_idx %d in %s()\n", p->mc_idx, __func__);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700462 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800463}
464
Dave Petersone7ecd892006-03-26 01:38:52 -0800465static void del_mc_from_global_list(struct mem_ctl_info *mci)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800466{
Dave Jiangc0d12172007-07-19 01:49:46 -0700467 atomic_dec(&edac_handlers);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800468 list_del_rcu(&mci->link);
Lai Jiangshane2e77092011-05-26 16:25:58 -0700469
470 /* these are for safe removal of devices from global list while
471 * NMI handlers may be traversing list
472 */
473 synchronize_rcu();
474 INIT_LIST_HEAD(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800475}
476
Alan Coxda9bb1d2006-01-18 17:44:13 -0800477/**
Douglas Thompson5da08312007-07-19 01:49:31 -0700478 * edac_mc_find: Search for a mem_ctl_info structure whose index is 'idx'.
479 *
480 * If found, return a pointer to the structure.
481 * Else return NULL.
482 *
483 * Caller must hold mem_ctls_mutex.
484 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700485struct mem_ctl_info *edac_mc_find(int idx)
Douglas Thompson5da08312007-07-19 01:49:31 -0700486{
487 struct list_head *item;
488 struct mem_ctl_info *mci;
489
490 list_for_each(item, &mc_devices) {
491 mci = list_entry(item, struct mem_ctl_info, link);
492
493 if (mci->mc_idx >= idx) {
494 if (mci->mc_idx == idx)
495 return mci;
496
497 break;
498 }
499 }
500
501 return NULL;
502}
503EXPORT_SYMBOL(edac_mc_find);
504
505/**
Dave Peterson472678e2006-03-26 01:38:49 -0800506 * edac_mc_add_mc: Insert the 'mci' structure into the mci global list and
507 * create sysfs entries associated with mci structure
Alan Coxda9bb1d2006-01-18 17:44:13 -0800508 * @mci: pointer to the mci structure to be added to the list
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700509 * @mc_idx: A unique numeric identifier to be assigned to the 'mci' structure.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800510 *
511 * Return:
512 * 0 Success
513 * !0 Failure
514 */
515
516/* FIXME - should a warning be printed if no error detection? correction? */
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700517int edac_mc_add_mc(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800518{
Dave Peterson537fba22006-03-26 01:38:40 -0800519 debugf0("%s()\n", __func__);
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700520
Alan Coxda9bb1d2006-01-18 17:44:13 -0800521#ifdef CONFIG_EDAC_DEBUG
522 if (edac_debug_level >= 3)
523 edac_mc_dump_mci(mci);
Dave Petersone7ecd892006-03-26 01:38:52 -0800524
Alan Coxda9bb1d2006-01-18 17:44:13 -0800525 if (edac_debug_level >= 4) {
526 int i;
527
528 for (i = 0; i < mci->nr_csrows; i++) {
529 int j;
Dave Petersone7ecd892006-03-26 01:38:52 -0800530
Alan Coxda9bb1d2006-01-18 17:44:13 -0800531 edac_mc_dump_csrow(&mci->csrows[i]);
532 for (j = 0; j < mci->csrows[i].nr_channels; j++)
Douglas Thompson079708b2007-07-19 01:49:58 -0700533 edac_mc_dump_channel(&mci->csrows[i].
Douglas Thompson052dfb42007-07-19 01:50:13 -0700534 channels[j]);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800535 }
536 }
537#endif
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700538 mutex_lock(&mem_ctls_mutex);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800539
540 if (add_mc_to_global_list(mci))
Dave Peterson028a7b62006-03-26 01:38:47 -0800541 goto fail0;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800542
543 /* set load time so that error rate can be tracked */
544 mci->start_time = jiffies;
545
eric wollesen9794f332007-02-12 00:53:08 -0800546 if (edac_create_sysfs_mci_device(mci)) {
547 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700548 "failed to create sysfs device\n");
eric wollesen9794f332007-02-12 00:53:08 -0800549 goto fail1;
550 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800551
Dave Jiang81d87cb2007-07-19 01:49:52 -0700552 /* If there IS a check routine, then we are running POLLED */
553 if (mci->edac_check != NULL) {
554 /* This instance is NOW RUNNING */
555 mci->op_state = OP_RUNNING_POLL;
556
557 edac_mc_workq_setup(mci, edac_mc_get_poll_msec());
558 } else {
559 mci->op_state = OP_RUNNING_INTERRUPT;
560 }
561
Alan Coxda9bb1d2006-01-18 17:44:13 -0800562 /* Report action taken */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700563 edac_mc_printk(mci, KERN_INFO, "Giving out device to '%s' '%s':"
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000564 " DEV %s\n", mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Alan Coxda9bb1d2006-01-18 17:44:13 -0800565
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700566 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800567 return 0;
568
Douglas Thompson052dfb42007-07-19 01:50:13 -0700569fail1:
Dave Peterson028a7b62006-03-26 01:38:47 -0800570 del_mc_from_global_list(mci);
571
Douglas Thompson052dfb42007-07-19 01:50:13 -0700572fail0:
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700573 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800574 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800575}
Dave Peterson91105402006-03-26 01:38:55 -0800576EXPORT_SYMBOL_GPL(edac_mc_add_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800577
Alan Coxda9bb1d2006-01-18 17:44:13 -0800578/**
Dave Peterson472678e2006-03-26 01:38:49 -0800579 * edac_mc_del_mc: Remove sysfs entries for specified mci structure and
580 * remove mci structure from global list
Doug Thompson37f04582006-06-30 01:56:07 -0700581 * @pdev: Pointer to 'struct device' representing mci structure to remove.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800582 *
Dave Peterson18dbc332006-03-26 01:38:50 -0800583 * Return pointer to removed mci structure, or NULL if device not found.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800584 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700585struct mem_ctl_info *edac_mc_del_mc(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800586{
Dave Peterson18dbc332006-03-26 01:38:50 -0800587 struct mem_ctl_info *mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800588
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700589 debugf0("%s()\n", __func__);
590
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700591 mutex_lock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800592
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700593 /* find the requested mci struct in the global list */
594 mci = find_mci_by_dev(dev);
595 if (mci == NULL) {
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700596 mutex_unlock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800597 return NULL;
598 }
599
Alan Coxda9bb1d2006-01-18 17:44:13 -0800600 del_mc_from_global_list(mci);
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700601 mutex_unlock(&mem_ctls_mutex);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700602
Borislav Petkovbb31b3122010-12-02 17:48:35 +0100603 /* flush workq processes */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700604 edac_mc_workq_teardown(mci);
Borislav Petkovbb31b3122010-12-02 17:48:35 +0100605
606 /* marking MCI offline */
607 mci->op_state = OP_OFFLINE;
608
609 /* remove from sysfs */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700610 edac_remove_sysfs_mci_device(mci);
611
Dave Peterson537fba22006-03-26 01:38:40 -0800612 edac_printk(KERN_INFO, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700613 "Removed device %d for %s %s: DEV %s\n", mci->mc_idx,
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000614 mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700615
Dave Peterson18dbc332006-03-26 01:38:50 -0800616 return mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800617}
Dave Peterson91105402006-03-26 01:38:55 -0800618EXPORT_SYMBOL_GPL(edac_mc_del_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800619
Adrian Bunk2da1c112007-07-19 01:49:32 -0700620static void edac_mc_scrub_block(unsigned long page, unsigned long offset,
621 u32 size)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800622{
623 struct page *pg;
624 void *virt_addr;
625 unsigned long flags = 0;
626
Dave Peterson537fba22006-03-26 01:38:40 -0800627 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800628
629 /* ECC error page was not in our memory. Ignore it. */
Douglas Thompson079708b2007-07-19 01:49:58 -0700630 if (!pfn_valid(page))
Alan Coxda9bb1d2006-01-18 17:44:13 -0800631 return;
632
633 /* Find the actual page structure then map it and fix */
634 pg = pfn_to_page(page);
635
636 if (PageHighMem(pg))
637 local_irq_save(flags);
638
Cong Wang4e5df7c2011-11-25 23:14:19 +0800639 virt_addr = kmap_atomic(pg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800640
641 /* Perform architecture specific atomic scrub operation */
642 atomic_scrub(virt_addr + offset, size);
643
644 /* Unmap and complete */
Cong Wang4e5df7c2011-11-25 23:14:19 +0800645 kunmap_atomic(virt_addr);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800646
647 if (PageHighMem(pg))
648 local_irq_restore(flags);
649}
650
Alan Coxda9bb1d2006-01-18 17:44:13 -0800651/* FIXME - should return -1 */
Dave Petersone7ecd892006-03-26 01:38:52 -0800652int edac_mc_find_csrow_by_page(struct mem_ctl_info *mci, unsigned long page)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800653{
654 struct csrow_info *csrows = mci->csrows;
Mauro Carvalho Chehaba895bf82012-01-28 09:09:38 -0300655 int row, i, j, n;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800656
Dave Peterson537fba22006-03-26 01:38:40 -0800657 debugf1("MC%d: %s(): 0x%lx\n", mci->mc_idx, __func__, page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800658 row = -1;
659
660 for (i = 0; i < mci->nr_csrows; i++) {
661 struct csrow_info *csrow = &csrows[i];
Mauro Carvalho Chehaba895bf82012-01-28 09:09:38 -0300662 n = 0;
663 for (j = 0; j < csrow->nr_channels; j++) {
664 struct dimm_info *dimm = csrow->channels[j].dimm;
665 n += dimm->nr_pages;
666 }
667 if (n == 0)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800668 continue;
669
Dave Peterson537fba22006-03-26 01:38:40 -0800670 debugf3("MC%d: %s(): first(0x%lx) page(0x%lx) last(0x%lx) "
671 "mask(0x%lx)\n", mci->mc_idx, __func__,
672 csrow->first_page, page, csrow->last_page,
673 csrow->page_mask);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800674
675 if ((page >= csrow->first_page) &&
676 (page <= csrow->last_page) &&
677 ((page & csrow->page_mask) ==
678 (csrow->first_page & csrow->page_mask))) {
679 row = i;
680 break;
681 }
682 }
683
684 if (row == -1)
Dave Peterson537fba22006-03-26 01:38:40 -0800685 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700686 "could not look up page error address %lx\n",
687 (unsigned long)page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800688
689 return row;
690}
Dave Peterson91105402006-03-26 01:38:55 -0800691EXPORT_SYMBOL_GPL(edac_mc_find_csrow_by_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800692
Alan Coxda9bb1d2006-01-18 17:44:13 -0800693/* FIXME - setable log (warning/emerg) levels */
694/* FIXME - integrate with evlog: http://evlog.sourceforge.net/ */
695void edac_mc_handle_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700696 unsigned long page_frame_number,
697 unsigned long offset_in_page, unsigned long syndrome,
698 int row, int channel, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800699{
700 unsigned long remapped_page;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300701 char *label = NULL;
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300702 u32 grain;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800703
Dave Peterson537fba22006-03-26 01:38:40 -0800704 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800705
706 /* FIXME - maybe make panic on INTERNAL ERROR an option */
707 if (row >= mci->nr_csrows || row < 0) {
708 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800709 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700710 "INTERNAL ERROR: row out of range "
711 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800712 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
713 return;
714 }
Dave Petersone7ecd892006-03-26 01:38:52 -0800715
Alan Coxda9bb1d2006-01-18 17:44:13 -0800716 if (channel >= mci->csrows[row].nr_channels || channel < 0) {
717 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800718 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700719 "INTERNAL ERROR: channel out of range "
720 "(%d >= %d)\n", channel,
721 mci->csrows[row].nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800722 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
723 return;
724 }
725
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300726 label = mci->csrows[row].channels[channel].dimm->label;
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300727 grain = mci->csrows[row].channels[channel].dimm->grain;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300728
Dave Jiang4de78c62007-07-19 01:49:54 -0700729 if (edac_mc_get_log_ce())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800730 /* FIXME - put in DIMM location */
Dave Peterson537fba22006-03-26 01:38:40 -0800731 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700732 "CE page 0x%lx, offset 0x%lx, grain %d, syndrome "
733 "0x%lx, row %d, channel %d, label \"%s\": %s\n",
734 page_frame_number, offset_in_page,
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300735 grain, syndrome, row, channel,
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300736 label, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800737
738 mci->ce_count++;
739 mci->csrows[row].ce_count++;
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300740 mci->csrows[row].channels[channel].dimm->ce_count++;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800741 mci->csrows[row].channels[channel].ce_count++;
742
743 if (mci->scrub_mode & SCRUB_SW_SRC) {
744 /*
745 * Some MC's can remap memory so that it is still available
746 * at a different address when PCI devices map into memory.
747 * MC's that can't do this lose the memory where PCI devices
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300748 * are mapped. This mapping is MC dependent and so we call
Alan Coxda9bb1d2006-01-18 17:44:13 -0800749 * back into the MC driver for it to map the MC page to
750 * a physical (CPU) page which can then be mapped to a virtual
751 * page - which can then be scrubbed.
752 */
753 remapped_page = mci->ctl_page_to_phys ?
Douglas Thompson052dfb42007-07-19 01:50:13 -0700754 mci->ctl_page_to_phys(mci, page_frame_number) :
755 page_frame_number;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800756
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300757 edac_mc_scrub_block(remapped_page, offset_in_page, grain);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800758 }
759}
Dave Peterson91105402006-03-26 01:38:55 -0800760EXPORT_SYMBOL_GPL(edac_mc_handle_ce);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800761
Dave Petersone7ecd892006-03-26 01:38:52 -0800762void edac_mc_handle_ce_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800763{
Dave Jiang4de78c62007-07-19 01:49:54 -0700764 if (edac_mc_get_log_ce())
Dave Peterson537fba22006-03-26 01:38:40 -0800765 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700766 "CE - no information available: %s\n", msg);
Dave Petersone7ecd892006-03-26 01:38:52 -0800767
Alan Coxda9bb1d2006-01-18 17:44:13 -0800768 mci->ce_noinfo_count++;
769 mci->ce_count++;
770}
Dave Peterson91105402006-03-26 01:38:55 -0800771EXPORT_SYMBOL_GPL(edac_mc_handle_ce_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800772
Alan Coxda9bb1d2006-01-18 17:44:13 -0800773void edac_mc_handle_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700774 unsigned long page_frame_number,
775 unsigned long offset_in_page, int row, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800776{
777 int len = EDAC_MC_LABEL_LEN * 4;
778 char labels[len + 1];
779 char *pos = labels;
780 int chan;
781 int chars;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300782 char *label = NULL;
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300783 u32 grain;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800784
Dave Peterson537fba22006-03-26 01:38:40 -0800785 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800786
787 /* FIXME - maybe make panic on INTERNAL ERROR an option */
788 if (row >= mci->nr_csrows || row < 0) {
789 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800790 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700791 "INTERNAL ERROR: row out of range "
792 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800793 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
794 return;
795 }
796
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300797 grain = mci->csrows[row].channels[0].dimm->grain;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300798 label = mci->csrows[row].channels[0].dimm->label;
799 chars = snprintf(pos, len + 1, "%s", label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800800 len -= chars;
801 pos += chars;
Dave Petersone7ecd892006-03-26 01:38:52 -0800802
Alan Coxda9bb1d2006-01-18 17:44:13 -0800803 for (chan = 1; (chan < mci->csrows[row].nr_channels) && (len > 0);
Douglas Thompson052dfb42007-07-19 01:50:13 -0700804 chan++) {
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300805 label = mci->csrows[row].channels[chan].dimm->label;
806 chars = snprintf(pos, len + 1, ":%s", label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800807 len -= chars;
808 pos += chars;
809 }
810
Dave Jiang4de78c62007-07-19 01:49:54 -0700811 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800812 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700813 "UE page 0x%lx, offset 0x%lx, grain %d, row %d, "
814 "labels \"%s\": %s\n", page_frame_number,
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300815 offset_in_page, grain, row, labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800816
Dave Jiang4de78c62007-07-19 01:49:54 -0700817 if (edac_mc_get_panic_on_ue())
Dave Petersone7ecd892006-03-26 01:38:52 -0800818 panic("EDAC MC%d: UE page 0x%lx, offset 0x%lx, grain %d, "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700819 "row %d, labels \"%s\": %s\n", mci->mc_idx,
820 page_frame_number, offset_in_page,
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300821 grain, row, labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800822
823 mci->ue_count++;
824 mci->csrows[row].ue_count++;
825}
Dave Peterson91105402006-03-26 01:38:55 -0800826EXPORT_SYMBOL_GPL(edac_mc_handle_ue);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800827
Dave Petersone7ecd892006-03-26 01:38:52 -0800828void edac_mc_handle_ue_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800829{
Dave Jiang4de78c62007-07-19 01:49:54 -0700830 if (edac_mc_get_panic_on_ue())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800831 panic("EDAC MC%d: Uncorrected Error", mci->mc_idx);
832
Dave Jiang4de78c62007-07-19 01:49:54 -0700833 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800834 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700835 "UE - no information available: %s\n", msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800836 mci->ue_noinfo_count++;
837 mci->ue_count++;
838}
Douglas Thompson079708b2007-07-19 01:49:58 -0700839EXPORT_SYMBOL_GPL(edac_mc_handle_ue_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800840
eric wollesen9794f332007-02-12 00:53:08 -0800841/*************************************************************
842 * On Fully Buffered DIMM modules, this help function is
843 * called to process UE events
844 */
845void edac_mc_handle_fbd_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700846 unsigned int csrow,
847 unsigned int channela,
848 unsigned int channelb, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800849{
850 int len = EDAC_MC_LABEL_LEN * 4;
851 char labels[len + 1];
852 char *pos = labels;
853 int chars;
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300854 char *label;
eric wollesen9794f332007-02-12 00:53:08 -0800855
856 if (csrow >= mci->nr_csrows) {
857 /* something is wrong */
858 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700859 "INTERNAL ERROR: row out of range (%d >= %d)\n",
860 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800861 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
862 return;
863 }
864
865 if (channela >= mci->csrows[csrow].nr_channels) {
866 /* something is wrong */
867 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700868 "INTERNAL ERROR: channel-a out of range "
869 "(%d >= %d)\n",
870 channela, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800871 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
872 return;
873 }
874
875 if (channelb >= mci->csrows[csrow].nr_channels) {
876 /* something is wrong */
877 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700878 "INTERNAL ERROR: channel-b out of range "
879 "(%d >= %d)\n",
880 channelb, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800881 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
882 return;
883 }
884
885 mci->ue_count++;
886 mci->csrows[csrow].ue_count++;
887
888 /* Generate the DIMM labels from the specified channels */
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300889 label = mci->csrows[csrow].channels[channela].dimm->label;
890 chars = snprintf(pos, len + 1, "%s", label);
Douglas Thompson079708b2007-07-19 01:49:58 -0700891 len -= chars;
892 pos += chars;
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300893
eric wollesen9794f332007-02-12 00:53:08 -0800894 chars = snprintf(pos, len + 1, "-%s",
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300895 mci->csrows[csrow].channels[channelb].dimm->label);
eric wollesen9794f332007-02-12 00:53:08 -0800896
Dave Jiang4de78c62007-07-19 01:49:54 -0700897 if (edac_mc_get_log_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800898 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700899 "UE row %d, channel-a= %d channel-b= %d "
900 "labels \"%s\": %s\n", csrow, channela, channelb,
901 labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800902
Dave Jiang4de78c62007-07-19 01:49:54 -0700903 if (edac_mc_get_panic_on_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800904 panic("UE row %d, channel-a= %d channel-b= %d "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700905 "labels \"%s\": %s\n", csrow, channela,
906 channelb, labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800907}
908EXPORT_SYMBOL(edac_mc_handle_fbd_ue);
909
910/*************************************************************
911 * On Fully Buffered DIMM modules, this help function is
912 * called to process CE events
913 */
914void edac_mc_handle_fbd_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700915 unsigned int csrow, unsigned int channel, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800916{
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300917 char *label = NULL;
eric wollesen9794f332007-02-12 00:53:08 -0800918
919 /* Ensure boundary values */
920 if (csrow >= mci->nr_csrows) {
921 /* something is wrong */
922 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700923 "INTERNAL ERROR: row out of range (%d >= %d)\n",
924 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800925 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
926 return;
927 }
928 if (channel >= mci->csrows[csrow].nr_channels) {
929 /* something is wrong */
930 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700931 "INTERNAL ERROR: channel out of range (%d >= %d)\n",
932 channel, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800933 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
934 return;
935 }
936
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300937 label = mci->csrows[csrow].channels[channel].dimm->label;
938
Dave Jiang4de78c62007-07-19 01:49:54 -0700939 if (edac_mc_get_log_ce())
eric wollesen9794f332007-02-12 00:53:08 -0800940 /* FIXME - put in DIMM location */
941 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700942 "CE row %d, channel %d, label \"%s\": %s\n",
Mauro Carvalho Chehaba7d7d2e2012-01-27 14:12:32 -0300943 csrow, channel, label, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800944
945 mci->ce_count++;
946 mci->csrows[csrow].ce_count++;
Mauro Carvalho Chehab084a4fc2012-01-27 18:38:08 -0300947 mci->csrows[csrow].channels[channel].dimm->ce_count++;
eric wollesen9794f332007-02-12 00:53:08 -0800948 mci->csrows[csrow].channels[channel].ce_count++;
949}
Douglas Thompson079708b2007-07-19 01:49:58 -0700950EXPORT_SYMBOL(edac_mc_handle_fbd_ce);