blob: 6b21e25f7a84cc99ad6ea710b788745992d1170f [file] [log] [blame]
Alan Coxda9bb1d2006-01-18 17:44:13 -08001/*
2 * edac_mc kernel module
Doug Thompson49c0dab72006-07-10 04:45:19 -07003 * (C) 2005, 2006 Linux Networx (http://lnxi.com)
Alan Coxda9bb1d2006-01-18 17:44:13 -08004 * This file may be distributed under the terms of the
5 * GNU General Public License.
6 *
7 * Written by Thayne Harbaugh
8 * Based on work by Dan Hollis <goemon at anime dot net> and others.
9 * http://www.anime.net/~goemon/linux-ecc/
10 *
11 * Modified by Dave Peterson and Doug Thompson
12 *
13 */
14
Alan Coxda9bb1d2006-01-18 17:44:13 -080015#include <linux/module.h>
16#include <linux/proc_fs.h>
17#include <linux/kernel.h>
18#include <linux/types.h>
19#include <linux/smp.h>
20#include <linux/init.h>
21#include <linux/sysctl.h>
22#include <linux/highmem.h>
23#include <linux/timer.h>
24#include <linux/slab.h>
25#include <linux/jiffies.h>
26#include <linux/spinlock.h>
27#include <linux/list.h>
28#include <linux/sysdev.h>
29#include <linux/ctype.h>
Dave Jiangc0d12172007-07-19 01:49:46 -070030#include <linux/edac.h>
Alan Coxda9bb1d2006-01-18 17:44:13 -080031#include <asm/uaccess.h>
32#include <asm/page.h>
33#include <asm/edac.h>
Douglas Thompson20bcb7a2007-07-19 01:49:47 -070034#include "edac_core.h"
Douglas Thompson7c9281d2007-07-19 01:49:33 -070035#include "edac_module.h"
Alan Coxda9bb1d2006-01-18 17:44:13 -080036
Alan Coxda9bb1d2006-01-18 17:44:13 -080037/* lock to memory controller's control array */
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -070038static DEFINE_MUTEX(mem_ctls_mutex);
Robert P. J. Dayff6ac2a2008-04-29 01:03:17 -070039static LIST_HEAD(mc_devices);
Alan Coxda9bb1d2006-01-18 17:44:13 -080040
Alan Coxda9bb1d2006-01-18 17:44:13 -080041#ifdef CONFIG_EDAC_DEBUG
42
Adrian Bunk2da1c112007-07-19 01:49:32 -070043static void edac_mc_dump_channel(struct channel_info *chan)
Alan Coxda9bb1d2006-01-18 17:44:13 -080044{
45 debugf4("\tchannel = %p\n", chan);
46 debugf4("\tchannel->chan_idx = %d\n", chan->chan_idx);
47 debugf4("\tchannel->ce_count = %d\n", chan->ce_count);
48 debugf4("\tchannel->label = '%s'\n", chan->label);
49 debugf4("\tchannel->csrow = %p\n\n", chan->csrow);
50}
51
Adrian Bunk2da1c112007-07-19 01:49:32 -070052static void edac_mc_dump_csrow(struct csrow_info *csrow)
Alan Coxda9bb1d2006-01-18 17:44:13 -080053{
54 debugf4("\tcsrow = %p\n", csrow);
55 debugf4("\tcsrow->csrow_idx = %d\n", csrow->csrow_idx);
Douglas Thompson079708b2007-07-19 01:49:58 -070056 debugf4("\tcsrow->first_page = 0x%lx\n", csrow->first_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -080057 debugf4("\tcsrow->last_page = 0x%lx\n", csrow->last_page);
58 debugf4("\tcsrow->page_mask = 0x%lx\n", csrow->page_mask);
59 debugf4("\tcsrow->nr_pages = 0x%x\n", csrow->nr_pages);
Douglas Thompson079708b2007-07-19 01:49:58 -070060 debugf4("\tcsrow->nr_channels = %d\n", csrow->nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -080061 debugf4("\tcsrow->channels = %p\n", csrow->channels);
62 debugf4("\tcsrow->mci = %p\n\n", csrow->mci);
63}
64
Adrian Bunk2da1c112007-07-19 01:49:32 -070065static void edac_mc_dump_mci(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -080066{
67 debugf3("\tmci = %p\n", mci);
68 debugf3("\tmci->mtype_cap = %lx\n", mci->mtype_cap);
69 debugf3("\tmci->edac_ctl_cap = %lx\n", mci->edac_ctl_cap);
70 debugf3("\tmci->edac_cap = %lx\n", mci->edac_cap);
71 debugf4("\tmci->edac_check = %p\n", mci->edac_check);
72 debugf3("\tmci->nr_csrows = %d, csrows = %p\n",
73 mci->nr_csrows, mci->csrows);
Doug Thompson37f04582006-06-30 01:56:07 -070074 debugf3("\tdev = %p\n", mci->dev);
Douglas Thompson079708b2007-07-19 01:49:58 -070075 debugf3("\tmod_name:ctl_name = %s:%s\n", mci->mod_name, mci->ctl_name);
Alan Coxda9bb1d2006-01-18 17:44:13 -080076 debugf3("\tpvt_info = %p\n\n", mci->pvt_info);
77}
78
/*
 * Human readable names for the memory types.  The position of each
 * string is significant: keep this table in sync with the enum mem_type.
 */
const char *edac_mem_types[] = {
	"Empty csrow",
	"Reserved csrow type",
	"Unknown csrow type",
	"Fast page mode RAM",
	"Extended data out RAM",
	"Burst Extended data out RAM",
	"Single data rate SDRAM",
	"Registered single data rate SDRAM",
	"Double data rate SDRAM",
	"Registered Double data rate SDRAM",
	"Rambus DRAM",
	"Unbuffered DDR2 RAM",
	"Fully buffered DDR2",
	"Registered DDR2 RAM",
	"Rambus XDR",
	"Unbuffered DDR3 RAM",
	"Registered DDR3 RAM",
};
EXPORT_SYMBOL_GPL(edac_mem_types);
102
Douglas Thompson079708b2007-07-19 01:49:58 -0700103#endif /* CONFIG_EDAC_DEBUG */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800104
/* 'ptr' points to a possibly unaligned item X such that sizeof(X) is 'size'.
 * Round 'ptr' up so that its alignment is at least as stringent as what the
 * compiler would provide for X and return the aligned result.
 *
 * The alignment is chosen from 'size' (anything larger than a long gets
 * "long long" alignment, and so on down to short); items of one byte or
 * less need no adjustment and 'ptr' is returned unchanged.
 *
 * The amount of padding is derived from the address held in 'ptr', not
 * from 'size': what matters is whether the pointer itself sits on an
 * 'align' boundary.
 */
void *edac_align_ptr(void *ptr, unsigned size)
{
	unsigned long addr = (unsigned long)ptr;
	unsigned align, r;

	/* Here we assume that the alignment of a "long long" is the most
	 * stringent alignment that the compiler will ever provide by default.
	 * As far as I know, this is a reasonable assumption.
	 */
	if (size > sizeof(long))
		align = sizeof(long long);
	else if (size > sizeof(int))
		align = sizeof(long);
	else if (size > sizeof(short))
		align = sizeof(int);
	else if (size > sizeof(char))
		align = sizeof(short);
	else
		return ptr;

	/* distance of the pointer past the previous 'align' boundary */
	r = addr % align;

	if (r == 0)
		return ptr;

	return (void *)(addr + align - r);
}
138
Alan Coxda9bb1d2006-01-18 17:44:13 -0800139/**
140 * edac_mc_alloc: Allocate a struct mem_ctl_info structure
141 * @size_pvt: size of private storage needed
142 * @nr_csrows: Number of CWROWS needed for this MC
143 * @nr_chans: Number of channels for the MC
144 *
145 * Everything is kmalloc'ed as one big chunk - more efficient.
146 * Only can be used if all structures have the same lifetime - otherwise
147 * you have to allocate and initialize your own structures.
148 *
149 * Use edac_mc_free() to free mc structures allocated by this function.
150 *
151 * Returns:
152 * NULL allocation failed
153 * struct mem_ctl_info pointer
154 */
155struct mem_ctl_info *edac_mc_alloc(unsigned sz_pvt, unsigned nr_csrows,
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700156 unsigned nr_chans, int edac_index)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800157{
158 struct mem_ctl_info *mci;
159 struct csrow_info *csi, *csrow;
160 struct channel_info *chi, *chp, *chan;
161 void *pvt;
162 unsigned size;
163 int row, chn;
Doug Thompson8096cfa2007-07-19 01:50:27 -0700164 int err;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800165
166 /* Figure out the offsets of the various items from the start of an mc
167 * structure. We want the alignment of each item to be at least as
168 * stringent as what the compiler would provide if we could simply
169 * hardcode everything into a single struct.
170 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700171 mci = (struct mem_ctl_info *)0;
Douglas Thompson7391c6d2007-07-19 01:50:21 -0700172 csi = edac_align_ptr(&mci[1], sizeof(*csi));
173 chi = edac_align_ptr(&csi[nr_csrows], sizeof(*chi));
Douglas Thompsone27e3da2007-07-19 01:49:36 -0700174 pvt = edac_align_ptr(&chi[nr_chans * nr_csrows], sz_pvt);
Douglas Thompson079708b2007-07-19 01:49:58 -0700175 size = ((unsigned long)pvt) + sz_pvt;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800176
Doug Thompson8096cfa2007-07-19 01:50:27 -0700177 mci = kzalloc(size, GFP_KERNEL);
178 if (mci == NULL)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800179 return NULL;
180
181 /* Adjust pointers so they point within the memory we just allocated
182 * rather than an imaginary chunk of memory located at address 0.
183 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700184 csi = (struct csrow_info *)(((char *)mci) + ((unsigned long)csi));
185 chi = (struct channel_info *)(((char *)mci) + ((unsigned long)chi));
186 pvt = sz_pvt ? (((char *)mci) + ((unsigned long)pvt)) : NULL;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800187
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700188 /* setup index and various internal pointers */
189 mci->mc_idx = edac_index;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800190 mci->csrows = csi;
191 mci->pvt_info = pvt;
192 mci->nr_csrows = nr_csrows;
193
194 for (row = 0; row < nr_csrows; row++) {
195 csrow = &csi[row];
196 csrow->csrow_idx = row;
197 csrow->mci = mci;
198 csrow->nr_channels = nr_chans;
199 chp = &chi[row * nr_chans];
200 csrow->channels = chp;
201
202 for (chn = 0; chn < nr_chans; chn++) {
203 chan = &chp[chn];
204 chan->chan_idx = chn;
205 chan->csrow = csrow;
206 }
207 }
208
Dave Jiang81d87cb2007-07-19 01:49:52 -0700209 mci->op_state = OP_ALLOC;
210
Doug Thompson8096cfa2007-07-19 01:50:27 -0700211 /*
212 * Initialize the 'root' kobj for the edac_mc controller
213 */
214 err = edac_mc_register_sysfs_main_kobj(mci);
215 if (err) {
216 kfree(mci);
217 return NULL;
218 }
219
220 /* at this point, the root kobj is valid, and in order to
221 * 'free' the object, then the function:
222 * edac_mc_unregister_sysfs_main_kobj() must be called
223 * which will perform kobj unregistration and the actual free
224 * will occur during the kobject callback operation
225 */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800226 return mci;
227}
Dave Peterson91105402006-03-26 01:38:55 -0800228EXPORT_SYMBOL_GPL(edac_mc_alloc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800229
/**
 * edac_mc_free
 *	Release a previously allocated 'mci' structure
 * @mci: pointer to a struct mem_ctl_info structure
 *
 * The structure is not freed here directly; it is handed to
 * edac_mc_unregister_sysfs_main_kobj().
 */
void edac_mc_free(struct mem_ctl_info *mci)
{
	edac_mc_unregister_sysfs_main_kobj(mci);
}
EXPORT_SYMBOL_GPL(edac_mc_free);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800240
Doug Thompsonbce19682007-07-26 10:41:14 -0700241
242/*
243 * find_mci_by_dev
244 *
245 * scan list of controllers looking for the one that manages
246 * the 'dev' device
247 */
Doug Thompson37f04582006-06-30 01:56:07 -0700248static struct mem_ctl_info *find_mci_by_dev(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800249{
250 struct mem_ctl_info *mci;
251 struct list_head *item;
252
Dave Peterson537fba22006-03-26 01:38:40 -0800253 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800254
255 list_for_each(item, &mc_devices) {
256 mci = list_entry(item, struct mem_ctl_info, link);
257
Doug Thompson37f04582006-06-30 01:56:07 -0700258 if (mci->dev == dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800259 return mci;
260 }
261
262 return NULL;
263}
264
Dave Jiang81d87cb2007-07-19 01:49:52 -0700265/*
266 * handler for EDAC to check if NMI type handler has asserted interrupt
267 */
268static int edac_mc_assert_error_check_and_clear(void)
269{
Dave Jiang66ee2f92007-07-19 01:49:54 -0700270 int old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700271
Douglas Thompson079708b2007-07-19 01:49:58 -0700272 if (edac_op_state == EDAC_OPSTATE_POLL)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700273 return 1;
274
Dave Jiang66ee2f92007-07-19 01:49:54 -0700275 old_state = edac_err_assert;
276 edac_err_assert = 0;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700277
Dave Jiang66ee2f92007-07-19 01:49:54 -0700278 return old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700279}
280
281/*
282 * edac_mc_workq_function
283 * performs the operation scheduled by a workq request
284 */
Dave Jiang81d87cb2007-07-19 01:49:52 -0700285static void edac_mc_workq_function(struct work_struct *work_req)
286{
Jean Delvarefbeb4382009-04-13 14:40:21 -0700287 struct delayed_work *d_work = to_delayed_work(work_req);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700288 struct mem_ctl_info *mci = to_edac_mem_ctl_work(d_work);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700289
290 mutex_lock(&mem_ctls_mutex);
291
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700292 /* if this control struct has movd to offline state, we are done */
293 if (mci->op_state == OP_OFFLINE) {
294 mutex_unlock(&mem_ctls_mutex);
295 return;
296 }
297
Dave Jiang81d87cb2007-07-19 01:49:52 -0700298 /* Only poll controllers that are running polled and have a check */
299 if (edac_mc_assert_error_check_and_clear() && (mci->edac_check != NULL))
300 mci->edac_check(mci);
301
Dave Jiang81d87cb2007-07-19 01:49:52 -0700302 mutex_unlock(&mem_ctls_mutex);
303
304 /* Reschedule */
Dave Jiang4de78c62007-07-19 01:49:54 -0700305 queue_delayed_work(edac_workqueue, &mci->work,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700306 msecs_to_jiffies(edac_mc_get_poll_msec()));
Dave Jiang81d87cb2007-07-19 01:49:52 -0700307}
308
309/*
310 * edac_mc_workq_setup
311 * initialize a workq item for this mci
312 * passing in the new delay period in msec
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700313 *
314 * locking model:
315 *
316 * called with the mem_ctls_mutex held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700317 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700318static void edac_mc_workq_setup(struct mem_ctl_info *mci, unsigned msec)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700319{
320 debugf0("%s()\n", __func__);
321
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700322 /* if this instance is not in the POLL state, then simply return */
323 if (mci->op_state != OP_RUNNING_POLL)
324 return;
325
Dave Jiang81d87cb2007-07-19 01:49:52 -0700326 INIT_DELAYED_WORK(&mci->work, edac_mc_workq_function);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700327 queue_delayed_work(edac_workqueue, &mci->work, msecs_to_jiffies(msec));
328}
329
330/*
331 * edac_mc_workq_teardown
332 * stop the workq processing on this mci
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700333 *
334 * locking model:
335 *
336 * called WITHOUT lock held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700337 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700338static void edac_mc_workq_teardown(struct mem_ctl_info *mci)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700339{
340 int status;
341
Borislav Petkov00740c52010-09-26 12:42:23 +0200342 if (mci->op_state != OP_RUNNING_POLL)
343 return;
344
Doug Thompsonbce19682007-07-26 10:41:14 -0700345 status = cancel_delayed_work(&mci->work);
346 if (status == 0) {
347 debugf0("%s() not canceled, flush the queue\n",
348 __func__);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700349
Doug Thompsonbce19682007-07-26 10:41:14 -0700350 /* workq instance might be running, wait for it */
351 flush_workqueue(edac_workqueue);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700352 }
353}
354
355/*
Doug Thompsonbce19682007-07-26 10:41:14 -0700356 * edac_mc_reset_delay_period(unsigned long value)
357 *
358 * user space has updated our poll period value, need to
359 * reset our workq delays
Dave Jiang81d87cb2007-07-19 01:49:52 -0700360 */
Doug Thompsonbce19682007-07-26 10:41:14 -0700361void edac_mc_reset_delay_period(int value)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700362{
Doug Thompsonbce19682007-07-26 10:41:14 -0700363 struct mem_ctl_info *mci;
364 struct list_head *item;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700365
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700366 mutex_lock(&mem_ctls_mutex);
367
Doug Thompsonbce19682007-07-26 10:41:14 -0700368 /* scan the list and turn off all workq timers, doing so under lock
369 */
370 list_for_each(item, &mc_devices) {
371 mci = list_entry(item, struct mem_ctl_info, link);
372
373 if (mci->op_state == OP_RUNNING_POLL)
374 cancel_delayed_work(&mci->work);
375 }
376
377 mutex_unlock(&mem_ctls_mutex);
378
379
380 /* re-walk the list, and reset the poll delay */
381 mutex_lock(&mem_ctls_mutex);
382
383 list_for_each(item, &mc_devices) {
384 mci = list_entry(item, struct mem_ctl_info, link);
385
386 edac_mc_workq_setup(mci, (unsigned long) value);
387 }
Dave Jiang81d87cb2007-07-19 01:49:52 -0700388
389 mutex_unlock(&mem_ctls_mutex);
390}
391
Doug Thompsonbce19682007-07-26 10:41:14 -0700392
393
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700394/* Return 0 on success, 1 on failure.
395 * Before calling this function, caller must
396 * assign a unique value to mci->mc_idx.
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700397 *
398 * locking model:
399 *
400 * called with the mem_ctls_mutex lock held
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700401 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700402static int add_mc_to_global_list(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800403{
404 struct list_head *item, *insert_before;
405 struct mem_ctl_info *p;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800406
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700407 insert_before = &mc_devices;
408
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700409 p = find_mci_by_dev(mci->dev);
410 if (unlikely(p != NULL))
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700411 goto fail0;
412
413 list_for_each(item, &mc_devices) {
414 p = list_entry(item, struct mem_ctl_info, link);
415
416 if (p->mc_idx >= mci->mc_idx) {
417 if (unlikely(p->mc_idx == mci->mc_idx))
418 goto fail1;
419
420 insert_before = item;
421 break;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800422 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800423 }
424
425 list_add_tail_rcu(&mci->link, insert_before);
Dave Jiangc0d12172007-07-19 01:49:46 -0700426 atomic_inc(&edac_handlers);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800427 return 0;
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700428
Douglas Thompson052dfb42007-07-19 01:50:13 -0700429fail0:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700430 edac_printk(KERN_WARNING, EDAC_MC,
Kay Sievers281efb12009-01-06 14:42:57 -0800431 "%s (%s) %s %s already assigned %d\n", dev_name(p->dev),
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000432 edac_dev_name(mci), p->mod_name, p->ctl_name, p->mc_idx);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700433 return 1;
434
Douglas Thompson052dfb42007-07-19 01:50:13 -0700435fail1:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700436 edac_printk(KERN_WARNING, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700437 "bug in low-level driver: attempt to assign\n"
438 " duplicate mc_idx %d in %s()\n", p->mc_idx, __func__);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700439 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800440}
441
Dave Petersone7ecd892006-03-26 01:38:52 -0800442static void complete_mc_list_del(struct rcu_head *head)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800443{
444 struct mem_ctl_info *mci;
445
446 mci = container_of(head, struct mem_ctl_info, rcu);
447 INIT_LIST_HEAD(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800448}
449
Dave Petersone7ecd892006-03-26 01:38:52 -0800450static void del_mc_from_global_list(struct mem_ctl_info *mci)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800451{
Dave Jiangc0d12172007-07-19 01:49:46 -0700452 atomic_dec(&edac_handlers);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800453 list_del_rcu(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800454 call_rcu(&mci->rcu, complete_mc_list_del);
Jesper Dangaard Brouer458e5ff2009-09-23 15:57:29 -0700455 rcu_barrier();
Dave Petersona1d03fc2006-03-26 01:38:46 -0800456}
457
Alan Coxda9bb1d2006-01-18 17:44:13 -0800458/**
Douglas Thompson5da08312007-07-19 01:49:31 -0700459 * edac_mc_find: Search for a mem_ctl_info structure whose index is 'idx'.
460 *
461 * If found, return a pointer to the structure.
462 * Else return NULL.
463 *
464 * Caller must hold mem_ctls_mutex.
465 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700466struct mem_ctl_info *edac_mc_find(int idx)
Douglas Thompson5da08312007-07-19 01:49:31 -0700467{
468 struct list_head *item;
469 struct mem_ctl_info *mci;
470
471 list_for_each(item, &mc_devices) {
472 mci = list_entry(item, struct mem_ctl_info, link);
473
474 if (mci->mc_idx >= idx) {
475 if (mci->mc_idx == idx)
476 return mci;
477
478 break;
479 }
480 }
481
482 return NULL;
483}
484EXPORT_SYMBOL(edac_mc_find);
485
486/**
Dave Peterson472678e2006-03-26 01:38:49 -0800487 * edac_mc_add_mc: Insert the 'mci' structure into the mci global list and
488 * create sysfs entries associated with mci structure
Alan Coxda9bb1d2006-01-18 17:44:13 -0800489 * @mci: pointer to the mci structure to be added to the list
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700490 * @mc_idx: A unique numeric identifier to be assigned to the 'mci' structure.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800491 *
492 * Return:
493 * 0 Success
494 * !0 Failure
495 */
496
497/* FIXME - should a warning be printed if no error detection? correction? */
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700498int edac_mc_add_mc(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800499{
Dave Peterson537fba22006-03-26 01:38:40 -0800500 debugf0("%s()\n", __func__);
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700501
Alan Coxda9bb1d2006-01-18 17:44:13 -0800502#ifdef CONFIG_EDAC_DEBUG
503 if (edac_debug_level >= 3)
504 edac_mc_dump_mci(mci);
Dave Petersone7ecd892006-03-26 01:38:52 -0800505
Alan Coxda9bb1d2006-01-18 17:44:13 -0800506 if (edac_debug_level >= 4) {
507 int i;
508
509 for (i = 0; i < mci->nr_csrows; i++) {
510 int j;
Dave Petersone7ecd892006-03-26 01:38:52 -0800511
Alan Coxda9bb1d2006-01-18 17:44:13 -0800512 edac_mc_dump_csrow(&mci->csrows[i]);
513 for (j = 0; j < mci->csrows[i].nr_channels; j++)
Douglas Thompson079708b2007-07-19 01:49:58 -0700514 edac_mc_dump_channel(&mci->csrows[i].
Douglas Thompson052dfb42007-07-19 01:50:13 -0700515 channels[j]);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800516 }
517 }
518#endif
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700519 mutex_lock(&mem_ctls_mutex);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800520
521 if (add_mc_to_global_list(mci))
Dave Peterson028a7b62006-03-26 01:38:47 -0800522 goto fail0;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800523
524 /* set load time so that error rate can be tracked */
525 mci->start_time = jiffies;
526
eric wollesen9794f332007-02-12 00:53:08 -0800527 if (edac_create_sysfs_mci_device(mci)) {
528 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700529 "failed to create sysfs device\n");
eric wollesen9794f332007-02-12 00:53:08 -0800530 goto fail1;
531 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800532
Dave Jiang81d87cb2007-07-19 01:49:52 -0700533 /* If there IS a check routine, then we are running POLLED */
534 if (mci->edac_check != NULL) {
535 /* This instance is NOW RUNNING */
536 mci->op_state = OP_RUNNING_POLL;
537
538 edac_mc_workq_setup(mci, edac_mc_get_poll_msec());
539 } else {
540 mci->op_state = OP_RUNNING_INTERRUPT;
541 }
542
Alan Coxda9bb1d2006-01-18 17:44:13 -0800543 /* Report action taken */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700544 edac_mc_printk(mci, KERN_INFO, "Giving out device to '%s' '%s':"
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000545 " DEV %s\n", mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Alan Coxda9bb1d2006-01-18 17:44:13 -0800546
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700547 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800548 return 0;
549
Douglas Thompson052dfb42007-07-19 01:50:13 -0700550fail1:
Dave Peterson028a7b62006-03-26 01:38:47 -0800551 del_mc_from_global_list(mci);
552
Douglas Thompson052dfb42007-07-19 01:50:13 -0700553fail0:
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700554 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800555 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800556}
Dave Peterson91105402006-03-26 01:38:55 -0800557EXPORT_SYMBOL_GPL(edac_mc_add_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800558
Alan Coxda9bb1d2006-01-18 17:44:13 -0800559/**
Dave Peterson472678e2006-03-26 01:38:49 -0800560 * edac_mc_del_mc: Remove sysfs entries for specified mci structure and
561 * remove mci structure from global list
Doug Thompson37f04582006-06-30 01:56:07 -0700562 * @pdev: Pointer to 'struct device' representing mci structure to remove.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800563 *
Dave Peterson18dbc332006-03-26 01:38:50 -0800564 * Return pointer to removed mci structure, or NULL if device not found.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800565 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700566struct mem_ctl_info *edac_mc_del_mc(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800567{
Dave Peterson18dbc332006-03-26 01:38:50 -0800568 struct mem_ctl_info *mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800569
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700570 debugf0("%s()\n", __func__);
571
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700572 mutex_lock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800573
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700574 /* find the requested mci struct in the global list */
575 mci = find_mci_by_dev(dev);
576 if (mci == NULL) {
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700577 mutex_unlock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800578 return NULL;
579 }
580
Dave Jiang81d87cb2007-07-19 01:49:52 -0700581 /* marking MCI offline */
582 mci->op_state = OP_OFFLINE;
583
Alan Coxda9bb1d2006-01-18 17:44:13 -0800584 del_mc_from_global_list(mci);
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700585 mutex_unlock(&mem_ctls_mutex);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700586
587 /* flush workq processes and remove sysfs */
588 edac_mc_workq_teardown(mci);
589 edac_remove_sysfs_mci_device(mci);
590
Dave Peterson537fba22006-03-26 01:38:40 -0800591 edac_printk(KERN_INFO, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700592 "Removed device %d for %s %s: DEV %s\n", mci->mc_idx,
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000593 mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700594
Dave Peterson18dbc332006-03-26 01:38:50 -0800595 return mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800596}
Dave Peterson91105402006-03-26 01:38:55 -0800597EXPORT_SYMBOL_GPL(edac_mc_del_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800598
Adrian Bunk2da1c112007-07-19 01:49:32 -0700599static void edac_mc_scrub_block(unsigned long page, unsigned long offset,
600 u32 size)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800601{
602 struct page *pg;
603 void *virt_addr;
604 unsigned long flags = 0;
605
Dave Peterson537fba22006-03-26 01:38:40 -0800606 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800607
608 /* ECC error page was not in our memory. Ignore it. */
Douglas Thompson079708b2007-07-19 01:49:58 -0700609 if (!pfn_valid(page))
Alan Coxda9bb1d2006-01-18 17:44:13 -0800610 return;
611
612 /* Find the actual page structure then map it and fix */
613 pg = pfn_to_page(page);
614
615 if (PageHighMem(pg))
616 local_irq_save(flags);
617
618 virt_addr = kmap_atomic(pg, KM_BOUNCE_READ);
619
620 /* Perform architecture specific atomic scrub operation */
621 atomic_scrub(virt_addr + offset, size);
622
623 /* Unmap and complete */
624 kunmap_atomic(virt_addr, KM_BOUNCE_READ);
625
626 if (PageHighMem(pg))
627 local_irq_restore(flags);
628}
629
Alan Coxda9bb1d2006-01-18 17:44:13 -0800630/* FIXME - should return -1 */
Dave Petersone7ecd892006-03-26 01:38:52 -0800631int edac_mc_find_csrow_by_page(struct mem_ctl_info *mci, unsigned long page)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800632{
633 struct csrow_info *csrows = mci->csrows;
634 int row, i;
635
Dave Peterson537fba22006-03-26 01:38:40 -0800636 debugf1("MC%d: %s(): 0x%lx\n", mci->mc_idx, __func__, page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800637 row = -1;
638
639 for (i = 0; i < mci->nr_csrows; i++) {
640 struct csrow_info *csrow = &csrows[i];
641
642 if (csrow->nr_pages == 0)
643 continue;
644
Dave Peterson537fba22006-03-26 01:38:40 -0800645 debugf3("MC%d: %s(): first(0x%lx) page(0x%lx) last(0x%lx) "
646 "mask(0x%lx)\n", mci->mc_idx, __func__,
647 csrow->first_page, page, csrow->last_page,
648 csrow->page_mask);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800649
650 if ((page >= csrow->first_page) &&
651 (page <= csrow->last_page) &&
652 ((page & csrow->page_mask) ==
653 (csrow->first_page & csrow->page_mask))) {
654 row = i;
655 break;
656 }
657 }
658
659 if (row == -1)
Dave Peterson537fba22006-03-26 01:38:40 -0800660 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700661 "could not look up page error address %lx\n",
662 (unsigned long)page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800663
664 return row;
665}
Dave Peterson91105402006-03-26 01:38:55 -0800666EXPORT_SYMBOL_GPL(edac_mc_find_csrow_by_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800667
Alan Coxda9bb1d2006-01-18 17:44:13 -0800668/* FIXME - setable log (warning/emerg) levels */
669/* FIXME - integrate with evlog: http://evlog.sourceforge.net/ */
670void edac_mc_handle_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700671 unsigned long page_frame_number,
672 unsigned long offset_in_page, unsigned long syndrome,
673 int row, int channel, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800674{
675 unsigned long remapped_page;
676
Dave Peterson537fba22006-03-26 01:38:40 -0800677 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800678
679 /* FIXME - maybe make panic on INTERNAL ERROR an option */
680 if (row >= mci->nr_csrows || row < 0) {
681 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800682 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700683 "INTERNAL ERROR: row out of range "
684 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800685 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
686 return;
687 }
Dave Petersone7ecd892006-03-26 01:38:52 -0800688
Alan Coxda9bb1d2006-01-18 17:44:13 -0800689 if (channel >= mci->csrows[row].nr_channels || channel < 0) {
690 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800691 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700692 "INTERNAL ERROR: channel out of range "
693 "(%d >= %d)\n", channel,
694 mci->csrows[row].nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800695 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
696 return;
697 }
698
Dave Jiang4de78c62007-07-19 01:49:54 -0700699 if (edac_mc_get_log_ce())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800700 /* FIXME - put in DIMM location */
Dave Peterson537fba22006-03-26 01:38:40 -0800701 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700702 "CE page 0x%lx, offset 0x%lx, grain %d, syndrome "
703 "0x%lx, row %d, channel %d, label \"%s\": %s\n",
704 page_frame_number, offset_in_page,
705 mci->csrows[row].grain, syndrome, row, channel,
706 mci->csrows[row].channels[channel].label, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800707
708 mci->ce_count++;
709 mci->csrows[row].ce_count++;
710 mci->csrows[row].channels[channel].ce_count++;
711
712 if (mci->scrub_mode & SCRUB_SW_SRC) {
713 /*
714 * Some MC's can remap memory so that it is still available
715 * at a different address when PCI devices map into memory.
716 * MC's that can't do this lose the memory where PCI devices
717 * are mapped. This mapping is MC dependant and so we call
718 * back into the MC driver for it to map the MC page to
719 * a physical (CPU) page which can then be mapped to a virtual
720 * page - which can then be scrubbed.
721 */
722 remapped_page = mci->ctl_page_to_phys ?
Douglas Thompson052dfb42007-07-19 01:50:13 -0700723 mci->ctl_page_to_phys(mci, page_frame_number) :
724 page_frame_number;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800725
726 edac_mc_scrub_block(remapped_page, offset_in_page,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700727 mci->csrows[row].grain);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800728 }
729}
Dave Peterson91105402006-03-26 01:38:55 -0800730EXPORT_SYMBOL_GPL(edac_mc_handle_ce);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800731
Dave Petersone7ecd892006-03-26 01:38:52 -0800732void edac_mc_handle_ce_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800733{
Dave Jiang4de78c62007-07-19 01:49:54 -0700734 if (edac_mc_get_log_ce())
Dave Peterson537fba22006-03-26 01:38:40 -0800735 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700736 "CE - no information available: %s\n", msg);
Dave Petersone7ecd892006-03-26 01:38:52 -0800737
Alan Coxda9bb1d2006-01-18 17:44:13 -0800738 mci->ce_noinfo_count++;
739 mci->ce_count++;
740}
Dave Peterson91105402006-03-26 01:38:55 -0800741EXPORT_SYMBOL_GPL(edac_mc_handle_ce_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800742
Alan Coxda9bb1d2006-01-18 17:44:13 -0800743void edac_mc_handle_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700744 unsigned long page_frame_number,
745 unsigned long offset_in_page, int row, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800746{
747 int len = EDAC_MC_LABEL_LEN * 4;
748 char labels[len + 1];
749 char *pos = labels;
750 int chan;
751 int chars;
752
Dave Peterson537fba22006-03-26 01:38:40 -0800753 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800754
755 /* FIXME - maybe make panic on INTERNAL ERROR an option */
756 if (row >= mci->nr_csrows || row < 0) {
757 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800758 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700759 "INTERNAL ERROR: row out of range "
760 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800761 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
762 return;
763 }
764
765 chars = snprintf(pos, len + 1, "%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700766 mci->csrows[row].channels[0].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800767 len -= chars;
768 pos += chars;
Dave Petersone7ecd892006-03-26 01:38:52 -0800769
Alan Coxda9bb1d2006-01-18 17:44:13 -0800770 for (chan = 1; (chan < mci->csrows[row].nr_channels) && (len > 0);
Douglas Thompson052dfb42007-07-19 01:50:13 -0700771 chan++) {
Alan Coxda9bb1d2006-01-18 17:44:13 -0800772 chars = snprintf(pos, len + 1, ":%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700773 mci->csrows[row].channels[chan].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800774 len -= chars;
775 pos += chars;
776 }
777
Dave Jiang4de78c62007-07-19 01:49:54 -0700778 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800779 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700780 "UE page 0x%lx, offset 0x%lx, grain %d, row %d, "
781 "labels \"%s\": %s\n", page_frame_number,
782 offset_in_page, mci->csrows[row].grain, row,
783 labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800784
Dave Jiang4de78c62007-07-19 01:49:54 -0700785 if (edac_mc_get_panic_on_ue())
Dave Petersone7ecd892006-03-26 01:38:52 -0800786 panic("EDAC MC%d: UE page 0x%lx, offset 0x%lx, grain %d, "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700787 "row %d, labels \"%s\": %s\n", mci->mc_idx,
788 page_frame_number, offset_in_page,
789 mci->csrows[row].grain, row, labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800790
791 mci->ue_count++;
792 mci->csrows[row].ue_count++;
793}
Dave Peterson91105402006-03-26 01:38:55 -0800794EXPORT_SYMBOL_GPL(edac_mc_handle_ue);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800795
Dave Petersone7ecd892006-03-26 01:38:52 -0800796void edac_mc_handle_ue_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800797{
Dave Jiang4de78c62007-07-19 01:49:54 -0700798 if (edac_mc_get_panic_on_ue())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800799 panic("EDAC MC%d: Uncorrected Error", mci->mc_idx);
800
Dave Jiang4de78c62007-07-19 01:49:54 -0700801 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800802 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700803 "UE - no information available: %s\n", msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800804 mci->ue_noinfo_count++;
805 mci->ue_count++;
806}
Douglas Thompson079708b2007-07-19 01:49:58 -0700807EXPORT_SYMBOL_GPL(edac_mc_handle_ue_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800808
eric wollesen9794f332007-02-12 00:53:08 -0800809/*************************************************************
810 * On Fully Buffered DIMM modules, this help function is
811 * called to process UE events
812 */
813void edac_mc_handle_fbd_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700814 unsigned int csrow,
815 unsigned int channela,
816 unsigned int channelb, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800817{
818 int len = EDAC_MC_LABEL_LEN * 4;
819 char labels[len + 1];
820 char *pos = labels;
821 int chars;
822
823 if (csrow >= mci->nr_csrows) {
824 /* something is wrong */
825 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700826 "INTERNAL ERROR: row out of range (%d >= %d)\n",
827 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800828 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
829 return;
830 }
831
832 if (channela >= mci->csrows[csrow].nr_channels) {
833 /* something is wrong */
834 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700835 "INTERNAL ERROR: channel-a out of range "
836 "(%d >= %d)\n",
837 channela, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800838 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
839 return;
840 }
841
842 if (channelb >= mci->csrows[csrow].nr_channels) {
843 /* something is wrong */
844 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700845 "INTERNAL ERROR: channel-b out of range "
846 "(%d >= %d)\n",
847 channelb, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800848 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
849 return;
850 }
851
852 mci->ue_count++;
853 mci->csrows[csrow].ue_count++;
854
855 /* Generate the DIMM labels from the specified channels */
856 chars = snprintf(pos, len + 1, "%s",
857 mci->csrows[csrow].channels[channela].label);
Douglas Thompson079708b2007-07-19 01:49:58 -0700858 len -= chars;
859 pos += chars;
eric wollesen9794f332007-02-12 00:53:08 -0800860 chars = snprintf(pos, len + 1, "-%s",
861 mci->csrows[csrow].channels[channelb].label);
862
Dave Jiang4de78c62007-07-19 01:49:54 -0700863 if (edac_mc_get_log_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800864 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700865 "UE row %d, channel-a= %d channel-b= %d "
866 "labels \"%s\": %s\n", csrow, channela, channelb,
867 labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800868
Dave Jiang4de78c62007-07-19 01:49:54 -0700869 if (edac_mc_get_panic_on_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800870 panic("UE row %d, channel-a= %d channel-b= %d "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700871 "labels \"%s\": %s\n", csrow, channela,
872 channelb, labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800873}
874EXPORT_SYMBOL(edac_mc_handle_fbd_ue);
875
876/*************************************************************
877 * On Fully Buffered DIMM modules, this help function is
878 * called to process CE events
879 */
880void edac_mc_handle_fbd_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700881 unsigned int csrow, unsigned int channel, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800882{
883
884 /* Ensure boundary values */
885 if (csrow >= mci->nr_csrows) {
886 /* something is wrong */
887 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700888 "INTERNAL ERROR: row out of range (%d >= %d)\n",
889 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800890 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
891 return;
892 }
893 if (channel >= mci->csrows[csrow].nr_channels) {
894 /* something is wrong */
895 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700896 "INTERNAL ERROR: channel out of range (%d >= %d)\n",
897 channel, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800898 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
899 return;
900 }
901
Dave Jiang4de78c62007-07-19 01:49:54 -0700902 if (edac_mc_get_log_ce())
eric wollesen9794f332007-02-12 00:53:08 -0800903 /* FIXME - put in DIMM location */
904 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700905 "CE row %d, channel %d, label \"%s\": %s\n",
906 csrow, channel,
907 mci->csrows[csrow].channels[channel].label, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800908
909 mci->ce_count++;
910 mci->csrows[csrow].ce_count++;
911 mci->csrows[csrow].channels[channel].ce_count++;
912}
Douglas Thompson079708b2007-07-19 01:49:58 -0700913EXPORT_SYMBOL(edac_mc_handle_fbd_ce);