blob: feef7733fae7702733feb642bfcf0ac7c431f484 [file] [log] [blame]
Alan Coxda9bb1d2006-01-18 17:44:13 -08001/*
2 * edac_mc kernel module
Doug Thompson49c0dab72006-07-10 04:45:19 -07003 * (C) 2005, 2006 Linux Networx (http://lnxi.com)
Alan Coxda9bb1d2006-01-18 17:44:13 -08004 * This file may be distributed under the terms of the
5 * GNU General Public License.
6 *
7 * Written by Thayne Harbaugh
8 * Based on work by Dan Hollis <goemon at anime dot net> and others.
9 * http://www.anime.net/~goemon/linux-ecc/
10 *
11 * Modified by Dave Peterson and Doug Thompson
12 *
13 */
14
Alan Coxda9bb1d2006-01-18 17:44:13 -080015#include <linux/module.h>
16#include <linux/proc_fs.h>
17#include <linux/kernel.h>
18#include <linux/types.h>
19#include <linux/smp.h>
20#include <linux/init.h>
21#include <linux/sysctl.h>
22#include <linux/highmem.h>
23#include <linux/timer.h>
24#include <linux/slab.h>
25#include <linux/jiffies.h>
26#include <linux/spinlock.h>
27#include <linux/list.h>
Alan Coxda9bb1d2006-01-18 17:44:13 -080028#include <linux/ctype.h>
Dave Jiangc0d12172007-07-19 01:49:46 -070029#include <linux/edac.h>
Alan Coxda9bb1d2006-01-18 17:44:13 -080030#include <asm/uaccess.h>
31#include <asm/page.h>
32#include <asm/edac.h>
Douglas Thompson20bcb7a2007-07-19 01:49:47 -070033#include "edac_core.h"
Douglas Thompson7c9281d2007-07-19 01:49:33 -070034#include "edac_module.h"
Alan Coxda9bb1d2006-01-18 17:44:13 -080035
Alan Coxda9bb1d2006-01-18 17:44:13 -080036/* lock to memory controller's control array */
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -070037static DEFINE_MUTEX(mem_ctls_mutex);
Robert P. J. Dayff6ac2a2008-04-29 01:03:17 -070038static LIST_HEAD(mc_devices);
Alan Coxda9bb1d2006-01-18 17:44:13 -080039
Alan Coxda9bb1d2006-01-18 17:44:13 -080040#ifdef CONFIG_EDAC_DEBUG
41
Mauro Carvalho Chehaba4b4be32012-01-27 10:26:13 -030042static void edac_mc_dump_channel(struct rank_info *chan)
Alan Coxda9bb1d2006-01-18 17:44:13 -080043{
44 debugf4("\tchannel = %p\n", chan);
45 debugf4("\tchannel->chan_idx = %d\n", chan->chan_idx);
46 debugf4("\tchannel->ce_count = %d\n", chan->ce_count);
47 debugf4("\tchannel->label = '%s'\n", chan->label);
48 debugf4("\tchannel->csrow = %p\n\n", chan->csrow);
49}
50
Adrian Bunk2da1c112007-07-19 01:49:32 -070051static void edac_mc_dump_csrow(struct csrow_info *csrow)
Alan Coxda9bb1d2006-01-18 17:44:13 -080052{
53 debugf4("\tcsrow = %p\n", csrow);
54 debugf4("\tcsrow->csrow_idx = %d\n", csrow->csrow_idx);
Douglas Thompson079708b2007-07-19 01:49:58 -070055 debugf4("\tcsrow->first_page = 0x%lx\n", csrow->first_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -080056 debugf4("\tcsrow->last_page = 0x%lx\n", csrow->last_page);
57 debugf4("\tcsrow->page_mask = 0x%lx\n", csrow->page_mask);
58 debugf4("\tcsrow->nr_pages = 0x%x\n", csrow->nr_pages);
Douglas Thompson079708b2007-07-19 01:49:58 -070059 debugf4("\tcsrow->nr_channels = %d\n", csrow->nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -080060 debugf4("\tcsrow->channels = %p\n", csrow->channels);
61 debugf4("\tcsrow->mci = %p\n\n", csrow->mci);
62}
63
Adrian Bunk2da1c112007-07-19 01:49:32 -070064static void edac_mc_dump_mci(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -080065{
66 debugf3("\tmci = %p\n", mci);
67 debugf3("\tmci->mtype_cap = %lx\n", mci->mtype_cap);
68 debugf3("\tmci->edac_ctl_cap = %lx\n", mci->edac_ctl_cap);
69 debugf3("\tmci->edac_cap = %lx\n", mci->edac_cap);
70 debugf4("\tmci->edac_check = %p\n", mci->edac_check);
71 debugf3("\tmci->nr_csrows = %d, csrows = %p\n",
72 mci->nr_csrows, mci->csrows);
Doug Thompson37f04582006-06-30 01:56:07 -070073 debugf3("\tdev = %p\n", mci->dev);
Douglas Thompson079708b2007-07-19 01:49:58 -070074 debugf3("\tmod_name:ctl_name = %s:%s\n", mci->mod_name, mci->ctl_name);
Alan Coxda9bb1d2006-01-18 17:44:13 -080075 debugf3("\tpvt_info = %p\n\n", mci->pvt_info);
76}
77
Borislav Petkov24f9a7f2010-10-07 18:29:15 +020078#endif /* CONFIG_EDAC_DEBUG */
79
/*
 * Human-readable names for memory types.
 *
 * The table is positional: entry N must describe the N-th value of
 * enum mem_type, so any change to that enum needs a matching change here.
 */
const char *edac_mem_types[] = {
	/*  0 */ "Empty csrow",
	/*  1 */ "Reserved csrow type",
	/*  2 */ "Unknown csrow type",
	/*  3 */ "Fast page mode RAM",
	/*  4 */ "Extended data out RAM",
	/*  5 */ "Burst Extended data out RAM",
	/*  6 */ "Single data rate SDRAM",
	/*  7 */ "Registered single data rate SDRAM",
	/*  8 */ "Double data rate SDRAM",
	/*  9 */ "Registered Double data rate SDRAM",
	/* 10 */ "Rambus DRAM",
	/* 11 */ "Unbuffered DDR2 RAM",
	/* 12 */ "Fully buffered DDR2",
	/* 13 */ "Registered DDR2 RAM",
	/* 14 */ "Rambus XDR",
	/* 15 */ "Unbuffered DDR3 RAM",
	/* 16 */ "Registered DDR3 RAM",
};
102EXPORT_SYMBOL_GPL(edac_mem_types);
103
/*
 * edac_align_ptr - round a pointer up to the alignment suited to an item
 * @ptr:  possibly unaligned address (or offset from address 0) at which an
 *        item X with sizeof(X) == @size is about to be placed
 * @size: size in bytes of that item
 *
 * The required alignment is derived from @size: items larger than a long
 * get "long long" alignment, larger than an int get "long" alignment, and
 * so on down to single bytes, which need no alignment at all.  Here we
 * assume that the alignment of a "long long" is the most stringent
 * alignment that the compiler will ever provide by default.
 *
 * Returns @ptr itself when it is already suitably aligned, otherwise the
 * next higher address that is.
 *
 * Note: the padding must be computed from the misalignment of @ptr, not
 * from @size.  Deriving it from "size % align" leaves a misaligned pointer
 * untouched whenever @size happens to be a multiple of the alignment.
 */
void *edac_align_ptr(void *ptr, unsigned size)
{
	unsigned long addr = (unsigned long)ptr;
	unsigned long r;
	unsigned align;

	if (size > sizeof(long))
		align = sizeof(long long);
	else if (size > sizeof(int))
		align = sizeof(long);
	else if (size > sizeof(short))
		align = sizeof(int);
	else if (size > sizeof(char))
		align = sizeof(short);
	else
		return ptr;	/* byte-sized (or empty) items fit anywhere */

	/* how far past the previous aligned boundary does ptr sit? */
	r = addr % align;
	if (r == 0)
		return ptr;

	/* bump up to the next aligned boundary */
	return (void *)(addr + align - r);
}
137
Alan Coxda9bb1d2006-01-18 17:44:13 -0800138/**
139 * edac_mc_alloc: Allocate a struct mem_ctl_info structure
140 * @size_pvt: size of private storage needed
141 * @nr_csrows: Number of CWROWS needed for this MC
142 * @nr_chans: Number of channels for the MC
143 *
144 * Everything is kmalloc'ed as one big chunk - more efficient.
145 * Only can be used if all structures have the same lifetime - otherwise
146 * you have to allocate and initialize your own structures.
147 *
148 * Use edac_mc_free() to free mc structures allocated by this function.
149 *
150 * Returns:
151 * NULL allocation failed
152 * struct mem_ctl_info pointer
153 */
154struct mem_ctl_info *edac_mc_alloc(unsigned sz_pvt, unsigned nr_csrows,
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700155 unsigned nr_chans, int edac_index)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800156{
157 struct mem_ctl_info *mci;
158 struct csrow_info *csi, *csrow;
Mauro Carvalho Chehaba4b4be32012-01-27 10:26:13 -0300159 struct rank_info *chi, *chp, *chan;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800160 void *pvt;
161 unsigned size;
162 int row, chn;
Doug Thompson8096cfa2007-07-19 01:50:27 -0700163 int err;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800164
165 /* Figure out the offsets of the various items from the start of an mc
166 * structure. We want the alignment of each item to be at least as
167 * stringent as what the compiler would provide if we could simply
168 * hardcode everything into a single struct.
169 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700170 mci = (struct mem_ctl_info *)0;
Douglas Thompson7391c6d2007-07-19 01:50:21 -0700171 csi = edac_align_ptr(&mci[1], sizeof(*csi));
172 chi = edac_align_ptr(&csi[nr_csrows], sizeof(*chi));
Douglas Thompsone27e3da2007-07-19 01:49:36 -0700173 pvt = edac_align_ptr(&chi[nr_chans * nr_csrows], sz_pvt);
Douglas Thompson079708b2007-07-19 01:49:58 -0700174 size = ((unsigned long)pvt) + sz_pvt;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800175
Doug Thompson8096cfa2007-07-19 01:50:27 -0700176 mci = kzalloc(size, GFP_KERNEL);
177 if (mci == NULL)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800178 return NULL;
179
180 /* Adjust pointers so they point within the memory we just allocated
181 * rather than an imaginary chunk of memory located at address 0.
182 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700183 csi = (struct csrow_info *)(((char *)mci) + ((unsigned long)csi));
Mauro Carvalho Chehaba4b4be32012-01-27 10:26:13 -0300184 chi = (struct rank_info *)(((char *)mci) + ((unsigned long)chi));
Douglas Thompson079708b2007-07-19 01:49:58 -0700185 pvt = sz_pvt ? (((char *)mci) + ((unsigned long)pvt)) : NULL;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800186
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700187 /* setup index and various internal pointers */
188 mci->mc_idx = edac_index;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800189 mci->csrows = csi;
190 mci->pvt_info = pvt;
191 mci->nr_csrows = nr_csrows;
192
193 for (row = 0; row < nr_csrows; row++) {
194 csrow = &csi[row];
195 csrow->csrow_idx = row;
196 csrow->mci = mci;
197 csrow->nr_channels = nr_chans;
198 chp = &chi[row * nr_chans];
199 csrow->channels = chp;
200
201 for (chn = 0; chn < nr_chans; chn++) {
202 chan = &chp[chn];
203 chan->chan_idx = chn;
204 chan->csrow = csrow;
205 }
206 }
207
Dave Jiang81d87cb2007-07-19 01:49:52 -0700208 mci->op_state = OP_ALLOC;
Mauro Carvalho Chehab6fe11082010-08-12 00:30:25 -0300209 INIT_LIST_HEAD(&mci->grp_kobj_list);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700210
Doug Thompson8096cfa2007-07-19 01:50:27 -0700211 /*
212 * Initialize the 'root' kobj for the edac_mc controller
213 */
214 err = edac_mc_register_sysfs_main_kobj(mci);
215 if (err) {
216 kfree(mci);
217 return NULL;
218 }
219
220 /* at this point, the root kobj is valid, and in order to
221 * 'free' the object, then the function:
222 * edac_mc_unregister_sysfs_main_kobj() must be called
223 * which will perform kobj unregistration and the actual free
224 * will occur during the kobject callback operation
225 */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800226 return mci;
227}
Dave Peterson91105402006-03-26 01:38:55 -0800228EXPORT_SYMBOL_GPL(edac_mc_alloc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800229
/**
 * edac_mc_free
 *	Release an 'mci' structure: unregister its main sysfs kobject,
 *	then free the memory backing the structure.
 * @mci: pointer to a struct mem_ctl_info structure
 */
void edac_mc_free(struct mem_ctl_info *mci)
{
	debugf1("%s()\n", __func__);

	/* drop the root kobj first ... */
	edac_mc_unregister_sysfs_main_kobj(mci);

	/* ... then give the mci instance memory back */
	kfree(mci);
}
EXPORT_SYMBOL_GPL(edac_mc_free);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800245
Doug Thompsonbce19682007-07-26 10:41:14 -0700246
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300247/**
Doug Thompsonbce19682007-07-26 10:41:14 -0700248 * find_mci_by_dev
249 *
250 * scan list of controllers looking for the one that manages
251 * the 'dev' device
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300252 * @dev: pointer to a struct device related with the MCI
Doug Thompsonbce19682007-07-26 10:41:14 -0700253 */
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300254struct mem_ctl_info *find_mci_by_dev(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800255{
256 struct mem_ctl_info *mci;
257 struct list_head *item;
258
Dave Peterson537fba22006-03-26 01:38:40 -0800259 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800260
261 list_for_each(item, &mc_devices) {
262 mci = list_entry(item, struct mem_ctl_info, link);
263
Doug Thompson37f04582006-06-30 01:56:07 -0700264 if (mci->dev == dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800265 return mci;
266 }
267
268 return NULL;
269}
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300270EXPORT_SYMBOL_GPL(find_mci_by_dev);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800271
Dave Jiang81d87cb2007-07-19 01:49:52 -0700272/*
273 * handler for EDAC to check if NMI type handler has asserted interrupt
274 */
275static int edac_mc_assert_error_check_and_clear(void)
276{
Dave Jiang66ee2f92007-07-19 01:49:54 -0700277 int old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700278
Douglas Thompson079708b2007-07-19 01:49:58 -0700279 if (edac_op_state == EDAC_OPSTATE_POLL)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700280 return 1;
281
Dave Jiang66ee2f92007-07-19 01:49:54 -0700282 old_state = edac_err_assert;
283 edac_err_assert = 0;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700284
Dave Jiang66ee2f92007-07-19 01:49:54 -0700285 return old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700286}
287
288/*
289 * edac_mc_workq_function
290 * performs the operation scheduled by a workq request
291 */
Dave Jiang81d87cb2007-07-19 01:49:52 -0700292static void edac_mc_workq_function(struct work_struct *work_req)
293{
Jean Delvarefbeb4382009-04-13 14:40:21 -0700294 struct delayed_work *d_work = to_delayed_work(work_req);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700295 struct mem_ctl_info *mci = to_edac_mem_ctl_work(d_work);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700296
297 mutex_lock(&mem_ctls_mutex);
298
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700299 /* if this control struct has movd to offline state, we are done */
300 if (mci->op_state == OP_OFFLINE) {
301 mutex_unlock(&mem_ctls_mutex);
302 return;
303 }
304
Dave Jiang81d87cb2007-07-19 01:49:52 -0700305 /* Only poll controllers that are running polled and have a check */
306 if (edac_mc_assert_error_check_and_clear() && (mci->edac_check != NULL))
307 mci->edac_check(mci);
308
Dave Jiang81d87cb2007-07-19 01:49:52 -0700309 mutex_unlock(&mem_ctls_mutex);
310
311 /* Reschedule */
Dave Jiang4de78c62007-07-19 01:49:54 -0700312 queue_delayed_work(edac_workqueue, &mci->work,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700313 msecs_to_jiffies(edac_mc_get_poll_msec()));
Dave Jiang81d87cb2007-07-19 01:49:52 -0700314}
315
316/*
317 * edac_mc_workq_setup
318 * initialize a workq item for this mci
319 * passing in the new delay period in msec
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700320 *
321 * locking model:
322 *
323 * called with the mem_ctls_mutex held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700324 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700325static void edac_mc_workq_setup(struct mem_ctl_info *mci, unsigned msec)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700326{
327 debugf0("%s()\n", __func__);
328
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700329 /* if this instance is not in the POLL state, then simply return */
330 if (mci->op_state != OP_RUNNING_POLL)
331 return;
332
Dave Jiang81d87cb2007-07-19 01:49:52 -0700333 INIT_DELAYED_WORK(&mci->work, edac_mc_workq_function);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700334 queue_delayed_work(edac_workqueue, &mci->work, msecs_to_jiffies(msec));
335}
336
337/*
338 * edac_mc_workq_teardown
339 * stop the workq processing on this mci
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700340 *
341 * locking model:
342 *
343 * called WITHOUT lock held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700344 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700345static void edac_mc_workq_teardown(struct mem_ctl_info *mci)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700346{
347 int status;
348
Borislav Petkov00740c52010-09-26 12:42:23 +0200349 if (mci->op_state != OP_RUNNING_POLL)
350 return;
351
Doug Thompsonbce19682007-07-26 10:41:14 -0700352 status = cancel_delayed_work(&mci->work);
353 if (status == 0) {
354 debugf0("%s() not canceled, flush the queue\n",
355 __func__);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700356
Doug Thompsonbce19682007-07-26 10:41:14 -0700357 /* workq instance might be running, wait for it */
358 flush_workqueue(edac_workqueue);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700359 }
360}
361
362/*
Doug Thompsonbce19682007-07-26 10:41:14 -0700363 * edac_mc_reset_delay_period(unsigned long value)
364 *
365 * user space has updated our poll period value, need to
366 * reset our workq delays
Dave Jiang81d87cb2007-07-19 01:49:52 -0700367 */
Doug Thompsonbce19682007-07-26 10:41:14 -0700368void edac_mc_reset_delay_period(int value)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700369{
Doug Thompsonbce19682007-07-26 10:41:14 -0700370 struct mem_ctl_info *mci;
371 struct list_head *item;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700372
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700373 mutex_lock(&mem_ctls_mutex);
374
Doug Thompsonbce19682007-07-26 10:41:14 -0700375 /* scan the list and turn off all workq timers, doing so under lock
376 */
377 list_for_each(item, &mc_devices) {
378 mci = list_entry(item, struct mem_ctl_info, link);
379
380 if (mci->op_state == OP_RUNNING_POLL)
381 cancel_delayed_work(&mci->work);
382 }
383
384 mutex_unlock(&mem_ctls_mutex);
385
386
387 /* re-walk the list, and reset the poll delay */
388 mutex_lock(&mem_ctls_mutex);
389
390 list_for_each(item, &mc_devices) {
391 mci = list_entry(item, struct mem_ctl_info, link);
392
393 edac_mc_workq_setup(mci, (unsigned long) value);
394 }
Dave Jiang81d87cb2007-07-19 01:49:52 -0700395
396 mutex_unlock(&mem_ctls_mutex);
397}
398
Doug Thompsonbce19682007-07-26 10:41:14 -0700399
400
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700401/* Return 0 on success, 1 on failure.
402 * Before calling this function, caller must
403 * assign a unique value to mci->mc_idx.
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700404 *
405 * locking model:
406 *
407 * called with the mem_ctls_mutex lock held
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700408 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700409static int add_mc_to_global_list(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800410{
411 struct list_head *item, *insert_before;
412 struct mem_ctl_info *p;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800413
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700414 insert_before = &mc_devices;
415
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700416 p = find_mci_by_dev(mci->dev);
417 if (unlikely(p != NULL))
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700418 goto fail0;
419
420 list_for_each(item, &mc_devices) {
421 p = list_entry(item, struct mem_ctl_info, link);
422
423 if (p->mc_idx >= mci->mc_idx) {
424 if (unlikely(p->mc_idx == mci->mc_idx))
425 goto fail1;
426
427 insert_before = item;
428 break;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800429 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800430 }
431
432 list_add_tail_rcu(&mci->link, insert_before);
Dave Jiangc0d12172007-07-19 01:49:46 -0700433 atomic_inc(&edac_handlers);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800434 return 0;
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700435
Douglas Thompson052dfb42007-07-19 01:50:13 -0700436fail0:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700437 edac_printk(KERN_WARNING, EDAC_MC,
Kay Sievers281efb12009-01-06 14:42:57 -0800438 "%s (%s) %s %s already assigned %d\n", dev_name(p->dev),
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000439 edac_dev_name(mci), p->mod_name, p->ctl_name, p->mc_idx);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700440 return 1;
441
Douglas Thompson052dfb42007-07-19 01:50:13 -0700442fail1:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700443 edac_printk(KERN_WARNING, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700444 "bug in low-level driver: attempt to assign\n"
445 " duplicate mc_idx %d in %s()\n", p->mc_idx, __func__);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700446 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800447}
448
Dave Petersone7ecd892006-03-26 01:38:52 -0800449static void del_mc_from_global_list(struct mem_ctl_info *mci)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800450{
Dave Jiangc0d12172007-07-19 01:49:46 -0700451 atomic_dec(&edac_handlers);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800452 list_del_rcu(&mci->link);
Lai Jiangshane2e77092011-05-26 16:25:58 -0700453
454 /* these are for safe removal of devices from global list while
455 * NMI handlers may be traversing list
456 */
457 synchronize_rcu();
458 INIT_LIST_HEAD(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800459}
460
Alan Coxda9bb1d2006-01-18 17:44:13 -0800461/**
Douglas Thompson5da08312007-07-19 01:49:31 -0700462 * edac_mc_find: Search for a mem_ctl_info structure whose index is 'idx'.
463 *
464 * If found, return a pointer to the structure.
465 * Else return NULL.
466 *
467 * Caller must hold mem_ctls_mutex.
468 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700469struct mem_ctl_info *edac_mc_find(int idx)
Douglas Thompson5da08312007-07-19 01:49:31 -0700470{
471 struct list_head *item;
472 struct mem_ctl_info *mci;
473
474 list_for_each(item, &mc_devices) {
475 mci = list_entry(item, struct mem_ctl_info, link);
476
477 if (mci->mc_idx >= idx) {
478 if (mci->mc_idx == idx)
479 return mci;
480
481 break;
482 }
483 }
484
485 return NULL;
486}
487EXPORT_SYMBOL(edac_mc_find);
488
489/**
Dave Peterson472678e2006-03-26 01:38:49 -0800490 * edac_mc_add_mc: Insert the 'mci' structure into the mci global list and
491 * create sysfs entries associated with mci structure
Alan Coxda9bb1d2006-01-18 17:44:13 -0800492 * @mci: pointer to the mci structure to be added to the list
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700493 * @mc_idx: A unique numeric identifier to be assigned to the 'mci' structure.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800494 *
495 * Return:
496 * 0 Success
497 * !0 Failure
498 */
499
500/* FIXME - should a warning be printed if no error detection? correction? */
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700501int edac_mc_add_mc(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800502{
Dave Peterson537fba22006-03-26 01:38:40 -0800503 debugf0("%s()\n", __func__);
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700504
Alan Coxda9bb1d2006-01-18 17:44:13 -0800505#ifdef CONFIG_EDAC_DEBUG
506 if (edac_debug_level >= 3)
507 edac_mc_dump_mci(mci);
Dave Petersone7ecd892006-03-26 01:38:52 -0800508
Alan Coxda9bb1d2006-01-18 17:44:13 -0800509 if (edac_debug_level >= 4) {
510 int i;
511
512 for (i = 0; i < mci->nr_csrows; i++) {
513 int j;
Dave Petersone7ecd892006-03-26 01:38:52 -0800514
Alan Coxda9bb1d2006-01-18 17:44:13 -0800515 edac_mc_dump_csrow(&mci->csrows[i]);
516 for (j = 0; j < mci->csrows[i].nr_channels; j++)
Douglas Thompson079708b2007-07-19 01:49:58 -0700517 edac_mc_dump_channel(&mci->csrows[i].
Douglas Thompson052dfb42007-07-19 01:50:13 -0700518 channels[j]);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800519 }
520 }
521#endif
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700522 mutex_lock(&mem_ctls_mutex);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800523
524 if (add_mc_to_global_list(mci))
Dave Peterson028a7b62006-03-26 01:38:47 -0800525 goto fail0;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800526
527 /* set load time so that error rate can be tracked */
528 mci->start_time = jiffies;
529
eric wollesen9794f332007-02-12 00:53:08 -0800530 if (edac_create_sysfs_mci_device(mci)) {
531 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700532 "failed to create sysfs device\n");
eric wollesen9794f332007-02-12 00:53:08 -0800533 goto fail1;
534 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800535
Dave Jiang81d87cb2007-07-19 01:49:52 -0700536 /* If there IS a check routine, then we are running POLLED */
537 if (mci->edac_check != NULL) {
538 /* This instance is NOW RUNNING */
539 mci->op_state = OP_RUNNING_POLL;
540
541 edac_mc_workq_setup(mci, edac_mc_get_poll_msec());
542 } else {
543 mci->op_state = OP_RUNNING_INTERRUPT;
544 }
545
Alan Coxda9bb1d2006-01-18 17:44:13 -0800546 /* Report action taken */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700547 edac_mc_printk(mci, KERN_INFO, "Giving out device to '%s' '%s':"
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000548 " DEV %s\n", mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Alan Coxda9bb1d2006-01-18 17:44:13 -0800549
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700550 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800551 return 0;
552
Douglas Thompson052dfb42007-07-19 01:50:13 -0700553fail1:
Dave Peterson028a7b62006-03-26 01:38:47 -0800554 del_mc_from_global_list(mci);
555
Douglas Thompson052dfb42007-07-19 01:50:13 -0700556fail0:
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700557 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800558 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800559}
Dave Peterson91105402006-03-26 01:38:55 -0800560EXPORT_SYMBOL_GPL(edac_mc_add_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800561
Alan Coxda9bb1d2006-01-18 17:44:13 -0800562/**
Dave Peterson472678e2006-03-26 01:38:49 -0800563 * edac_mc_del_mc: Remove sysfs entries for specified mci structure and
564 * remove mci structure from global list
Doug Thompson37f04582006-06-30 01:56:07 -0700565 * @pdev: Pointer to 'struct device' representing mci structure to remove.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800566 *
Dave Peterson18dbc332006-03-26 01:38:50 -0800567 * Return pointer to removed mci structure, or NULL if device not found.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800568 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700569struct mem_ctl_info *edac_mc_del_mc(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800570{
Dave Peterson18dbc332006-03-26 01:38:50 -0800571 struct mem_ctl_info *mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800572
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700573 debugf0("%s()\n", __func__);
574
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700575 mutex_lock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800576
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700577 /* find the requested mci struct in the global list */
578 mci = find_mci_by_dev(dev);
579 if (mci == NULL) {
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700580 mutex_unlock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800581 return NULL;
582 }
583
Alan Coxda9bb1d2006-01-18 17:44:13 -0800584 del_mc_from_global_list(mci);
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700585 mutex_unlock(&mem_ctls_mutex);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700586
Borislav Petkovbb31b3122010-12-02 17:48:35 +0100587 /* flush workq processes */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700588 edac_mc_workq_teardown(mci);
Borislav Petkovbb31b3122010-12-02 17:48:35 +0100589
590 /* marking MCI offline */
591 mci->op_state = OP_OFFLINE;
592
593 /* remove from sysfs */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700594 edac_remove_sysfs_mci_device(mci);
595
Dave Peterson537fba22006-03-26 01:38:40 -0800596 edac_printk(KERN_INFO, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700597 "Removed device %d for %s %s: DEV %s\n", mci->mc_idx,
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000598 mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700599
Dave Peterson18dbc332006-03-26 01:38:50 -0800600 return mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800601}
Dave Peterson91105402006-03-26 01:38:55 -0800602EXPORT_SYMBOL_GPL(edac_mc_del_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800603
Adrian Bunk2da1c112007-07-19 01:49:32 -0700604static void edac_mc_scrub_block(unsigned long page, unsigned long offset,
605 u32 size)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800606{
607 struct page *pg;
608 void *virt_addr;
609 unsigned long flags = 0;
610
Dave Peterson537fba22006-03-26 01:38:40 -0800611 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800612
613 /* ECC error page was not in our memory. Ignore it. */
Douglas Thompson079708b2007-07-19 01:49:58 -0700614 if (!pfn_valid(page))
Alan Coxda9bb1d2006-01-18 17:44:13 -0800615 return;
616
617 /* Find the actual page structure then map it and fix */
618 pg = pfn_to_page(page);
619
620 if (PageHighMem(pg))
621 local_irq_save(flags);
622
Cong Wang4e5df7c2011-11-25 23:14:19 +0800623 virt_addr = kmap_atomic(pg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800624
625 /* Perform architecture specific atomic scrub operation */
626 atomic_scrub(virt_addr + offset, size);
627
628 /* Unmap and complete */
Cong Wang4e5df7c2011-11-25 23:14:19 +0800629 kunmap_atomic(virt_addr);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800630
631 if (PageHighMem(pg))
632 local_irq_restore(flags);
633}
634
Alan Coxda9bb1d2006-01-18 17:44:13 -0800635/* FIXME - should return -1 */
Dave Petersone7ecd892006-03-26 01:38:52 -0800636int edac_mc_find_csrow_by_page(struct mem_ctl_info *mci, unsigned long page)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800637{
638 struct csrow_info *csrows = mci->csrows;
639 int row, i;
640
Dave Peterson537fba22006-03-26 01:38:40 -0800641 debugf1("MC%d: %s(): 0x%lx\n", mci->mc_idx, __func__, page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800642 row = -1;
643
644 for (i = 0; i < mci->nr_csrows; i++) {
645 struct csrow_info *csrow = &csrows[i];
646
647 if (csrow->nr_pages == 0)
648 continue;
649
Dave Peterson537fba22006-03-26 01:38:40 -0800650 debugf3("MC%d: %s(): first(0x%lx) page(0x%lx) last(0x%lx) "
651 "mask(0x%lx)\n", mci->mc_idx, __func__,
652 csrow->first_page, page, csrow->last_page,
653 csrow->page_mask);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800654
655 if ((page >= csrow->first_page) &&
656 (page <= csrow->last_page) &&
657 ((page & csrow->page_mask) ==
658 (csrow->first_page & csrow->page_mask))) {
659 row = i;
660 break;
661 }
662 }
663
664 if (row == -1)
Dave Peterson537fba22006-03-26 01:38:40 -0800665 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700666 "could not look up page error address %lx\n",
667 (unsigned long)page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800668
669 return row;
670}
Dave Peterson91105402006-03-26 01:38:55 -0800671EXPORT_SYMBOL_GPL(edac_mc_find_csrow_by_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800672
Alan Coxda9bb1d2006-01-18 17:44:13 -0800673/* FIXME - setable log (warning/emerg) levels */
674/* FIXME - integrate with evlog: http://evlog.sourceforge.net/ */
675void edac_mc_handle_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700676 unsigned long page_frame_number,
677 unsigned long offset_in_page, unsigned long syndrome,
678 int row, int channel, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800679{
680 unsigned long remapped_page;
681
Dave Peterson537fba22006-03-26 01:38:40 -0800682 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800683
684 /* FIXME - maybe make panic on INTERNAL ERROR an option */
685 if (row >= mci->nr_csrows || row < 0) {
686 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800687 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700688 "INTERNAL ERROR: row out of range "
689 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800690 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
691 return;
692 }
Dave Petersone7ecd892006-03-26 01:38:52 -0800693
Alan Coxda9bb1d2006-01-18 17:44:13 -0800694 if (channel >= mci->csrows[row].nr_channels || channel < 0) {
695 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800696 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700697 "INTERNAL ERROR: channel out of range "
698 "(%d >= %d)\n", channel,
699 mci->csrows[row].nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800700 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
701 return;
702 }
703
Dave Jiang4de78c62007-07-19 01:49:54 -0700704 if (edac_mc_get_log_ce())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800705 /* FIXME - put in DIMM location */
Dave Peterson537fba22006-03-26 01:38:40 -0800706 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700707 "CE page 0x%lx, offset 0x%lx, grain %d, syndrome "
708 "0x%lx, row %d, channel %d, label \"%s\": %s\n",
709 page_frame_number, offset_in_page,
710 mci->csrows[row].grain, syndrome, row, channel,
711 mci->csrows[row].channels[channel].label, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800712
713 mci->ce_count++;
714 mci->csrows[row].ce_count++;
715 mci->csrows[row].channels[channel].ce_count++;
716
717 if (mci->scrub_mode & SCRUB_SW_SRC) {
718 /*
719 * Some MC's can remap memory so that it is still available
720 * at a different address when PCI devices map into memory.
721 * MC's that can't do this lose the memory where PCI devices
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300722 * are mapped. This mapping is MC dependent and so we call
Alan Coxda9bb1d2006-01-18 17:44:13 -0800723 * back into the MC driver for it to map the MC page to
724 * a physical (CPU) page which can then be mapped to a virtual
725 * page - which can then be scrubbed.
726 */
727 remapped_page = mci->ctl_page_to_phys ?
Douglas Thompson052dfb42007-07-19 01:50:13 -0700728 mci->ctl_page_to_phys(mci, page_frame_number) :
729 page_frame_number;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800730
731 edac_mc_scrub_block(remapped_page, offset_in_page,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700732 mci->csrows[row].grain);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800733 }
734}
Dave Peterson91105402006-03-26 01:38:55 -0800735EXPORT_SYMBOL_GPL(edac_mc_handle_ce);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800736
Dave Petersone7ecd892006-03-26 01:38:52 -0800737void edac_mc_handle_ce_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800738{
Dave Jiang4de78c62007-07-19 01:49:54 -0700739 if (edac_mc_get_log_ce())
Dave Peterson537fba22006-03-26 01:38:40 -0800740 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700741 "CE - no information available: %s\n", msg);
Dave Petersone7ecd892006-03-26 01:38:52 -0800742
Alan Coxda9bb1d2006-01-18 17:44:13 -0800743 mci->ce_noinfo_count++;
744 mci->ce_count++;
745}
Dave Peterson91105402006-03-26 01:38:55 -0800746EXPORT_SYMBOL_GPL(edac_mc_handle_ce_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800747
Alan Coxda9bb1d2006-01-18 17:44:13 -0800748void edac_mc_handle_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700749 unsigned long page_frame_number,
750 unsigned long offset_in_page, int row, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800751{
752 int len = EDAC_MC_LABEL_LEN * 4;
753 char labels[len + 1];
754 char *pos = labels;
755 int chan;
756 int chars;
757
Dave Peterson537fba22006-03-26 01:38:40 -0800758 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800759
760 /* FIXME - maybe make panic on INTERNAL ERROR an option */
761 if (row >= mci->nr_csrows || row < 0) {
762 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800763 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700764 "INTERNAL ERROR: row out of range "
765 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800766 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
767 return;
768 }
769
770 chars = snprintf(pos, len + 1, "%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700771 mci->csrows[row].channels[0].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800772 len -= chars;
773 pos += chars;
Dave Petersone7ecd892006-03-26 01:38:52 -0800774
Alan Coxda9bb1d2006-01-18 17:44:13 -0800775 for (chan = 1; (chan < mci->csrows[row].nr_channels) && (len > 0);
Douglas Thompson052dfb42007-07-19 01:50:13 -0700776 chan++) {
Alan Coxda9bb1d2006-01-18 17:44:13 -0800777 chars = snprintf(pos, len + 1, ":%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700778 mci->csrows[row].channels[chan].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800779 len -= chars;
780 pos += chars;
781 }
782
Dave Jiang4de78c62007-07-19 01:49:54 -0700783 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800784 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700785 "UE page 0x%lx, offset 0x%lx, grain %d, row %d, "
786 "labels \"%s\": %s\n", page_frame_number,
787 offset_in_page, mci->csrows[row].grain, row,
788 labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800789
Dave Jiang4de78c62007-07-19 01:49:54 -0700790 if (edac_mc_get_panic_on_ue())
Dave Petersone7ecd892006-03-26 01:38:52 -0800791 panic("EDAC MC%d: UE page 0x%lx, offset 0x%lx, grain %d, "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700792 "row %d, labels \"%s\": %s\n", mci->mc_idx,
793 page_frame_number, offset_in_page,
794 mci->csrows[row].grain, row, labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800795
796 mci->ue_count++;
797 mci->csrows[row].ue_count++;
798}
Dave Peterson91105402006-03-26 01:38:55 -0800799EXPORT_SYMBOL_GPL(edac_mc_handle_ue);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800800
Dave Petersone7ecd892006-03-26 01:38:52 -0800801void edac_mc_handle_ue_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800802{
Dave Jiang4de78c62007-07-19 01:49:54 -0700803 if (edac_mc_get_panic_on_ue())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800804 panic("EDAC MC%d: Uncorrected Error", mci->mc_idx);
805
Dave Jiang4de78c62007-07-19 01:49:54 -0700806 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800807 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700808 "UE - no information available: %s\n", msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800809 mci->ue_noinfo_count++;
810 mci->ue_count++;
811}
Douglas Thompson079708b2007-07-19 01:49:58 -0700812EXPORT_SYMBOL_GPL(edac_mc_handle_ue_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800813
eric wollesen9794f332007-02-12 00:53:08 -0800814/*************************************************************
815 * On Fully Buffered DIMM modules, this help function is
816 * called to process UE events
817 */
818void edac_mc_handle_fbd_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700819 unsigned int csrow,
820 unsigned int channela,
821 unsigned int channelb, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800822{
823 int len = EDAC_MC_LABEL_LEN * 4;
824 char labels[len + 1];
825 char *pos = labels;
826 int chars;
827
828 if (csrow >= mci->nr_csrows) {
829 /* something is wrong */
830 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700831 "INTERNAL ERROR: row out of range (%d >= %d)\n",
832 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800833 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
834 return;
835 }
836
837 if (channela >= mci->csrows[csrow].nr_channels) {
838 /* something is wrong */
839 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700840 "INTERNAL ERROR: channel-a out of range "
841 "(%d >= %d)\n",
842 channela, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800843 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
844 return;
845 }
846
847 if (channelb >= mci->csrows[csrow].nr_channels) {
848 /* something is wrong */
849 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700850 "INTERNAL ERROR: channel-b out of range "
851 "(%d >= %d)\n",
852 channelb, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800853 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
854 return;
855 }
856
857 mci->ue_count++;
858 mci->csrows[csrow].ue_count++;
859
860 /* Generate the DIMM labels from the specified channels */
861 chars = snprintf(pos, len + 1, "%s",
862 mci->csrows[csrow].channels[channela].label);
Douglas Thompson079708b2007-07-19 01:49:58 -0700863 len -= chars;
864 pos += chars;
eric wollesen9794f332007-02-12 00:53:08 -0800865 chars = snprintf(pos, len + 1, "-%s",
866 mci->csrows[csrow].channels[channelb].label);
867
Dave Jiang4de78c62007-07-19 01:49:54 -0700868 if (edac_mc_get_log_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800869 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700870 "UE row %d, channel-a= %d channel-b= %d "
871 "labels \"%s\": %s\n", csrow, channela, channelb,
872 labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800873
Dave Jiang4de78c62007-07-19 01:49:54 -0700874 if (edac_mc_get_panic_on_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800875 panic("UE row %d, channel-a= %d channel-b= %d "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700876 "labels \"%s\": %s\n", csrow, channela,
877 channelb, labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800878}
879EXPORT_SYMBOL(edac_mc_handle_fbd_ue);
880
881/*************************************************************
882 * On Fully Buffered DIMM modules, this help function is
883 * called to process CE events
884 */
885void edac_mc_handle_fbd_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700886 unsigned int csrow, unsigned int channel, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800887{
888
889 /* Ensure boundary values */
890 if (csrow >= mci->nr_csrows) {
891 /* something is wrong */
892 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700893 "INTERNAL ERROR: row out of range (%d >= %d)\n",
894 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800895 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
896 return;
897 }
898 if (channel >= mci->csrows[csrow].nr_channels) {
899 /* something is wrong */
900 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700901 "INTERNAL ERROR: channel out of range (%d >= %d)\n",
902 channel, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800903 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
904 return;
905 }
906
Dave Jiang4de78c62007-07-19 01:49:54 -0700907 if (edac_mc_get_log_ce())
eric wollesen9794f332007-02-12 00:53:08 -0800908 /* FIXME - put in DIMM location */
909 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700910 "CE row %d, channel %d, label \"%s\": %s\n",
911 csrow, channel,
912 mci->csrows[csrow].channels[channel].label, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800913
914 mci->ce_count++;
915 mci->csrows[csrow].ce_count++;
916 mci->csrows[csrow].channels[channel].ce_count++;
917}
Douglas Thompson079708b2007-07-19 01:49:58 -0700918EXPORT_SYMBOL(edac_mc_handle_fbd_ce);