blob: 6b7e723e46be5445996041a880b5d387253a9417 [file] [log] [blame]
/*
 * edac_mc kernel module
 * (C) 2005, 2006 Linux Networx (http://lnxi.com)
 * This file may be distributed under the terms of the
 * GNU General Public License.
 *
 * Written by Thayne Harbaugh
 * Based on work by Dan Hollis <goemon at anime dot net> and others.
 *	http://www.anime.net/~goemon/linux-ecc/
 *
 * Modified by Dave Peterson and Doug Thompson
 *
 */
14
Alan Coxda9bb1d2006-01-18 17:44:13 -080015#include <linux/module.h>
16#include <linux/proc_fs.h>
17#include <linux/kernel.h>
18#include <linux/types.h>
19#include <linux/smp.h>
20#include <linux/init.h>
21#include <linux/sysctl.h>
22#include <linux/highmem.h>
23#include <linux/timer.h>
24#include <linux/slab.h>
25#include <linux/jiffies.h>
26#include <linux/spinlock.h>
27#include <linux/list.h>
28#include <linux/sysdev.h>
29#include <linux/ctype.h>
Dave Jiangc0d12172007-07-19 01:49:46 -070030#include <linux/edac.h>
Alan Coxda9bb1d2006-01-18 17:44:13 -080031#include <asm/uaccess.h>
32#include <asm/page.h>
33#include <asm/edac.h>
Douglas Thompson20bcb7a2007-07-19 01:49:47 -070034#include "edac_core.h"
Douglas Thompson7c9281d2007-07-19 01:49:33 -070035#include "edac_module.h"
Alan Coxda9bb1d2006-01-18 17:44:13 -080036
/*
 * mc_devices is the global list of registered memory controllers;
 * mem_ctls_mutex is the lock taken around walks and updates of that list.
 */
static LIST_HEAD(mc_devices);
static DEFINE_MUTEX(mem_ctls_mutex);
Alan Coxda9bb1d2006-01-18 17:44:13 -080040
Alan Coxda9bb1d2006-01-18 17:44:13 -080041#ifdef CONFIG_EDAC_DEBUG
42
Adrian Bunk2da1c112007-07-19 01:49:32 -070043static void edac_mc_dump_channel(struct channel_info *chan)
Alan Coxda9bb1d2006-01-18 17:44:13 -080044{
45 debugf4("\tchannel = %p\n", chan);
46 debugf4("\tchannel->chan_idx = %d\n", chan->chan_idx);
47 debugf4("\tchannel->ce_count = %d\n", chan->ce_count);
48 debugf4("\tchannel->label = '%s'\n", chan->label);
49 debugf4("\tchannel->csrow = %p\n\n", chan->csrow);
50}
51
Adrian Bunk2da1c112007-07-19 01:49:32 -070052static void edac_mc_dump_csrow(struct csrow_info *csrow)
Alan Coxda9bb1d2006-01-18 17:44:13 -080053{
54 debugf4("\tcsrow = %p\n", csrow);
55 debugf4("\tcsrow->csrow_idx = %d\n", csrow->csrow_idx);
Douglas Thompson079708b2007-07-19 01:49:58 -070056 debugf4("\tcsrow->first_page = 0x%lx\n", csrow->first_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -080057 debugf4("\tcsrow->last_page = 0x%lx\n", csrow->last_page);
58 debugf4("\tcsrow->page_mask = 0x%lx\n", csrow->page_mask);
59 debugf4("\tcsrow->nr_pages = 0x%x\n", csrow->nr_pages);
Douglas Thompson079708b2007-07-19 01:49:58 -070060 debugf4("\tcsrow->nr_channels = %d\n", csrow->nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -080061 debugf4("\tcsrow->channels = %p\n", csrow->channels);
62 debugf4("\tcsrow->mci = %p\n\n", csrow->mci);
63}
64
Adrian Bunk2da1c112007-07-19 01:49:32 -070065static void edac_mc_dump_mci(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -080066{
67 debugf3("\tmci = %p\n", mci);
68 debugf3("\tmci->mtype_cap = %lx\n", mci->mtype_cap);
69 debugf3("\tmci->edac_ctl_cap = %lx\n", mci->edac_ctl_cap);
70 debugf3("\tmci->edac_cap = %lx\n", mci->edac_cap);
71 debugf4("\tmci->edac_check = %p\n", mci->edac_check);
72 debugf3("\tmci->nr_csrows = %d, csrows = %p\n",
73 mci->nr_csrows, mci->csrows);
Doug Thompson37f04582006-06-30 01:56:07 -070074 debugf3("\tdev = %p\n", mci->dev);
Douglas Thompson079708b2007-07-19 01:49:58 -070075 debugf3("\tmod_name:ctl_name = %s:%s\n", mci->mod_name, mci->ctl_name);
Alan Coxda9bb1d2006-01-18 17:44:13 -080076 debugf3("\tpvt_info = %p\n\n", mci->pvt_info);
77}
78
/*
 * Human-readable names for memory types.
 *
 * The entries must stay in the same order as enum mem_type; keep the two
 * in sync when adding a new type.
 */
const char *edac_mem_types[] = {
	"Empty csrow",
	"Reserved csrow type",
	"Unknown csrow type",
	"Fast page mode RAM",
	"Extended data out RAM",
	"Burst Extended data out RAM",
	"Single data rate SDRAM",
	"Registered single data rate SDRAM",
	"Double data rate SDRAM",
	"Registered Double data rate SDRAM",
	"Rambus DRAM",
	"Unbuffered DDR2 RAM",
	"Fully buffered DDR2",
	"Registered DDR2 RAM",
	"Rambus XDR",
	"Unbuffered DDR3 RAM",
	"Registered DDR3 RAM",
};
EXPORT_SYMBOL_GPL(edac_mem_types);
102
Douglas Thompson079708b2007-07-19 01:49:58 -0700103#endif /* CONFIG_EDAC_DEBUG */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800104
/* 'ptr' points to a possibly unaligned item X such that sizeof(X) is 'size'.
 * Adjust 'ptr' so that its alignment is at least as stringent as what the
 * compiler would provide for X and return the aligned result.
 *
 * The alignment is chosen from 'size' (the smallest of short/int/long/
 * long long that is not smaller than X; a one-byte X needs no alignment),
 * and 'ptr' is then rounded UP to the next multiple of that alignment.  An
 * already aligned 'ptr' is returned unchanged.
 *
 * If 'size' is a constant, the compiler will optimize the alignment
 * selection down to a constant.
 */
void *edac_align_ptr(void *ptr, unsigned size)
{
	unsigned long addr = (unsigned long)ptr;
	unsigned align, r;

	/* Here we assume that the alignment of a "long long" is the most
	 * stringent alignment that the compiler will ever provide by default.
	 * As far as I know, this is a reasonable assumption.
	 */
	if (size > sizeof(long))
		align = sizeof(long long);
	else if (size > sizeof(int))
		align = sizeof(long);
	else if (size > sizeof(short))
		align = sizeof(int);
	else if (size > sizeof(char))
		align = sizeof(short);
	else
		return ptr;

	/* The misalignment is a property of the address, not of the item
	 * size: taking the remainder of 'size' would leave a misaligned
	 * 'ptr' untouched whenever 'size' is a multiple of 'align'.
	 */
	r = addr % align;
	if (r == 0)
		return ptr;

	return (void *)(addr + align - r);
}
138
Alan Coxda9bb1d2006-01-18 17:44:13 -0800139/**
140 * edac_mc_alloc: Allocate a struct mem_ctl_info structure
141 * @size_pvt: size of private storage needed
142 * @nr_csrows: Number of CWROWS needed for this MC
143 * @nr_chans: Number of channels for the MC
144 *
145 * Everything is kmalloc'ed as one big chunk - more efficient.
146 * Only can be used if all structures have the same lifetime - otherwise
147 * you have to allocate and initialize your own structures.
148 *
149 * Use edac_mc_free() to free mc structures allocated by this function.
150 *
151 * Returns:
152 * NULL allocation failed
153 * struct mem_ctl_info pointer
154 */
155struct mem_ctl_info *edac_mc_alloc(unsigned sz_pvt, unsigned nr_csrows,
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700156 unsigned nr_chans, int edac_index)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800157{
158 struct mem_ctl_info *mci;
159 struct csrow_info *csi, *csrow;
160 struct channel_info *chi, *chp, *chan;
161 void *pvt;
162 unsigned size;
163 int row, chn;
Doug Thompson8096cfa2007-07-19 01:50:27 -0700164 int err;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800165
166 /* Figure out the offsets of the various items from the start of an mc
167 * structure. We want the alignment of each item to be at least as
168 * stringent as what the compiler would provide if we could simply
169 * hardcode everything into a single struct.
170 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700171 mci = (struct mem_ctl_info *)0;
Douglas Thompson7391c6d2007-07-19 01:50:21 -0700172 csi = edac_align_ptr(&mci[1], sizeof(*csi));
173 chi = edac_align_ptr(&csi[nr_csrows], sizeof(*chi));
Douglas Thompsone27e3da2007-07-19 01:49:36 -0700174 pvt = edac_align_ptr(&chi[nr_chans * nr_csrows], sz_pvt);
Douglas Thompson079708b2007-07-19 01:49:58 -0700175 size = ((unsigned long)pvt) + sz_pvt;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800176
Doug Thompson8096cfa2007-07-19 01:50:27 -0700177 mci = kzalloc(size, GFP_KERNEL);
178 if (mci == NULL)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800179 return NULL;
180
181 /* Adjust pointers so they point within the memory we just allocated
182 * rather than an imaginary chunk of memory located at address 0.
183 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700184 csi = (struct csrow_info *)(((char *)mci) + ((unsigned long)csi));
185 chi = (struct channel_info *)(((char *)mci) + ((unsigned long)chi));
186 pvt = sz_pvt ? (((char *)mci) + ((unsigned long)pvt)) : NULL;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800187
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700188 /* setup index and various internal pointers */
189 mci->mc_idx = edac_index;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800190 mci->csrows = csi;
191 mci->pvt_info = pvt;
192 mci->nr_csrows = nr_csrows;
193
194 for (row = 0; row < nr_csrows; row++) {
195 csrow = &csi[row];
196 csrow->csrow_idx = row;
197 csrow->mci = mci;
198 csrow->nr_channels = nr_chans;
199 chp = &chi[row * nr_chans];
200 csrow->channels = chp;
201
202 for (chn = 0; chn < nr_chans; chn++) {
203 chan = &chp[chn];
204 chan->chan_idx = chn;
205 chan->csrow = csrow;
206 }
207 }
208
Dave Jiang81d87cb2007-07-19 01:49:52 -0700209 mci->op_state = OP_ALLOC;
210
Doug Thompson8096cfa2007-07-19 01:50:27 -0700211 /*
212 * Initialize the 'root' kobj for the edac_mc controller
213 */
214 err = edac_mc_register_sysfs_main_kobj(mci);
215 if (err) {
216 kfree(mci);
217 return NULL;
218 }
219
220 /* at this point, the root kobj is valid, and in order to
221 * 'free' the object, then the function:
222 * edac_mc_unregister_sysfs_main_kobj() must be called
223 * which will perform kobj unregistration and the actual free
224 * will occur during the kobject callback operation
225 */
Alan Coxda9bb1d2006-01-18 17:44:13 -0800226 return mci;
227}
Dave Peterson91105402006-03-26 01:38:55 -0800228EXPORT_SYMBOL_GPL(edac_mc_alloc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800229
/**
 * edac_mc_free: 'Free' a previously allocated 'mci' structure
 * @mci: pointer to a struct mem_ctl_info structure
 *
 * Nothing is freed here directly: the structure is handed to
 * edac_mc_unregister_sysfs_main_kobj(), which unregisters the main kobject.
 */
void edac_mc_free(struct mem_ctl_info *mci)
{
	edac_mc_unregister_sysfs_main_kobj(mci);
}
EXPORT_SYMBOL_GPL(edac_mc_free);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800240
Doug Thompsonbce19682007-07-26 10:41:14 -0700241
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300242/**
Doug Thompsonbce19682007-07-26 10:41:14 -0700243 * find_mci_by_dev
244 *
245 * scan list of controllers looking for the one that manages
246 * the 'dev' device
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300247 * @dev: pointer to a struct device related with the MCI
Doug Thompsonbce19682007-07-26 10:41:14 -0700248 */
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300249struct mem_ctl_info *find_mci_by_dev(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800250{
251 struct mem_ctl_info *mci;
252 struct list_head *item;
253
Dave Peterson537fba22006-03-26 01:38:40 -0800254 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800255
256 list_for_each(item, &mc_devices) {
257 mci = list_entry(item, struct mem_ctl_info, link);
258
Doug Thompson37f04582006-06-30 01:56:07 -0700259 if (mci->dev == dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800260 return mci;
261 }
262
263 return NULL;
264}
Mauro Carvalho Chehab939747bd2010-08-10 11:22:01 -0300265EXPORT_SYMBOL_GPL(find_mci_by_dev);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800266
Dave Jiang81d87cb2007-07-19 01:49:52 -0700267/*
268 * handler for EDAC to check if NMI type handler has asserted interrupt
269 */
270static int edac_mc_assert_error_check_and_clear(void)
271{
Dave Jiang66ee2f92007-07-19 01:49:54 -0700272 int old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700273
Douglas Thompson079708b2007-07-19 01:49:58 -0700274 if (edac_op_state == EDAC_OPSTATE_POLL)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700275 return 1;
276
Dave Jiang66ee2f92007-07-19 01:49:54 -0700277 old_state = edac_err_assert;
278 edac_err_assert = 0;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700279
Dave Jiang66ee2f92007-07-19 01:49:54 -0700280 return old_state;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700281}
282
283/*
284 * edac_mc_workq_function
285 * performs the operation scheduled by a workq request
286 */
Dave Jiang81d87cb2007-07-19 01:49:52 -0700287static void edac_mc_workq_function(struct work_struct *work_req)
288{
Jean Delvarefbeb4382009-04-13 14:40:21 -0700289 struct delayed_work *d_work = to_delayed_work(work_req);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700290 struct mem_ctl_info *mci = to_edac_mem_ctl_work(d_work);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700291
292 mutex_lock(&mem_ctls_mutex);
293
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700294 /* if this control struct has movd to offline state, we are done */
295 if (mci->op_state == OP_OFFLINE) {
296 mutex_unlock(&mem_ctls_mutex);
297 return;
298 }
299
Dave Jiang81d87cb2007-07-19 01:49:52 -0700300 /* Only poll controllers that are running polled and have a check */
301 if (edac_mc_assert_error_check_and_clear() && (mci->edac_check != NULL))
302 mci->edac_check(mci);
303
Dave Jiang81d87cb2007-07-19 01:49:52 -0700304 mutex_unlock(&mem_ctls_mutex);
305
306 /* Reschedule */
Dave Jiang4de78c62007-07-19 01:49:54 -0700307 queue_delayed_work(edac_workqueue, &mci->work,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700308 msecs_to_jiffies(edac_mc_get_poll_msec()));
Dave Jiang81d87cb2007-07-19 01:49:52 -0700309}
310
311/*
312 * edac_mc_workq_setup
313 * initialize a workq item for this mci
314 * passing in the new delay period in msec
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700315 *
316 * locking model:
317 *
318 * called with the mem_ctls_mutex held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700319 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700320static void edac_mc_workq_setup(struct mem_ctl_info *mci, unsigned msec)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700321{
322 debugf0("%s()\n", __func__);
323
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700324 /* if this instance is not in the POLL state, then simply return */
325 if (mci->op_state != OP_RUNNING_POLL)
326 return;
327
Dave Jiang81d87cb2007-07-19 01:49:52 -0700328 INIT_DELAYED_WORK(&mci->work, edac_mc_workq_function);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700329 queue_delayed_work(edac_workqueue, &mci->work, msecs_to_jiffies(msec));
330}
331
332/*
333 * edac_mc_workq_teardown
334 * stop the workq processing on this mci
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700335 *
336 * locking model:
337 *
338 * called WITHOUT lock held
Dave Jiang81d87cb2007-07-19 01:49:52 -0700339 */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700340static void edac_mc_workq_teardown(struct mem_ctl_info *mci)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700341{
342 int status;
343
Borislav Petkov00740c52010-09-26 12:42:23 +0200344 if (mci->op_state != OP_RUNNING_POLL)
345 return;
346
Doug Thompsonbce19682007-07-26 10:41:14 -0700347 status = cancel_delayed_work(&mci->work);
348 if (status == 0) {
349 debugf0("%s() not canceled, flush the queue\n",
350 __func__);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700351
Doug Thompsonbce19682007-07-26 10:41:14 -0700352 /* workq instance might be running, wait for it */
353 flush_workqueue(edac_workqueue);
Dave Jiang81d87cb2007-07-19 01:49:52 -0700354 }
355}
356
357/*
Doug Thompsonbce19682007-07-26 10:41:14 -0700358 * edac_mc_reset_delay_period(unsigned long value)
359 *
360 * user space has updated our poll period value, need to
361 * reset our workq delays
Dave Jiang81d87cb2007-07-19 01:49:52 -0700362 */
Doug Thompsonbce19682007-07-26 10:41:14 -0700363void edac_mc_reset_delay_period(int value)
Dave Jiang81d87cb2007-07-19 01:49:52 -0700364{
Doug Thompsonbce19682007-07-26 10:41:14 -0700365 struct mem_ctl_info *mci;
366 struct list_head *item;
Dave Jiang81d87cb2007-07-19 01:49:52 -0700367
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700368 mutex_lock(&mem_ctls_mutex);
369
Doug Thompsonbce19682007-07-26 10:41:14 -0700370 /* scan the list and turn off all workq timers, doing so under lock
371 */
372 list_for_each(item, &mc_devices) {
373 mci = list_entry(item, struct mem_ctl_info, link);
374
375 if (mci->op_state == OP_RUNNING_POLL)
376 cancel_delayed_work(&mci->work);
377 }
378
379 mutex_unlock(&mem_ctls_mutex);
380
381
382 /* re-walk the list, and reset the poll delay */
383 mutex_lock(&mem_ctls_mutex);
384
385 list_for_each(item, &mc_devices) {
386 mci = list_entry(item, struct mem_ctl_info, link);
387
388 edac_mc_workq_setup(mci, (unsigned long) value);
389 }
Dave Jiang81d87cb2007-07-19 01:49:52 -0700390
391 mutex_unlock(&mem_ctls_mutex);
392}
393
Doug Thompsonbce19682007-07-26 10:41:14 -0700394
395
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700396/* Return 0 on success, 1 on failure.
397 * Before calling this function, caller must
398 * assign a unique value to mci->mc_idx.
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700399 *
400 * locking model:
401 *
402 * called with the mem_ctls_mutex lock held
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700403 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700404static int add_mc_to_global_list(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800405{
406 struct list_head *item, *insert_before;
407 struct mem_ctl_info *p;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800408
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700409 insert_before = &mc_devices;
410
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700411 p = find_mci_by_dev(mci->dev);
412 if (unlikely(p != NULL))
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700413 goto fail0;
414
415 list_for_each(item, &mc_devices) {
416 p = list_entry(item, struct mem_ctl_info, link);
417
418 if (p->mc_idx >= mci->mc_idx) {
419 if (unlikely(p->mc_idx == mci->mc_idx))
420 goto fail1;
421
422 insert_before = item;
423 break;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800424 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800425 }
426
427 list_add_tail_rcu(&mci->link, insert_before);
Dave Jiangc0d12172007-07-19 01:49:46 -0700428 atomic_inc(&edac_handlers);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800429 return 0;
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700430
Douglas Thompson052dfb42007-07-19 01:50:13 -0700431fail0:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700432 edac_printk(KERN_WARNING, EDAC_MC,
Kay Sievers281efb12009-01-06 14:42:57 -0800433 "%s (%s) %s %s already assigned %d\n", dev_name(p->dev),
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000434 edac_dev_name(mci), p->mod_name, p->ctl_name, p->mc_idx);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700435 return 1;
436
Douglas Thompson052dfb42007-07-19 01:50:13 -0700437fail1:
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700438 edac_printk(KERN_WARNING, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700439 "bug in low-level driver: attempt to assign\n"
440 " duplicate mc_idx %d in %s()\n", p->mc_idx, __func__);
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700441 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800442}
443
Dave Petersone7ecd892006-03-26 01:38:52 -0800444static void complete_mc_list_del(struct rcu_head *head)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800445{
446 struct mem_ctl_info *mci;
447
448 mci = container_of(head, struct mem_ctl_info, rcu);
449 INIT_LIST_HEAD(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800450}
451
Dave Petersone7ecd892006-03-26 01:38:52 -0800452static void del_mc_from_global_list(struct mem_ctl_info *mci)
Dave Petersona1d03fc2006-03-26 01:38:46 -0800453{
Dave Jiangc0d12172007-07-19 01:49:46 -0700454 atomic_dec(&edac_handlers);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800455 list_del_rcu(&mci->link);
Dave Petersona1d03fc2006-03-26 01:38:46 -0800456 call_rcu(&mci->rcu, complete_mc_list_del);
Jesper Dangaard Brouer458e5ff2009-09-23 15:57:29 -0700457 rcu_barrier();
Dave Petersona1d03fc2006-03-26 01:38:46 -0800458}
459
Alan Coxda9bb1d2006-01-18 17:44:13 -0800460/**
Douglas Thompson5da08312007-07-19 01:49:31 -0700461 * edac_mc_find: Search for a mem_ctl_info structure whose index is 'idx'.
462 *
463 * If found, return a pointer to the structure.
464 * Else return NULL.
465 *
466 * Caller must hold mem_ctls_mutex.
467 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700468struct mem_ctl_info *edac_mc_find(int idx)
Douglas Thompson5da08312007-07-19 01:49:31 -0700469{
470 struct list_head *item;
471 struct mem_ctl_info *mci;
472
473 list_for_each(item, &mc_devices) {
474 mci = list_entry(item, struct mem_ctl_info, link);
475
476 if (mci->mc_idx >= idx) {
477 if (mci->mc_idx == idx)
478 return mci;
479
480 break;
481 }
482 }
483
484 return NULL;
485}
486EXPORT_SYMBOL(edac_mc_find);
487
488/**
Dave Peterson472678e2006-03-26 01:38:49 -0800489 * edac_mc_add_mc: Insert the 'mci' structure into the mci global list and
490 * create sysfs entries associated with mci structure
Alan Coxda9bb1d2006-01-18 17:44:13 -0800491 * @mci: pointer to the mci structure to be added to the list
Doug Thompson2d7bbb92006-06-30 01:56:08 -0700492 * @mc_idx: A unique numeric identifier to be assigned to the 'mci' structure.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800493 *
494 * Return:
495 * 0 Success
496 * !0 Failure
497 */
498
499/* FIXME - should a warning be printed if no error detection? correction? */
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700500int edac_mc_add_mc(struct mem_ctl_info *mci)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800501{
Dave Peterson537fba22006-03-26 01:38:40 -0800502 debugf0("%s()\n", __func__);
Doug Thompsonb8f6f972007-07-19 01:50:26 -0700503
Alan Coxda9bb1d2006-01-18 17:44:13 -0800504#ifdef CONFIG_EDAC_DEBUG
505 if (edac_debug_level >= 3)
506 edac_mc_dump_mci(mci);
Dave Petersone7ecd892006-03-26 01:38:52 -0800507
Alan Coxda9bb1d2006-01-18 17:44:13 -0800508 if (edac_debug_level >= 4) {
509 int i;
510
511 for (i = 0; i < mci->nr_csrows; i++) {
512 int j;
Dave Petersone7ecd892006-03-26 01:38:52 -0800513
Alan Coxda9bb1d2006-01-18 17:44:13 -0800514 edac_mc_dump_csrow(&mci->csrows[i]);
515 for (j = 0; j < mci->csrows[i].nr_channels; j++)
Douglas Thompson079708b2007-07-19 01:49:58 -0700516 edac_mc_dump_channel(&mci->csrows[i].
Douglas Thompson052dfb42007-07-19 01:50:13 -0700517 channels[j]);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800518 }
519 }
520#endif
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700521 mutex_lock(&mem_ctls_mutex);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800522
523 if (add_mc_to_global_list(mci))
Dave Peterson028a7b62006-03-26 01:38:47 -0800524 goto fail0;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800525
526 /* set load time so that error rate can be tracked */
527 mci->start_time = jiffies;
528
eric wollesen9794f332007-02-12 00:53:08 -0800529 if (edac_create_sysfs_mci_device(mci)) {
530 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700531 "failed to create sysfs device\n");
eric wollesen9794f332007-02-12 00:53:08 -0800532 goto fail1;
533 }
Alan Coxda9bb1d2006-01-18 17:44:13 -0800534
Dave Jiang81d87cb2007-07-19 01:49:52 -0700535 /* If there IS a check routine, then we are running POLLED */
536 if (mci->edac_check != NULL) {
537 /* This instance is NOW RUNNING */
538 mci->op_state = OP_RUNNING_POLL;
539
540 edac_mc_workq_setup(mci, edac_mc_get_poll_msec());
541 } else {
542 mci->op_state = OP_RUNNING_INTERRUPT;
543 }
544
Alan Coxda9bb1d2006-01-18 17:44:13 -0800545 /* Report action taken */
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700546 edac_mc_printk(mci, KERN_INFO, "Giving out device to '%s' '%s':"
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000547 " DEV %s\n", mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Alan Coxda9bb1d2006-01-18 17:44:13 -0800548
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700549 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800550 return 0;
551
Douglas Thompson052dfb42007-07-19 01:50:13 -0700552fail1:
Dave Peterson028a7b62006-03-26 01:38:47 -0800553 del_mc_from_global_list(mci);
554
Douglas Thompson052dfb42007-07-19 01:50:13 -0700555fail0:
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700556 mutex_unlock(&mem_ctls_mutex);
Dave Peterson028a7b62006-03-26 01:38:47 -0800557 return 1;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800558}
Dave Peterson91105402006-03-26 01:38:55 -0800559EXPORT_SYMBOL_GPL(edac_mc_add_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800560
Alan Coxda9bb1d2006-01-18 17:44:13 -0800561/**
Dave Peterson472678e2006-03-26 01:38:49 -0800562 * edac_mc_del_mc: Remove sysfs entries for specified mci structure and
563 * remove mci structure from global list
Doug Thompson37f04582006-06-30 01:56:07 -0700564 * @pdev: Pointer to 'struct device' representing mci structure to remove.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800565 *
Dave Peterson18dbc332006-03-26 01:38:50 -0800566 * Return pointer to removed mci structure, or NULL if device not found.
Alan Coxda9bb1d2006-01-18 17:44:13 -0800567 */
Douglas Thompson079708b2007-07-19 01:49:58 -0700568struct mem_ctl_info *edac_mc_del_mc(struct device *dev)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800569{
Dave Peterson18dbc332006-03-26 01:38:50 -0800570 struct mem_ctl_info *mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800571
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700572 debugf0("%s()\n", __func__);
573
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700574 mutex_lock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800575
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700576 /* find the requested mci struct in the global list */
577 mci = find_mci_by_dev(dev);
578 if (mci == NULL) {
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700579 mutex_unlock(&mem_ctls_mutex);
Dave Peterson18dbc332006-03-26 01:38:50 -0800580 return NULL;
581 }
582
Dave Jiang81d87cb2007-07-19 01:49:52 -0700583 /* marking MCI offline */
584 mci->op_state = OP_OFFLINE;
585
Alan Coxda9bb1d2006-01-18 17:44:13 -0800586 del_mc_from_global_list(mci);
Matthias Kaehlcke63b7df92007-07-19 01:49:38 -0700587 mutex_unlock(&mem_ctls_mutex);
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700588
589 /* flush workq processes and remove sysfs */
590 edac_mc_workq_teardown(mci);
591 edac_remove_sysfs_mci_device(mci);
592
Dave Peterson537fba22006-03-26 01:38:40 -0800593 edac_printk(KERN_INFO, EDAC_MC,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700594 "Removed device %d for %s %s: DEV %s\n", mci->mc_idx,
Stephen Rothwell17aa7e02008-05-05 13:54:19 +1000595 mci->mod_name, mci->ctl_name, edac_dev_name(mci));
Doug Thompsonbf52fa42007-07-19 01:50:30 -0700596
Dave Peterson18dbc332006-03-26 01:38:50 -0800597 return mci;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800598}
Dave Peterson91105402006-03-26 01:38:55 -0800599EXPORT_SYMBOL_GPL(edac_mc_del_mc);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800600
Adrian Bunk2da1c112007-07-19 01:49:32 -0700601static void edac_mc_scrub_block(unsigned long page, unsigned long offset,
602 u32 size)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800603{
604 struct page *pg;
605 void *virt_addr;
606 unsigned long flags = 0;
607
Dave Peterson537fba22006-03-26 01:38:40 -0800608 debugf3("%s()\n", __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800609
610 /* ECC error page was not in our memory. Ignore it. */
Douglas Thompson079708b2007-07-19 01:49:58 -0700611 if (!pfn_valid(page))
Alan Coxda9bb1d2006-01-18 17:44:13 -0800612 return;
613
614 /* Find the actual page structure then map it and fix */
615 pg = pfn_to_page(page);
616
617 if (PageHighMem(pg))
618 local_irq_save(flags);
619
620 virt_addr = kmap_atomic(pg, KM_BOUNCE_READ);
621
622 /* Perform architecture specific atomic scrub operation */
623 atomic_scrub(virt_addr + offset, size);
624
625 /* Unmap and complete */
626 kunmap_atomic(virt_addr, KM_BOUNCE_READ);
627
628 if (PageHighMem(pg))
629 local_irq_restore(flags);
630}
631
Alan Coxda9bb1d2006-01-18 17:44:13 -0800632/* FIXME - should return -1 */
Dave Petersone7ecd892006-03-26 01:38:52 -0800633int edac_mc_find_csrow_by_page(struct mem_ctl_info *mci, unsigned long page)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800634{
635 struct csrow_info *csrows = mci->csrows;
636 int row, i;
637
Dave Peterson537fba22006-03-26 01:38:40 -0800638 debugf1("MC%d: %s(): 0x%lx\n", mci->mc_idx, __func__, page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800639 row = -1;
640
641 for (i = 0; i < mci->nr_csrows; i++) {
642 struct csrow_info *csrow = &csrows[i];
643
644 if (csrow->nr_pages == 0)
645 continue;
646
Dave Peterson537fba22006-03-26 01:38:40 -0800647 debugf3("MC%d: %s(): first(0x%lx) page(0x%lx) last(0x%lx) "
648 "mask(0x%lx)\n", mci->mc_idx, __func__,
649 csrow->first_page, page, csrow->last_page,
650 csrow->page_mask);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800651
652 if ((page >= csrow->first_page) &&
653 (page <= csrow->last_page) &&
654 ((page & csrow->page_mask) ==
655 (csrow->first_page & csrow->page_mask))) {
656 row = i;
657 break;
658 }
659 }
660
661 if (row == -1)
Dave Peterson537fba22006-03-26 01:38:40 -0800662 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700663 "could not look up page error address %lx\n",
664 (unsigned long)page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800665
666 return row;
667}
Dave Peterson91105402006-03-26 01:38:55 -0800668EXPORT_SYMBOL_GPL(edac_mc_find_csrow_by_page);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800669
Alan Coxda9bb1d2006-01-18 17:44:13 -0800670/* FIXME - setable log (warning/emerg) levels */
671/* FIXME - integrate with evlog: http://evlog.sourceforge.net/ */
672void edac_mc_handle_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700673 unsigned long page_frame_number,
674 unsigned long offset_in_page, unsigned long syndrome,
675 int row, int channel, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800676{
677 unsigned long remapped_page;
678
Dave Peterson537fba22006-03-26 01:38:40 -0800679 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800680
681 /* FIXME - maybe make panic on INTERNAL ERROR an option */
682 if (row >= mci->nr_csrows || row < 0) {
683 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800684 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700685 "INTERNAL ERROR: row out of range "
686 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800687 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
688 return;
689 }
Dave Petersone7ecd892006-03-26 01:38:52 -0800690
Alan Coxda9bb1d2006-01-18 17:44:13 -0800691 if (channel >= mci->csrows[row].nr_channels || channel < 0) {
692 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800693 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700694 "INTERNAL ERROR: channel out of range "
695 "(%d >= %d)\n", channel,
696 mci->csrows[row].nr_channels);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800697 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
698 return;
699 }
700
Dave Jiang4de78c62007-07-19 01:49:54 -0700701 if (edac_mc_get_log_ce())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800702 /* FIXME - put in DIMM location */
Dave Peterson537fba22006-03-26 01:38:40 -0800703 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700704 "CE page 0x%lx, offset 0x%lx, grain %d, syndrome "
705 "0x%lx, row %d, channel %d, label \"%s\": %s\n",
706 page_frame_number, offset_in_page,
707 mci->csrows[row].grain, syndrome, row, channel,
708 mci->csrows[row].channels[channel].label, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800709
710 mci->ce_count++;
711 mci->csrows[row].ce_count++;
712 mci->csrows[row].channels[channel].ce_count++;
713
714 if (mci->scrub_mode & SCRUB_SW_SRC) {
715 /*
716 * Some MC's can remap memory so that it is still available
717 * at a different address when PCI devices map into memory.
718 * MC's that can't do this lose the memory where PCI devices
719 * are mapped. This mapping is MC dependant and so we call
720 * back into the MC driver for it to map the MC page to
721 * a physical (CPU) page which can then be mapped to a virtual
722 * page - which can then be scrubbed.
723 */
724 remapped_page = mci->ctl_page_to_phys ?
Douglas Thompson052dfb42007-07-19 01:50:13 -0700725 mci->ctl_page_to_phys(mci, page_frame_number) :
726 page_frame_number;
Alan Coxda9bb1d2006-01-18 17:44:13 -0800727
728 edac_mc_scrub_block(remapped_page, offset_in_page,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700729 mci->csrows[row].grain);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800730 }
731}
Dave Peterson91105402006-03-26 01:38:55 -0800732EXPORT_SYMBOL_GPL(edac_mc_handle_ce);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800733
Dave Petersone7ecd892006-03-26 01:38:52 -0800734void edac_mc_handle_ce_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800735{
Dave Jiang4de78c62007-07-19 01:49:54 -0700736 if (edac_mc_get_log_ce())
Dave Peterson537fba22006-03-26 01:38:40 -0800737 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700738 "CE - no information available: %s\n", msg);
Dave Petersone7ecd892006-03-26 01:38:52 -0800739
Alan Coxda9bb1d2006-01-18 17:44:13 -0800740 mci->ce_noinfo_count++;
741 mci->ce_count++;
742}
Dave Peterson91105402006-03-26 01:38:55 -0800743EXPORT_SYMBOL_GPL(edac_mc_handle_ce_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800744
Alan Coxda9bb1d2006-01-18 17:44:13 -0800745void edac_mc_handle_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700746 unsigned long page_frame_number,
747 unsigned long offset_in_page, int row, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800748{
749 int len = EDAC_MC_LABEL_LEN * 4;
750 char labels[len + 1];
751 char *pos = labels;
752 int chan;
753 int chars;
754
Dave Peterson537fba22006-03-26 01:38:40 -0800755 debugf3("MC%d: %s()\n", mci->mc_idx, __func__);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800756
757 /* FIXME - maybe make panic on INTERNAL ERROR an option */
758 if (row >= mci->nr_csrows || row < 0) {
759 /* something is wrong */
Dave Peterson537fba22006-03-26 01:38:40 -0800760 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700761 "INTERNAL ERROR: row out of range "
762 "(%d >= %d)\n", row, mci->nr_csrows);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800763 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
764 return;
765 }
766
767 chars = snprintf(pos, len + 1, "%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700768 mci->csrows[row].channels[0].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800769 len -= chars;
770 pos += chars;
Dave Petersone7ecd892006-03-26 01:38:52 -0800771
Alan Coxda9bb1d2006-01-18 17:44:13 -0800772 for (chan = 1; (chan < mci->csrows[row].nr_channels) && (len > 0);
Douglas Thompson052dfb42007-07-19 01:50:13 -0700773 chan++) {
Alan Coxda9bb1d2006-01-18 17:44:13 -0800774 chars = snprintf(pos, len + 1, ":%s",
Douglas Thompson079708b2007-07-19 01:49:58 -0700775 mci->csrows[row].channels[chan].label);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800776 len -= chars;
777 pos += chars;
778 }
779
Dave Jiang4de78c62007-07-19 01:49:54 -0700780 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800781 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700782 "UE page 0x%lx, offset 0x%lx, grain %d, row %d, "
783 "labels \"%s\": %s\n", page_frame_number,
784 offset_in_page, mci->csrows[row].grain, row,
785 labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800786
Dave Jiang4de78c62007-07-19 01:49:54 -0700787 if (edac_mc_get_panic_on_ue())
Dave Petersone7ecd892006-03-26 01:38:52 -0800788 panic("EDAC MC%d: UE page 0x%lx, offset 0x%lx, grain %d, "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700789 "row %d, labels \"%s\": %s\n", mci->mc_idx,
790 page_frame_number, offset_in_page,
791 mci->csrows[row].grain, row, labels, msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800792
793 mci->ue_count++;
794 mci->csrows[row].ue_count++;
795}
Dave Peterson91105402006-03-26 01:38:55 -0800796EXPORT_SYMBOL_GPL(edac_mc_handle_ue);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800797
Dave Petersone7ecd892006-03-26 01:38:52 -0800798void edac_mc_handle_ue_no_info(struct mem_ctl_info *mci, const char *msg)
Alan Coxda9bb1d2006-01-18 17:44:13 -0800799{
Dave Jiang4de78c62007-07-19 01:49:54 -0700800 if (edac_mc_get_panic_on_ue())
Alan Coxda9bb1d2006-01-18 17:44:13 -0800801 panic("EDAC MC%d: Uncorrected Error", mci->mc_idx);
802
Dave Jiang4de78c62007-07-19 01:49:54 -0700803 if (edac_mc_get_log_ue())
Dave Peterson537fba22006-03-26 01:38:40 -0800804 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700805 "UE - no information available: %s\n", msg);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800806 mci->ue_noinfo_count++;
807 mci->ue_count++;
808}
Douglas Thompson079708b2007-07-19 01:49:58 -0700809EXPORT_SYMBOL_GPL(edac_mc_handle_ue_no_info);
Alan Coxda9bb1d2006-01-18 17:44:13 -0800810
eric wollesen9794f332007-02-12 00:53:08 -0800811/*************************************************************
812 * On Fully Buffered DIMM modules, this help function is
813 * called to process UE events
814 */
815void edac_mc_handle_fbd_ue(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700816 unsigned int csrow,
817 unsigned int channela,
818 unsigned int channelb, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800819{
820 int len = EDAC_MC_LABEL_LEN * 4;
821 char labels[len + 1];
822 char *pos = labels;
823 int chars;
824
825 if (csrow >= mci->nr_csrows) {
826 /* something is wrong */
827 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700828 "INTERNAL ERROR: row out of range (%d >= %d)\n",
829 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800830 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
831 return;
832 }
833
834 if (channela >= mci->csrows[csrow].nr_channels) {
835 /* something is wrong */
836 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700837 "INTERNAL ERROR: channel-a out of range "
838 "(%d >= %d)\n",
839 channela, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800840 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
841 return;
842 }
843
844 if (channelb >= mci->csrows[csrow].nr_channels) {
845 /* something is wrong */
846 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700847 "INTERNAL ERROR: channel-b out of range "
848 "(%d >= %d)\n",
849 channelb, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800850 edac_mc_handle_ue_no_info(mci, "INTERNAL ERROR");
851 return;
852 }
853
854 mci->ue_count++;
855 mci->csrows[csrow].ue_count++;
856
857 /* Generate the DIMM labels from the specified channels */
858 chars = snprintf(pos, len + 1, "%s",
859 mci->csrows[csrow].channels[channela].label);
Douglas Thompson079708b2007-07-19 01:49:58 -0700860 len -= chars;
861 pos += chars;
eric wollesen9794f332007-02-12 00:53:08 -0800862 chars = snprintf(pos, len + 1, "-%s",
863 mci->csrows[csrow].channels[channelb].label);
864
Dave Jiang4de78c62007-07-19 01:49:54 -0700865 if (edac_mc_get_log_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800866 edac_mc_printk(mci, KERN_EMERG,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700867 "UE row %d, channel-a= %d channel-b= %d "
868 "labels \"%s\": %s\n", csrow, channela, channelb,
869 labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800870
Dave Jiang4de78c62007-07-19 01:49:54 -0700871 if (edac_mc_get_panic_on_ue())
eric wollesen9794f332007-02-12 00:53:08 -0800872 panic("UE row %d, channel-a= %d channel-b= %d "
Douglas Thompson052dfb42007-07-19 01:50:13 -0700873 "labels \"%s\": %s\n", csrow, channela,
874 channelb, labels, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800875}
876EXPORT_SYMBOL(edac_mc_handle_fbd_ue);
877
878/*************************************************************
879 * On Fully Buffered DIMM modules, this help function is
880 * called to process CE events
881 */
882void edac_mc_handle_fbd_ce(struct mem_ctl_info *mci,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700883 unsigned int csrow, unsigned int channel, char *msg)
eric wollesen9794f332007-02-12 00:53:08 -0800884{
885
886 /* Ensure boundary values */
887 if (csrow >= mci->nr_csrows) {
888 /* something is wrong */
889 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700890 "INTERNAL ERROR: row out of range (%d >= %d)\n",
891 csrow, mci->nr_csrows);
eric wollesen9794f332007-02-12 00:53:08 -0800892 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
893 return;
894 }
895 if (channel >= mci->csrows[csrow].nr_channels) {
896 /* something is wrong */
897 edac_mc_printk(mci, KERN_ERR,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700898 "INTERNAL ERROR: channel out of range (%d >= %d)\n",
899 channel, mci->csrows[csrow].nr_channels);
eric wollesen9794f332007-02-12 00:53:08 -0800900 edac_mc_handle_ce_no_info(mci, "INTERNAL ERROR");
901 return;
902 }
903
Dave Jiang4de78c62007-07-19 01:49:54 -0700904 if (edac_mc_get_log_ce())
eric wollesen9794f332007-02-12 00:53:08 -0800905 /* FIXME - put in DIMM location */
906 edac_mc_printk(mci, KERN_WARNING,
Douglas Thompson052dfb42007-07-19 01:50:13 -0700907 "CE row %d, channel %d, label \"%s\": %s\n",
908 csrow, channel,
909 mci->csrows[csrow].channels[channel].label, msg);
eric wollesen9794f332007-02-12 00:53:08 -0800910
911 mci->ce_count++;
912 mci->csrows[csrow].ce_count++;
913 mci->csrows[csrow].channels[channel].ce_count++;
914}
Douglas Thompson079708b2007-07-19 01:49:58 -0700915EXPORT_SYMBOL(edac_mc_handle_fbd_ce);