blob: a2a9ad499b6b228b5766a50539a316002b3b57ed [file] [log] [blame]
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001/*
2 * Intel 7300 class Memory Controllers kernel module (Clarksboro)
3 *
4 * This file may be distributed under the terms of the
5 * GNU General Public License version 2 only.
6 *
7 * Copyright (c) 2010 by:
8 * Mauro Carvalho Chehab <mchehab@redhat.com>
9 *
10 * Red Hat Inc. http://www.redhat.com
11 *
12 * Intel 7300 Chipset Memory Controller Hub (MCH) - Datasheet
13 * http://www.intel.com/Assets/PDF/datasheet/318082.pdf
14 *
15 * TODO: The chipset allows checking for PCI Express errors also. Currently,
16 * the driver covers only memory errors
17 *
18 * This driver uses "csrows" EDAC attribute to represent DIMM slot#
19 */
20
21#include <linux/module.h>
22#include <linux/init.h>
23#include <linux/pci.h>
24#include <linux/pci_ids.h>
25#include <linux/slab.h>
26#include <linux/edac.h>
27#include <linux/mmzone.h>
28
29#include "edac_core.h"
30
/*
 * Driver revision string; bump it whenever the I7300 module is modified.
 */
#define I7300_REVISION " Ver: 1.0.0 " __DATE__

/* Module name string */
#define EDAC_MOD_STR "i7300_edac"

/* Driver-wide message, forwarded to edac_printk() with the "i7300" tag */
#define i7300_printk(level, fmt, ...) \
	edac_printk(level, "i7300", fmt, ##__VA_ARGS__)

/*
 * Message bound to one memory controller (@mci), forwarded to
 * edac_mc_chipset_printk() with the "i7300" tag
 */
#define i7300_mc_printk(mci, level, fmt, ...) \
	edac_mc_chipset_printk(mci, level, "i7300", fmt, ##__VA_ARGS__)
43
Mauro Carvalho Chehabb4552ac2010-08-27 16:43:01 -030044/***********************************************
45 * i7300 Limit constants Structs and static vars
46 ***********************************************/
47
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -030048/*
49 * Memory topology is organized as:
50 * Branch 0 - 2 channels: channels 0 and 1 (FDB0 PCI dev 21.0)
51 * Branch 1 - 2 channels: channels 2 and 3 (FDB1 PCI dev 22.0)
52 * Each channel can have up to 8 DIMM sets (called as SLOTS)
53 * Slots should generally be filled in pairs
54 * Except on Single Channel mode of operation
55 * just slot 0/channel0 filled on this mode
56 * On normal operation mode, the two channels on a branch should be
Mauro Carvalho Chehabc3af2ea2010-08-26 19:54:51 -030057 * filled together for the same SLOT#
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -030058 * When in mirrored mode, Branch 1 replicate memory at Branch 0, so, the four
59 * channels on both branches should be filled
60 */
61
/* Architectural maximums of the i7300 memory topology */
#define MAX_SLOTS		8
#define MAX_BRANCHES		2
#define MAX_CH_PER_BRANCH	2
#define MAX_CHANNELS		(MAX_BRANCHES * MAX_CH_PER_BRANCH)
#define MAX_MIR			3

/* Global channel number: @branch lands in bit 1, @ch in bit 0 */
#define to_channel(ch, branch)	((ch) | ((branch) << 1))

/* csrow index: @slot in bits 2 and up, global channel in bits 1:0 */
#define to_csrow(slot, ch, branch) \
	(((slot) << 2) | to_channel(ch, branch))
73
Mauro Carvalho Chehabb4552ac2010-08-27 16:43:01 -030074/* Device name and register DID (Device ID) */
75struct i7300_dev_info {
76 const char *ctl_name; /* name for this device */
77 u16 fsb_mapping_errors; /* DID for the branchmap,control */
78};
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -030079
Mauro Carvalho Chehabb4552ac2010-08-27 16:43:01 -030080/* Table of devices attributes supported by this driver */
81static const struct i7300_dev_info i7300_devs[] = {
82 {
83 .ctl_name = "I7300",
84 .fsb_mapping_errors = PCI_DEVICE_ID_INTEL_I7300_MCH_ERR,
85 },
86};
87
88struct i7300_dimm_info {
89 int megabytes; /* size, 0 means not present */
90};
91
92/* driver private data structure */
93struct i7300_pvt {
94 struct pci_dev *pci_dev_16_0_fsb_ctlr; /* 16.0 */
95 struct pci_dev *pci_dev_16_1_fsb_addr_map; /* 16.1 */
96 struct pci_dev *pci_dev_16_2_fsb_err_regs; /* 16.2 */
97 struct pci_dev *pci_dev_2x_0_fbd_branch[MAX_BRANCHES]; /* 21.0 and 22.0 */
98
99 u16 tolm; /* top of low memory */
100 u64 ambase; /* AMB BAR */
101
102 u32 mc_settings; /* Report several settings */
103 u32 mc_settings_a;
104
105 u16 mir[MAX_MIR]; /* Memory Interleave Reg*/
106
107 u16 mtr[MAX_SLOTS][MAX_BRANCHES]; /* Memory Technlogy Reg */
108 u16 ambpresent[MAX_CHANNELS]; /* AMB present regs */
109
110 /* DIMM information matrix, allocating architecture maximums */
111 struct i7300_dimm_info dimm_info[MAX_SLOTS][MAX_CHANNELS];
112
113 /* Temporary buffer for use when preparing error messages */
114 char *tmp_prt_buffer;
115};
116
117/* FIXME: Why do we need to have this static? */
118static struct edac_pci_ctl_info *i7300_pci;
119
120/***************************************************
121 * i7300 Register definitions for memory enumeration
122 ***************************************************/
123
/*
 * Device 16,
 * Function 0: System Address (not documented)
 * Function 1: Memory Branch Map, Control, Errors Register
 */

	/* OFFSETS for Function 0 */
#define AMBASE			0x48 /* AMB Mem Mapped Reg Region Base */
#define MAXCH			0x56 /* Max Channel Number */
#define MAXDIMMPERCH		0x57 /* Max DIMM PER Channel Number */

	/* OFFSETS for Function 1 */
#define MC_SETTINGS		0x40
  /* Each helper yields non-zero when the tested flag bit is set in @mc */
  #define IS_MIRRORED(mc)		((mc) & (1 << 16))
  #define IS_ECC_ENABLED(mc)		((mc) & (1 << 5))
  /* 1U: shifting a signed 1 into bit 31 would be undefined behaviour */
  #define IS_RETRY_ENABLED(mc)		((mc) & (1U << 31))
  #define IS_SCRBALGO_ENHANCED(mc)	((mc) & (1 << 8))

#define MC_SETTINGS_A		0x58
  #define IS_SINGLE_MODE(mca)		((mca) & (1 << 14))

#define TOLM			0x6C

#define MIR0			0x80
#define MIR1			0x84
#define MIR2			0x88
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300150
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300151/*
152 * Note: Other Intel EDAC drivers use AMBPRESENT to identify if the available
153 * memory. From datasheet item 7.3.1 (FB-DIMM technology & organization), it
154 * seems that we cannot use this information directly for the same usage.
155 * Each memory slot may have up to 2 AMB interfaces, one for income and another
156 * for outcome interface to the next slot.
157 * For now, the driver just stores the AMB present registers, but rely only at
158 * the MTR info to detect memory.
159 * Datasheet is also not clear about how to map each AMBPRESENT registers to
160 * one of the 4 available channels.
161 */
162#define AMBPRESENT_0 0x64
163#define AMBPRESENT_1 0x66
164
165const static u16 mtr_regs [MAX_SLOTS] = {
166 0x80, 0x84, 0x88, 0x8c,
167 0x82, 0x86, 0x8a, 0x8e
168};
169
/*
 * Field extractors for the MTRx - Memory Technology Registers
 *
 * The single-bit helpers test bits 8 (present), 7 (electrical throttle),
 * 6 (width), 5 (banks) and 4 (ranks); rows live in bits 3:2 and columns
 * in bits 1:0.
 */
#define MTR_DIMMS_PRESENT(mtr)		((mtr) & 0x100)
#define MTR_DIMMS_ETHROTTLE(mtr)	((mtr) & 0x080)
#define MTR_DRAM_WIDTH(mtr)		(((mtr) & 0x040) ? 8 : 4)
#define MTR_DRAM_BANKS(mtr)		(((mtr) & 0x020) ? 8 : 4)
#define MTR_DIMM_RANKS(mtr)		(((mtr) & 0x010) ? 1 : 0)
#define MTR_DIMM_ROWS(mtr)		(((mtr) >> 2) & 0x3)
#define MTR_DRAM_BANKS_ADDR_BITS	2
#define MTR_DIMM_ROWS_ADDR_BITS(mtr)	(MTR_DIMM_ROWS(mtr) + 13)
#define MTR_DIMM_COLS(mtr)		((mtr) & 0x3)
#define MTR_DIMM_COLS_ADDR_BITS(mtr)	(MTR_DIMM_COLS(mtr) + 10)
184
#ifdef CONFIG_EDAC_DEBUG
/*
 * MTR NUMROW: printable form of the 2-bit value returned by
 * MTR_DIMM_ROWS(). Both the strings and the pointer table are read-only.
 */
static const char * const numrow_toString[] = {
	[0] = "8,192 - 13 rows",
	[1] = "16,384 - 14 rows",
	[2] = "32,768 - 15 rows",
	[3] = "65,536 - 16 rows"
};

/*
 * MTR NUMCOL: printable form of the 2-bit value returned by
 * MTR_DIMM_COLS(). Both the strings and the pointer table are read-only.
 */
static const char * const numcol_toString[] = {
	[0] = "1,024 - 10 columns",
	[1] = "2,048 - 11 columns",
	[2] = "4,096 - 12 columns",
	[3] = "reserved"
};
#endif
202
Mauro Carvalho Chehabc3af2ea2010-08-26 19:54:51 -0300203/************************************************
204 * i7300 Register definitions for error detection
205 ************************************************/
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300206
/*
 * Device 16.1: FBD Error Registers
 */
#define FERR_FAT_FBD	0x98
/* Fatal FBD error messages, indexed by the bit number of the error */
static const char *ferr_fat_fbd_name[] = {
	[22] = "Non-Redundant Fast Reset Timeout",
	[2]  = ">Tmid Thermal event with intelligent throttling disabled",
	[1]  = "Memory or FBD configuration CRC read error",
	[0]  = "Memory Write error on non-redundant retry or "
	       "FBD configuration Write error on retry",
};
/*
 * Index field held in bits 29:28 of the register value. It is shifted
 * down so callers can compare it against small integers (e.g. == 2).
 */
#define GET_FBD_FAT_IDX(fbderr)	(((fbderr) >> 28) & 3)
/* One bit per error described in ferr_fat_fbd_name[] */
#define FERR_FAT_FBD_ERR_MASK ((1 << 0) | (1 << 1) | (1 << 2) | (1 << 22))
220
#define FERR_NF_FBD	0xa0
/* Non-fatal FBD error messages, indexed by the bit number of the error */
static const char *ferr_nf_fbd_name[] = {
	[24] = "DIMM-Spare Copy Completed",
	[23] = "DIMM-Spare Copy Initiated",
	[22] = "Redundant Fast Reset Timeout",
	[21] = "Memory Write error on redundant retry",
	[18] = "SPD protocol Error",
	[17] = "FBD Northbound parity error on FBD Sync Status",
	[16] = "Correctable Patrol Data ECC",
	[15] = "Correctable Resilver- or Spare-Copy Data ECC",
	[14] = "Correctable Mirrored Demand Data ECC",
	[13] = "Correctable Non-Mirrored Demand Data ECC",
	[11] = "Memory or FBD configuration CRC read error",
	[10] = "FBD Configuration Write error on first attempt",
	[9]  = "Memory Write error on first attempt",
	[8]  = "Non-Aliased Uncorrectable Patrol Data ECC",
	[7]  = "Non-Aliased Uncorrectable Resilver- or Spare-Copy Data ECC",
	[6]  = "Non-Aliased Uncorrectable Mirrored Demand Data ECC",
	[5]  = "Non-Aliased Uncorrectable Non-Mirrored Demand Data ECC",
	[4]  = "Aliased Uncorrectable Patrol Data ECC",
	[3]  = "Aliased Uncorrectable Resilver- or Spare-Copy Data ECC",
	[2]  = "Aliased Uncorrectable Mirrored Demand Data ECC",
	[1]  = "Aliased Uncorrectable Non-Mirrored Demand Data ECC",
	[0]  = "Uncorrectable Data ECC on Replay",
};
/*
 * Index field held in bits 29:28 of the register value, shifted down so
 * the result is a small integer in the range 0-3.
 */
#define GET_FBD_NF_IDX(fbderr)	(((fbderr) >> 28) & 3)
/* One bit per error described in ferr_nf_fbd_name[] */
#define FERR_NF_FBD_ERR_MASK ((1 << 24) | (1 << 23) | (1 << 22) | (1 << 21) |\
			      (1 << 18) | (1 << 17) | (1 << 16) | (1 << 15) |\
			      (1 << 14) | (1 << 13) | (1 << 11) | (1 << 10) |\
			      (1 << 9)  | (1 << 8)  | (1 << 7)  | (1 << 6)  |\
			      (1 << 5)  | (1 << 4)  | (1 << 3)  | (1 << 2)  |\
			      (1 << 1)  | (1 << 0))
253
#define EMASK_FBD	0xa8
/*
 * Mask bits touched by the driver, grouped by contiguous range:
 * bits 27..24, bits 22..16 and bits 14..0 (bits 23 and 15 are left out).
 */
#define EMASK_FBD_ERR_MASK	(0x0f000000 | 0x007f0000 | 0x00007fff)
262
/*
 * Device 16.2: Global Error Registers
 */

#define FERR_GLOBAL_HI	0x48
/* Messages for FERR_GLOBAL_HI, indexed by bit number */
static const char *ferr_global_hi_name[] = {
	[3] = "FSB 3 Fatal Error",
	[2] = "FSB 2 Fatal Error",
	[1] = "FSB 1 Fatal Error",
	[0] = "FSB 0 Fatal Error",
};
/* Every error described for FERR_GLOBAL_HI is a fatal one */
#define ferr_global_hi_is_fatal(errnum)	1

#define FERR_GLOBAL_LO	0x40
/* Messages for FERR_GLOBAL_LO, indexed by bit number */
static const char *ferr_global_lo_name[] = {
	[31] = "Internal MCH Fatal Error",
	[30] = "Intel QuickData Technology Device Fatal Error",
	[29] = "FSB1 Fatal Error",
	[28] = "FSB0 Fatal Error",
	[27] = "FBD Channel 3 Fatal Error",
	[26] = "FBD Channel 2 Fatal Error",
	[25] = "FBD Channel 1 Fatal Error",
	[24] = "FBD Channel 0 Fatal Error",
	[23] = "PCI Express Device 7 Fatal Error",
	[22] = "PCI Express Device 6 Fatal Error",
	[21] = "PCI Express Device 5 Fatal Error",
	[20] = "PCI Express Device 4 Fatal Error",
	[19] = "PCI Express Device 3 Fatal Error",
	[18] = "PCI Express Device 2 Fatal Error",
	[17] = "PCI Express Device 1 Fatal Error",
	[16] = "ESI Fatal Error",
	[15] = "Internal MCH Non-Fatal Error",
	[14] = "Intel QuickData Technology Device Non Fatal Error",
	[13] = "FSB1 Non-Fatal Error",
	[12] = "FSB 0 Non-Fatal Error",
	[11] = "FBD Channel 3 Non-Fatal Error",
	[10] = "FBD Channel 2 Non-Fatal Error",
	[9]  = "FBD Channel 1 Non-Fatal Error",
	[8]  = "FBD Channel 0 Non-Fatal Error",
	[7]  = "PCI Express Device 7 Non-Fatal Error",
	[6]  = "PCI Express Device 6 Non-Fatal Error",
	[5]  = "PCI Express Device 5 Non-Fatal Error",
	[4]  = "PCI Express Device 4 Non-Fatal Error",
	[3]  = "PCI Express Device 3 Non-Fatal Error",
	[2]  = "PCI Express Device 2 Non-Fatal Error",
	[1]  = "PCI Express Device 1 Non-Fatal Error",
	[0]  = "ESI Non-Fatal Error",
};
/* Bits 31..16 describe fatal errors, bits 15..0 non-fatal ones */
#define ferr_global_lo_is_fatal(errnum)	(((errnum) < 16) ? 0 : 1)
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300312
/* Log registers read when reporting a fatal (non-recoverable) FBD error */
#define NRECMEMA	0xbe
  #define NRECMEMA_BANK(v)	(((v) >> 12) & 7)
  #define NRECMEMA_RANK(v)	(((v) >> 8) & 15)

#define NRECMEMB	0xc0
  /* 1U: shifting a signed 1 into bit 31 would be undefined behaviour */
  #define NRECMEMB_IS_WR(v)	((v) & (1U << 31))
  #define NRECMEMB_CAS(v)	(((v) >> 16) & 0x1fff)
  #define NRECMEMB_RAS(v)	((v) & 0xffff)

/* Read as the syndrome when reporting a non-fatal FBD error */
#define REDMEMA		0xdc

#define REDMEMB		0x7c
  /* Non-zero only when bit 17 is set (bit test, not a multiplication) */
  #define IS_SECOND_CH(v)	((v) & (1 << 17))

/* Log registers read when reporting a non-fatal (recoverable) FBD error */
#define RECMEMA		0xe0
  #define RECMEMA_BANK(v)	(((v) >> 12) & 7)
  #define RECMEMA_RANK(v)	(((v) >> 8) & 15)

#define RECMEMB		0xe4
  /* 1U: shifting a signed 1 into bit 31 would be undefined behaviour */
  #define RECMEMB_IS_WR(v)	((v) & (1U << 31))
  #define RECMEMB_CAS(v)	(((v) >> 16) & 0x1fff)
  #define RECMEMB_RAS(v)	((v) & 0xffff)
335
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300336/********************************************
337 * i7300 Functions related to error detection
338 ********************************************/
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300339
/**
 * get_err_from_table() - Gets the error message from a table
 * @table:	table name (array of char *)
 * @size:	number of elements at the table
 * @pos:	position of the element to be returned
 *
 * Returns the pos-th element of @table. When @pos falls outside the table
 * (negative, or greater than or equal to @size) or the entry is empty
 * (NULL), the string "Reserved" is returned instead, so the result can
 * always be printed with %s.
 *
 * Instead of calling it directly, prefer the GET_ERR_FROM_TABLE() macro,
 * which fills in the table size via ARRAY_SIZE().
 */
static const char *get_err_from_table(const char *table[], int size, int pos)
{
	/* Check both bounds before indexing, then catch holes in the table */
	if (pos < 0 || pos >= size || !table[pos])
		return "Reserved";

	return table[pos];
}

#define GET_ERR_FROM_TABLE(table, pos)	\
	get_err_from_table(table, ARRAY_SIZE(table), pos)
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300365
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300366/**
367 * i7300_process_error_global() - Retrieve the hardware error information from
368 * the hardware global error registers and
369 * sends it to dmesg
370 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300371 */
Mauro Carvalho Chehabf4277422010-08-27 10:33:25 -0300372static void i7300_process_error_global(struct mem_ctl_info *mci)
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300373{
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300374 struct i7300_pvt *pvt;
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300375 u32 errnum, value;
376 unsigned long errors;
377 const char *specific;
378 bool is_fatal;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300379
380 pvt = mci->pvt_info;
381
382 /* read in the 1st FATAL error register */
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300383 pci_read_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
384 FERR_GLOBAL_HI, &value);
385 if (unlikely(value)) {
386 errors = value;
387 errnum = find_first_bit(&errors,
388 ARRAY_SIZE(ferr_global_hi_name));
389 specific = GET_ERR_FROM_TABLE(ferr_global_hi_name, errnum);
390 is_fatal = ferr_global_hi_is_fatal(errnum);
Mauro Carvalho Chehab86002322010-08-27 00:46:57 -0300391
392 /* Clear the error bit */
393 pci_write_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
394 FERR_GLOBAL_HI, value);
395
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300396 goto error_global;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300397 }
398
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300399 pci_read_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
400 FERR_GLOBAL_LO, &value);
401 if (unlikely(value)) {
402 errors = value;
403 errnum = find_first_bit(&errors,
404 ARRAY_SIZE(ferr_global_lo_name));
405 specific = GET_ERR_FROM_TABLE(ferr_global_lo_name, errnum);
406 is_fatal = ferr_global_lo_is_fatal(errnum);
Mauro Carvalho Chehab86002322010-08-27 00:46:57 -0300407
408 /* Clear the error bit */
409 pci_write_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
410 FERR_GLOBAL_LO, value);
411
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300412 goto error_global;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300413 }
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300414 return;
415
416error_global:
417 i7300_mc_printk(mci, KERN_EMERG, "%s misc error: %s\n",
418 is_fatal ? "Fatal" : "NOT fatal", specific);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300419}
420
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300421/**
422 * i7300_process_fbd_error() - Retrieve the hardware error information from
423 * the FBD error registers and sends it via
424 * EDAC error API calls
425 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300426 */
Mauro Carvalho Chehabf4277422010-08-27 10:33:25 -0300427static void i7300_process_fbd_error(struct mem_ctl_info *mci)
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300428{
429 struct i7300_pvt *pvt;
430 u32 errnum, value;
Mauro Carvalho Chehab8199d8c2010-08-27 11:51:48 -0300431 u16 val16;
Mauro Carvalho Chehab37b69cf2010-08-27 15:44:43 -0300432 unsigned branch, channel, bank, rank, cas, ras;
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300433 u32 syndrome;
434
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300435 unsigned long errors;
436 const char *specific;
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300437 bool is_wr;
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300438
439 pvt = mci->pvt_info;
440
441 /* read in the 1st FATAL error register */
442 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
443 FERR_FAT_FBD, &value);
444 if (unlikely(value & FERR_FAT_FBD_ERR_MASK)) {
445 errors = value & FERR_FAT_FBD_ERR_MASK ;
446 errnum = find_first_bit(&errors,
447 ARRAY_SIZE(ferr_fat_fbd_name));
448 specific = GET_ERR_FROM_TABLE(ferr_fat_fbd_name, errnum);
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300449
450 branch = (GET_FBD_FAT_IDX(value) == 2) ? 1 : 0;
Mauro Carvalho Chehab8199d8c2010-08-27 11:51:48 -0300451 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map,
452 NRECMEMA, &val16);
453 bank = NRECMEMA_BANK(val16);
454 rank = NRECMEMA_RANK(val16);
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300455
Mauro Carvalho Chehab8199d8c2010-08-27 11:51:48 -0300456 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
457 NRECMEMB, &value);
458
459 is_wr = NRECMEMB_IS_WR(value);
460 cas = NRECMEMB_CAS(value);
461 ras = NRECMEMB_RAS(value);
462
463 snprintf(pvt->tmp_prt_buffer, PAGE_SIZE,
464 "FATAL (Branch=%d DRAM-Bank=%d %s "
465 "RAS=%d CAS=%d Err=0x%lx (%s))",
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300466 branch, bank,
Mauro Carvalho Chehab8199d8c2010-08-27 11:51:48 -0300467 is_wr ? "RDWR" : "RD",
468 ras, cas,
469 errors, specific);
470
471 /* Call the helper to output message */
472 edac_mc_handle_fbd_ue(mci, rank, branch << 1,
473 (branch << 1) + 1,
474 pvt->tmp_prt_buffer);
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300475 }
476
477 /* read in the 1st NON-FATAL error register */
478 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
479 FERR_NF_FBD, &value);
480 if (unlikely(value & FERR_NF_FBD_ERR_MASK)) {
481 errors = value & FERR_NF_FBD_ERR_MASK;
482 errnum = find_first_bit(&errors,
483 ARRAY_SIZE(ferr_nf_fbd_name));
484 specific = GET_ERR_FROM_TABLE(ferr_nf_fbd_name, errnum);
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300485
486 /* Clear the error bit */
487 pci_write_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
488 FERR_GLOBAL_LO, value);
489
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300490 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
491 REDMEMA, &syndrome);
492
493 branch = (GET_FBD_FAT_IDX(value) == 2) ? 1 : 0;
494 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map,
495 RECMEMA, &val16);
496 bank = RECMEMA_BANK(val16);
497 rank = RECMEMA_RANK(val16);
498
499 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
500 RECMEMB, &value);
501
502 is_wr = RECMEMB_IS_WR(value);
503 cas = RECMEMB_CAS(value);
504 ras = RECMEMB_RAS(value);
505
Mauro Carvalho Chehab37b69cf2010-08-27 15:44:43 -0300506 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
507 REDMEMB, &value);
508
509 channel = (branch << 1);
510 if (IS_SECOND_CH(value))
511 channel++;
512
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300513 /* Form out message */
514 snprintf(pvt->tmp_prt_buffer, PAGE_SIZE,
Mauro Carvalho Chehab37b69cf2010-08-27 15:44:43 -0300515 "Corrected error (Branch=%d, Channel %d), "
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300516 " DRAM-Bank=%d %s "
517 "RAS=%d CAS=%d, CE Err=0x%lx, Syndrome=0x%08x(%s))",
Mauro Carvalho Chehab37b69cf2010-08-27 15:44:43 -0300518 branch, channel,
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300519 bank,
520 is_wr ? "RDWR" : "RD",
521 ras, cas,
522 errors, syndrome, specific);
523
524 /*
525 * Call the helper to output message
526 * NOTE: Errors are reported per-branch, and not per-channel
527 * Currently, we don't know how to identify the right
528 * channel.
529 */
Mauro Carvalho Chehab37b69cf2010-08-27 15:44:43 -0300530 edac_mc_handle_fbd_ce(mci, rank, channel,
Mauro Carvalho Chehab32f94722010-08-27 12:13:05 -0300531 pvt->tmp_prt_buffer);
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300532 }
533 return;
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300534}
535
/**
 * i7300_check_error() - Calls the error checking subroutines
 * @mci: struct mem_ctl_info pointer
 *
 * The global error registers are processed first, then the FBD ones.
 */
static void i7300_check_error(struct mem_ctl_info *mci)
{
	i7300_process_error_global(mci);
	i7300_process_fbd_error(mci);
}
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300545
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300546/**
547 * i7300_clear_error() - Clears the error registers
548 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300549 */
550static void i7300_clear_error(struct mem_ctl_info *mci)
551{
Mauro Carvalho Chehabe4327602010-08-27 10:30:18 -0300552 struct i7300_pvt *pvt = mci->pvt_info;
553 u32 value;
554 /*
555 * All error values are RWC - we need to read and write 1 to the
556 * bit that we want to cleanup
557 */
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300558
Mauro Carvalho Chehabe4327602010-08-27 10:30:18 -0300559 /* Clear global error registers */
560 pci_read_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
561 FERR_GLOBAL_HI, &value);
562 pci_write_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
563 FERR_GLOBAL_HI, value);
564
565 pci_read_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
566 FERR_GLOBAL_LO, &value);
567 pci_write_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
568 FERR_GLOBAL_LO, value);
569
570 /* Clear FBD error registers */
571 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
572 FERR_FAT_FBD, &value);
573 pci_write_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
574 FERR_FAT_FBD, value);
575
576 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
577 FERR_NF_FBD, &value);
578 pci_write_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
579 FERR_NF_FBD, value);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300580}
581
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300582/**
583 * i7300_enable_error_reporting() - Enable the memory reporting logic at the
584 * hardware
585 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300586 */
587static void i7300_enable_error_reporting(struct mem_ctl_info *mci)
588{
Mauro Carvalho Chehab57021912010-08-27 10:22:36 -0300589 struct i7300_pvt *pvt = mci->pvt_info;
590 u32 fbd_error_mask;
591
592 /* Read the FBD Error Mask Register */
593 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
594 EMASK_FBD, &fbd_error_mask);
595
596 /* Enable with a '0' */
597 fbd_error_mask &= ~(EMASK_FBD_ERR_MASK);
598
599 pci_write_config_dword(pvt->pci_dev_16_1_fsb_addr_map,
600 EMASK_FBD, fbd_error_mask);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300601}
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300602
603/************************************************
604 * i7300 Functions related to memory enumeration
605 ************************************************/
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300606
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300607/**
608 * decode_mtr() - Decodes the MTR descriptor, filling the edac structs
609 * @pvt: pointer to the private data struct used by i7300 driver
610 * @slot: DIMM slot (0 to 7)
611 * @ch: Channel number within the branch (0 or 1)
612 * @branch: Branch number (0 or 1)
613 * @dinfo: Pointer to DIMM info where dimm size is stored
614 * @p_csrow: Pointer to the struct csrow_info that corresponds to that element
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300615 */
616static int decode_mtr(struct i7300_pvt *pvt,
617 int slot, int ch, int branch,
618 struct i7300_dimm_info *dinfo,
619 struct csrow_info *p_csrow)
620{
621 int mtr, ans, addrBits, channel;
622
623 channel = to_channel(ch, branch);
624
625 mtr = pvt->mtr[slot][branch];
626 ans = MTR_DIMMS_PRESENT(mtr) ? 1 : 0;
627
628 debugf2("\tMTR%d CH%d: DIMMs are %s (mtr)\n",
629 slot, channel,
630 ans ? "Present" : "NOT Present");
631
632 /* Determine if there is a DIMM present in this DIMM slot */
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300633 if (!ans)
634 return 0;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300635
636 /* Start with the number of bits for a Bank
637 * on the DRAM */
638 addrBits = MTR_DRAM_BANKS_ADDR_BITS;
639 /* Add thenumber of ROW bits */
640 addrBits += MTR_DIMM_ROWS_ADDR_BITS(mtr);
641 /* add the number of COLUMN bits */
642 addrBits += MTR_DIMM_COLS_ADDR_BITS(mtr);
643 /* add the number of RANK bits */
644 addrBits += MTR_DIMM_RANKS(mtr);
645
646 addrBits += 6; /* add 64 bits per DIMM */
647 addrBits -= 20; /* divide by 2^^20 */
648 addrBits -= 3; /* 8 bits per bytes */
649
650 dinfo->megabytes = 1 << addrBits;
651
652 debugf2("\t\tWIDTH: x%d\n", MTR_DRAM_WIDTH(mtr));
653
654 debugf2("\t\tELECTRICAL THROTTLING is %s\n",
655 MTR_DIMMS_ETHROTTLE(mtr) ? "enabled" : "disabled");
656
657 debugf2("\t\tNUMBANK: %d bank(s)\n", MTR_DRAM_BANKS(mtr));
658 debugf2("\t\tNUMRANK: %s\n", MTR_DIMM_RANKS(mtr) ? "double" : "single");
659 debugf2("\t\tNUMROW: %s\n", numrow_toString[MTR_DIMM_ROWS(mtr)]);
660 debugf2("\t\tNUMCOL: %s\n", numcol_toString[MTR_DIMM_COLS(mtr)]);
661 debugf2("\t\tSIZE: %d MB\n", dinfo->megabytes);
662
663 p_csrow->grain = 8;
664 p_csrow->nr_pages = dinfo->megabytes << 8;
665 p_csrow->mtype = MEM_FB_DDR2;
Mauro Carvalho Chehab116389e2010-08-26 23:19:54 -0300666
667 /*
Mauro Carvalho Chehab15154c52010-08-27 09:16:06 -0300668 * The type of error detection actually depends of the
Mauro Carvalho Chehab116389e2010-08-26 23:19:54 -0300669 * mode of operation. When it is just one single memory chip, at
Mauro Carvalho Chehab15154c52010-08-27 09:16:06 -0300670 * socket 0, channel 0, it uses 8-byte-over-32-byte SECDED+ code.
671 * In normal or mirrored mode, it uses Lockstep mode,
Mauro Carvalho Chehab116389e2010-08-26 23:19:54 -0300672 * with the possibility of using an extended algorithm for x8 memories
673 * See datasheet Sections 7.3.6 to 7.3.8
674 */
Mauro Carvalho Chehab15154c52010-08-27 09:16:06 -0300675
676 if (IS_SINGLE_MODE(pvt->mc_settings_a)) {
677 p_csrow->edac_mode = EDAC_SECDED;
Mauro Carvalho Chehab3b330f62010-08-27 10:39:35 -0300678 debugf2("\t\tECC code is 8-byte-over-32-byte SECDED+ code\n");
Mauro Carvalho Chehab15154c52010-08-27 09:16:06 -0300679 } else {
Mauro Carvalho Chehab3b330f62010-08-27 10:39:35 -0300680 debugf2("\t\tECC code is on Lockstep mode\n");
Mauro Carvalho Chehab28c2ce72010-08-27 11:20:38 -0300681 if (MTR_DRAM_WIDTH(mtr) == 8)
Mauro Carvalho Chehab15154c52010-08-27 09:16:06 -0300682 p_csrow->edac_mode = EDAC_S8ECD8ED;
683 else
684 p_csrow->edac_mode = EDAC_S4ECD4ED;
685 }
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300686
687 /* ask what device type on this row */
Mauro Carvalho Chehab28c2ce72010-08-27 11:20:38 -0300688 if (MTR_DRAM_WIDTH(mtr) == 8) {
Mauro Carvalho Chehab3b330f62010-08-27 10:39:35 -0300689 debugf2("\t\tScrub algorithm for x8 is on %s mode\n",
Mauro Carvalho Chehabd7de2bd2010-08-27 08:56:48 -0300690 IS_SCRBALGO_ENHANCED(pvt->mc_settings) ?
691 "enhanced" : "normal");
692
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300693 p_csrow->dtype = DEV_X8;
Mauro Carvalho Chehabd7de2bd2010-08-27 08:56:48 -0300694 } else
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300695 p_csrow->dtype = DEV_X4;
696
697 return mtr;
698}
699
/**
 * print_dimm_size() - Prints dump of the memory organization
 * @pvt: pointer to the private data struct used by i7300 driver
 *
 * Debug aid: emits a table with one row per slot and one column per
 * channel, holding the size stored at pvt->dimm_info. Each output line is
 * built at pvt->tmp_prt_buffer. Without CONFIG_EDAC_DEBUG the function
 * body is empty.
 */
static void print_dimm_size(struct i7300_pvt *pvt)
{
#ifdef CONFIG_EDAC_DEBUG
	char *const line = pvt->tmp_prt_buffer;
	int used, slot, channel;

	/* Header: one title per channel */
	used = snprintf(line, PAGE_SIZE, " ");
	for (channel = 0; channel < MAX_CHANNELS; channel++)
		used += snprintf(line + used, PAGE_SIZE - used,
				 "channel %d | ", channel);
	debugf2("%s\n", line);

	/* Ruler below the header */
	snprintf(line, PAGE_SIZE, "-------------------------------"
				  "------------------------------");
	debugf2("%s\n", line);

	/* One row per slot, each row restarting at the top of the buffer */
	for (slot = 0; slot < MAX_SLOTS; slot++) {
		used = snprintf(line, PAGE_SIZE, "csrow/SLOT %d ", slot);

		for (channel = 0; channel < MAX_CHANNELS; channel++)
			used += snprintf(line + used, PAGE_SIZE - used,
					 "%4d MB | ",
					 pvt->dimm_info[slot][channel].megabytes);

		debugf2("%s\n", line);
	}

	/* Closing ruler */
	snprintf(line, PAGE_SIZE, "-------------------------------"
				  "------------------------------");
	debugf2("%s\n", line);
#endif
}
762
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300763/**
764 * i7300_init_csrows() - Initialize the 'csrows' table within
765 * the mci control structure with the
766 * addressing of memory.
767 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300768 */
769static int i7300_init_csrows(struct mem_ctl_info *mci)
770{
771 struct i7300_pvt *pvt;
772 struct i7300_dimm_info *dinfo;
773 struct csrow_info *p_csrow;
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300774 int rc = -ENODEV;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300775 int mtr;
776 int ch, branch, slot, channel;
777
778 pvt = mci->pvt_info;
779
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300780 debugf2("Memory Technology Registers:\n");
781
782 /* Get the AMB present registers for the four channels */
783 for (branch = 0; branch < MAX_BRANCHES; branch++) {
784 /* Read and dump branch 0's MTRs */
785 channel = to_channel(0, branch);
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300786 pci_read_config_word(pvt->pci_dev_2x_0_fbd_branch[branch], AMBPRESENT_0,
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300787 &pvt->ambpresent[channel]);
788 debugf2("\t\tAMB-present CH%d = 0x%x:\n",
789 channel, pvt->ambpresent[channel]);
790
791 channel = to_channel(1, branch);
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300792 pci_read_config_word(pvt->pci_dev_2x_0_fbd_branch[branch], AMBPRESENT_1,
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300793 &pvt->ambpresent[channel]);
794 debugf2("\t\tAMB-present CH%d = 0x%x:\n",
795 channel, pvt->ambpresent[channel]);
796 }
797
798 /* Get the set of MTR[0-7] regs by each branch */
799 for (slot = 0; slot < MAX_SLOTS; slot++) {
800 int where = mtr_regs[slot];
801 for (branch = 0; branch < MAX_BRANCHES; branch++) {
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300802 pci_read_config_word(pvt->pci_dev_2x_0_fbd_branch[branch],
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300803 where,
804 &pvt->mtr[slot][branch]);
805 for (ch = 0; ch < MAX_BRANCHES; ch++) {
806 int channel = to_channel(ch, branch);
807
808 dinfo = &pvt->dimm_info[slot][channel];
809 p_csrow = &mci->csrows[slot];
810
811 mtr = decode_mtr(pvt, slot, ch, branch,
812 dinfo, p_csrow);
813 /* if no DIMMS on this row, continue */
814 if (!MTR_DIMMS_PRESENT(mtr))
815 continue;
816
817 p_csrow->csrow_idx = slot;
818
819 /* FAKE OUT VALUES, FIXME */
820 p_csrow->first_page = 0 + slot * 20;
821 p_csrow->last_page = 9 + slot * 20;
822 p_csrow->page_mask = 0xfff;
823
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300824 rc = 0;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300825 }
826 }
827 }
828
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300829 return rc;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300830}
831
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300832/**
833 * decode_mir() - Decodes Memory Interleave Register (MIR) info
834 * @int mir_no: number of the MIR register to decode
835 * @mir: array with the MIR data cached on the driver
836 */
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300837static void decode_mir(int mir_no, u16 mir[MAX_MIR])
838{
839 if (mir[mir_no] & 3)
840 debugf2("MIR%d: limit= 0x%x Branch(es) that participate: %s %s\n",
841 mir_no,
842 (mir[mir_no] >> 4) & 0xfff,
843 (mir[mir_no] & 1) ? "B0" : "",
844 (mir[mir_no] & 2) ? "B1": "");
845}
846
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300847/**
848 * i7300_get_mc_regs() - Get the contents of the MC enumeration registers
849 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300850 *
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300851 * Data read is cached internally for its usage when needed
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300852 */
853static int i7300_get_mc_regs(struct mem_ctl_info *mci)
854{
855 struct i7300_pvt *pvt;
856 u32 actual_tolm;
857 int i, rc;
858
859 pvt = mci->pvt_info;
860
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300861 pci_read_config_dword(pvt->pci_dev_16_0_fsb_ctlr, AMBASE,
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300862 (u32 *) &pvt->ambase);
863
864 debugf2("AMBASE= 0x%lx\n", (long unsigned int)pvt->ambase);
865
866 /* Get the Branch Map regs */
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300867 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, TOLM, &pvt->tolm);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300868 pvt->tolm >>= 12;
869 debugf2("TOLM (number of 256M regions) =%u (0x%x)\n", pvt->tolm,
870 pvt->tolm);
871
872 actual_tolm = (u32) ((1000l * pvt->tolm) >> (30 - 28));
873 debugf2("Actual TOLM byte addr=%u.%03u GB (0x%x)\n",
874 actual_tolm/1000, actual_tolm % 1000, pvt->tolm << 28);
875
Mauro Carvalho Chehabaf3d8832010-08-26 20:58:45 -0300876 /* Get memory controller settings */
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300877 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map, MC_SETTINGS,
Mauro Carvalho Chehabaf3d8832010-08-26 20:58:45 -0300878 &pvt->mc_settings);
Mauro Carvalho Chehabbb81a212010-08-27 09:04:11 -0300879 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map, MC_SETTINGS_A,
880 &pvt->mc_settings_a);
Mauro Carvalho Chehabd7de2bd2010-08-27 08:56:48 -0300881
Mauro Carvalho Chehabbb81a212010-08-27 09:04:11 -0300882 if (IS_SINGLE_MODE(pvt->mc_settings_a))
883 debugf0("Memory controller operating on single mode\n");
884 else
885 debugf0("Memory controller operating on %s mode\n",
Mauro Carvalho Chehabd7de2bd2010-08-27 08:56:48 -0300886 IS_MIRRORED(pvt->mc_settings) ? "mirrored" : "non-mirrored");
Mauro Carvalho Chehabbb81a212010-08-27 09:04:11 -0300887
Mauro Carvalho Chehabaf3d8832010-08-26 20:58:45 -0300888 debugf0("Error detection is %s\n",
Mauro Carvalho Chehabd7de2bd2010-08-27 08:56:48 -0300889 IS_ECC_ENABLED(pvt->mc_settings) ? "enabled" : "disabled");
890 debugf0("Retry is %s\n",
891 IS_RETRY_ENABLED(pvt->mc_settings) ? "enabled" : "disabled");
Mauro Carvalho Chehabaf3d8832010-08-26 20:58:45 -0300892
893 /* Get Memory Interleave Range registers */
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300894 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, MIR0, &pvt->mir[0]);
895 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, MIR1, &pvt->mir[1]);
896 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, MIR2, &pvt->mir[2]);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300897
898 /* Decode the MIR regs */
899 for (i = 0; i < MAX_MIR; i++)
900 decode_mir(i, pvt->mir);
901
902 rc = i7300_init_csrows(mci);
903 if (rc < 0)
904 return rc;
905
906 /* Go and determine the size of each DIMM and place in an
907 * orderly matrix */
908 print_dimm_size(pvt);
909
910 return 0;
911}
912
Mauro Carvalho Chehab5de6e072010-08-27 00:16:12 -0300913/*************************************************
914 * i7300 Functions related to device probe/release
915 *************************************************/
916
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300917/**
918 * i7300_put_devices() - Release the PCI devices
919 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300920 */
921static void i7300_put_devices(struct mem_ctl_info *mci)
922{
923 struct i7300_pvt *pvt;
924 int branch;
925
926 pvt = mci->pvt_info;
927
928 /* Decrement usage count for devices */
929 for (branch = 0; branch < MAX_CH_PER_BRANCH; branch++)
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300930 pci_dev_put(pvt->pci_dev_2x_0_fbd_branch[branch]);
931 pci_dev_put(pvt->pci_dev_16_2_fsb_err_regs);
932 pci_dev_put(pvt->pci_dev_16_1_fsb_addr_map);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300933}
934
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300935/**
936 * i7300_get_devices() - Find and perform 'get' operation on the MCH's
937 * device/functions we want to reference for this driver
938 * @mci: struct mem_ctl_info pointer
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300939 *
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300940 * Access and prepare the several devices for usage:
941 * I7300 devices used by this driver:
942 * Device 16, functions 0,1 and 2: PCI_DEVICE_ID_INTEL_I7300_MCH_ERR
943 * Device 21 function 0: PCI_DEVICE_ID_INTEL_I7300_MCH_FB0
944 * Device 22 function 0: PCI_DEVICE_ID_INTEL_I7300_MCH_FB1
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300945 */
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -0300946static int __devinit i7300_get_devices(struct mem_ctl_info *mci)
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300947{
948 struct i7300_pvt *pvt;
949 struct pci_dev *pdev;
950
951 pvt = mci->pvt_info;
952
953 /* Attempt to 'get' the MCH register we want */
954 pdev = NULL;
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300955 while (!pvt->pci_dev_16_1_fsb_addr_map || !pvt->pci_dev_16_2_fsb_err_regs) {
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300956 pdev = pci_get_device(PCI_VENDOR_ID_INTEL,
957 PCI_DEVICE_ID_INTEL_I7300_MCH_ERR, pdev);
958 if (!pdev) {
959 /* End of list, leave */
960 i7300_printk(KERN_ERR,
961 "'system address,Process Bus' "
962 "device not found:"
963 "vendor 0x%x device 0x%x ERR funcs "
964 "(broken BIOS?)\n",
965 PCI_VENDOR_ID_INTEL,
966 PCI_DEVICE_ID_INTEL_I7300_MCH_ERR);
967 goto error;
968 }
969
970 /* Store device 16 funcs 1 and 2 */
971 switch (PCI_FUNC(pdev->devfn)) {
972 case 1:
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300973 pvt->pci_dev_16_1_fsb_addr_map = pdev;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300974 break;
975 case 2:
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300976 pvt->pci_dev_16_2_fsb_err_regs = pdev;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300977 break;
978 }
979 }
980
981 debugf1("System Address, processor bus- PCI Bus ID: %s %x:%x\n",
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300982 pci_name(pvt->pci_dev_16_0_fsb_ctlr),
983 pvt->pci_dev_16_0_fsb_ctlr->vendor, pvt->pci_dev_16_0_fsb_ctlr->device);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300984 debugf1("Branchmap, control and errors - PCI Bus ID: %s %x:%x\n",
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300985 pci_name(pvt->pci_dev_16_1_fsb_addr_map),
986 pvt->pci_dev_16_1_fsb_addr_map->vendor, pvt->pci_dev_16_1_fsb_addr_map->device);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300987 debugf1("FSB Error Regs - PCI Bus ID: %s %x:%x\n",
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300988 pci_name(pvt->pci_dev_16_2_fsb_err_regs),
989 pvt->pci_dev_16_2_fsb_err_regs->vendor, pvt->pci_dev_16_2_fsb_err_regs->device);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300990
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300991 pvt->pci_dev_2x_0_fbd_branch[0] = pci_get_device(PCI_VENDOR_ID_INTEL,
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300992 PCI_DEVICE_ID_INTEL_I7300_MCH_FB0,
993 NULL);
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -0300994 if (!pvt->pci_dev_2x_0_fbd_branch[0]) {
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -0300995 i7300_printk(KERN_ERR,
996 "MC: 'BRANCH 0' device not found:"
997 "vendor 0x%x device 0x%x Func 0 (broken BIOS?)\n",
998 PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_I7300_MCH_FB0);
999 goto error;
1000 }
1001
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -03001002 pvt->pci_dev_2x_0_fbd_branch[1] = pci_get_device(PCI_VENDOR_ID_INTEL,
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001003 PCI_DEVICE_ID_INTEL_I7300_MCH_FB1,
1004 NULL);
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -03001005 if (!pvt->pci_dev_2x_0_fbd_branch[1]) {
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001006 i7300_printk(KERN_ERR,
1007 "MC: 'BRANCH 1' device not found:"
1008 "vendor 0x%x device 0x%x Func 0 "
1009 "(broken BIOS?)\n",
1010 PCI_VENDOR_ID_INTEL,
1011 PCI_DEVICE_ID_INTEL_I7300_MCH_FB1);
1012 goto error;
1013 }
1014
1015 return 0;
1016
1017error:
1018 i7300_put_devices(mci);
1019 return -ENODEV;
1020}
1021
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001022/**
1023 * i7300_init_one() - Probe for one instance of the device
1024 * @pdev: struct pci_dev pointer
1025 * @id: struct pci_device_id pointer - currently unused
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001026 */
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001027static int __devinit i7300_init_one(struct pci_dev *pdev,
1028 const struct pci_device_id *id)
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001029{
1030 struct mem_ctl_info *mci;
1031 struct i7300_pvt *pvt;
1032 int num_channels;
1033 int num_dimms_per_channel;
1034 int num_csrows;
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001035 int rc;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001036
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001037 /* wake up device */
1038 rc = pci_enable_device(pdev);
1039 if (rc == -EIO)
1040 return rc;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001041
1042 debugf0("MC: " __FILE__ ": %s(), pdev bus %u dev=0x%x fn=0x%x\n",
1043 __func__,
1044 pdev->bus->number,
1045 PCI_SLOT(pdev->devfn), PCI_FUNC(pdev->devfn));
1046
1047 /* We only are looking for func 0 of the set */
1048 if (PCI_FUNC(pdev->devfn) != 0)
1049 return -ENODEV;
1050
1051 /* As we don't have a motherboard identification routine to determine
1052 * actual number of slots/dimms per channel, we thus utilize the
1053 * resource as specified by the chipset. Thus, we might have
1054 * have more DIMMs per channel than actually on the mobo, but this
1055 * allows the driver to support upto the chipset max, without
1056 * some fancy mobo determination.
1057 */
1058 num_dimms_per_channel = MAX_SLOTS;
1059 num_channels = MAX_CHANNELS;
1060 num_csrows = MAX_SLOTS * MAX_CHANNELS;
1061
1062 debugf0("MC: %s(): Number of - Channels= %d DIMMS= %d CSROWS= %d\n",
1063 __func__, num_channels, num_dimms_per_channel, num_csrows);
1064
1065 /* allocate a new MC control structure */
1066 mci = edac_mc_alloc(sizeof(*pvt), num_csrows, num_channels, 0);
1067
1068 if (mci == NULL)
1069 return -ENOMEM;
1070
1071 debugf0("MC: " __FILE__ ": %s(): mci = %p\n", __func__, mci);
1072
1073 mci->dev = &pdev->dev; /* record ptr to the generic device */
1074
1075 pvt = mci->pvt_info;
Mauro Carvalho Chehab3e57eef2010-08-26 23:38:11 -03001076 pvt->pci_dev_16_0_fsb_ctlr = pdev; /* Record this device in our private */
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001077
Mauro Carvalho Chehab85580ea2010-08-27 11:36:23 -03001078 pvt->tmp_prt_buffer = kmalloc(PAGE_SIZE, GFP_KERNEL);
1079 if (!pvt->tmp_prt_buffer) {
1080 edac_mc_free(mci);
1081 return -ENOMEM;
1082 }
1083
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001084 /* 'get' the pci devices we want to reserve for our use */
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001085 if (i7300_get_devices(mci))
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001086 goto fail0;
1087
1088 mci->mc_idx = 0;
1089 mci->mtype_cap = MEM_FLAG_FB_DDR2;
1090 mci->edac_ctl_cap = EDAC_FLAG_NONE;
1091 mci->edac_cap = EDAC_FLAG_NONE;
1092 mci->mod_name = "i7300_edac.c";
1093 mci->mod_ver = I7300_REVISION;
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001094 mci->ctl_name = i7300_devs[0].ctl_name;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001095 mci->dev_name = pci_name(pdev);
1096 mci->ctl_page_to_phys = NULL;
1097
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001098 /* Set the function pointer to an actual operation function */
1099 mci->edac_check = i7300_check_error;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001100
1101 /* initialize the MC control structure 'csrows' table
1102 * with the mapping and control information */
1103 if (i7300_get_mc_regs(mci)) {
1104 debugf0("MC: Setting mci->edac_cap to EDAC_FLAG_NONE\n"
1105 " because i7300_init_csrows() returned nonzero "
1106 "value\n");
1107 mci->edac_cap = EDAC_FLAG_NONE; /* no csrows found */
1108 } else {
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001109 debugf1("MC: Enable error reporting now\n");
1110 i7300_enable_error_reporting(mci);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001111 }
1112
1113 /* add this new MC control structure to EDAC's list of MCs */
1114 if (edac_mc_add_mc(mci)) {
1115 debugf0("MC: " __FILE__
1116 ": %s(): failed edac_mc_add_mc()\n", __func__);
1117 /* FIXME: perhaps some code should go here that disables error
1118 * reporting if we just enabled it
1119 */
1120 goto fail1;
1121 }
1122
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001123 i7300_clear_error(mci);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001124
1125 /* allocating generic PCI control info */
1126 i7300_pci = edac_pci_create_generic_ctl(&pdev->dev, EDAC_MOD_STR);
1127 if (!i7300_pci) {
1128 printk(KERN_WARNING
1129 "%s(): Unable to create PCI control\n",
1130 __func__);
1131 printk(KERN_WARNING
1132 "%s(): PCI error report via EDAC not setup\n",
1133 __func__);
1134 }
1135
1136 return 0;
1137
1138 /* Error exit unwinding stack */
1139fail1:
1140
1141 i7300_put_devices(mci);
1142
1143fail0:
Mauro Carvalho Chehab85580ea2010-08-27 11:36:23 -03001144 kfree(pvt->tmp_prt_buffer);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001145 edac_mc_free(mci);
1146 return -ENODEV;
1147}
1148
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001149/**
1150 * i7300_remove_one() - Remove the driver
1151 * @pdev: struct pci_dev pointer
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001152 */
1153static void __devexit i7300_remove_one(struct pci_dev *pdev)
1154{
1155 struct mem_ctl_info *mci;
Mauro Carvalho Chehab85580ea2010-08-27 11:36:23 -03001156 char *tmp;
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001157
1158 debugf0(__FILE__ ": %s()\n", __func__);
1159
1160 if (i7300_pci)
1161 edac_pci_release_generic_ctl(i7300_pci);
1162
1163 mci = edac_mc_del_mc(&pdev->dev);
1164 if (!mci)
1165 return;
1166
Mauro Carvalho Chehab85580ea2010-08-27 11:36:23 -03001167 tmp = ((struct i7300_pvt *)mci->pvt_info)->tmp_prt_buffer;
1168
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001169 /* retrieve references to resources, and free those resources */
1170 i7300_put_devices(mci);
1171
Mauro Carvalho Chehab85580ea2010-08-27 11:36:23 -03001172 kfree(tmp);
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001173 edac_mc_free(mci);
1174}
1175
1176/*
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001177 * pci_device_id: table for which devices we are looking for
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001178 *
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001179 * Has only 8086:360c PCI ID
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001180 */
1181static const struct pci_device_id i7300_pci_tbl[] __devinitdata = {
1182 {PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_I7300_MCH_ERR)},
1183 {0,} /* 0 terminated list. */
1184};
1185
1186MODULE_DEVICE_TABLE(pci, i7300_pci_tbl);
1187
1188/*
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001189 * i7300_driver: pci_driver structure for this module
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001190 */
1191static struct pci_driver i7300_driver = {
1192 .name = "i7300_edac",
1193 .probe = i7300_init_one,
1194 .remove = __devexit_p(i7300_remove_one),
1195 .id_table = i7300_pci_tbl,
1196};
1197
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001198/**
1199 * i7300_init() - Registers the driver
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001200 */
1201static int __init i7300_init(void)
1202{
1203 int pci_rc;
1204
1205 debugf2("MC: " __FILE__ ": %s()\n", __func__);
1206
1207 /* Ensure that the OPSTATE is set correctly for POLL or NMI */
1208 opstate_init();
1209
1210 pci_rc = pci_register_driver(&i7300_driver);
1211
1212 return (pci_rc < 0) ? pci_rc : 0;
1213}
1214
Mauro Carvalho Chehabd091a6e2010-08-27 17:28:50 -03001215/**
1216 * i7300_init() - Unregisters the driver
Mauro Carvalho Chehabfcaf7802010-08-24 23:22:57 -03001217 */
1218static void __exit i7300_exit(void)
1219{
1220 debugf2("MC: " __FILE__ ": %s()\n", __func__);
1221 pci_unregister_driver(&i7300_driver);
1222}
1223
1224module_init(i7300_init);
1225module_exit(i7300_exit);
1226
1227MODULE_LICENSE("GPL");
1228MODULE_AUTHOR("Mauro Carvalho Chehab <mchehab@redhat.com>");
1229MODULE_AUTHOR("Red Hat Inc. (http://www.redhat.com)");
1230MODULE_DESCRIPTION("MC Driver for Intel I7300 memory controllers - "
1231 I7300_REVISION);
1232
1233module_param(edac_op_state, int, 0444);
1234MODULE_PARM_DESC(edac_op_state, "EDAC Error Reporting state: 0=Poll,1=NMI");