diff options
author | Mauro Carvalho Chehab <mchehab@redhat.com> | 2010-08-24 22:22:57 -0400 |
---|---|---|
committer | Mauro Carvalho Chehab <mchehab@redhat.com> | 2010-08-30 13:56:42 -0400 |
commit | fcaf780b2ad352edaeb1d1c07a6da053266b1eed (patch) | |
tree | 8ea1e46a19282b13c66442d144d59ca6cafb418d /drivers/edac/i7300_edac.c | |
parent | da5cabf80e2433131bf0ed8993abc0f7ea618c73 (diff) |
i7300_edac: start a driver for i7300 chipset (Clarksboro)
Signed-off-by: Mauro Carvalho Chehab <mchehab@redhat.com>
Diffstat (limited to 'drivers/edac/i7300_edac.c')
-rw-r--r-- | drivers/edac/i7300_edac.c | 1373 |
1 files changed, 1373 insertions, 0 deletions
diff --git a/drivers/edac/i7300_edac.c b/drivers/edac/i7300_edac.c new file mode 100644 index 000000000000..eb3f30e96ee3 --- /dev/null +++ b/drivers/edac/i7300_edac.c | |||
@@ -0,0 +1,1373 @@ | |||
1 | /* | ||
2 | * Intel 7300 class Memory Controllers kernel module (Clarksboro) | ||
3 | * | ||
4 | * This file may be distributed under the terms of the | ||
5 | * GNU General Public License version 2 only. | ||
6 | * | ||
7 | * Copyright (c) 2010 by: | ||
8 | * Mauro Carvalho Chehab <mchehab@redhat.com> | ||
9 | * | ||
10 | * Red Hat Inc. http://www.redhat.com | ||
11 | * | ||
12 | * Intel 7300 Chipset Memory Controller Hub (MCH) - Datasheet | ||
13 | * http://www.intel.com/Assets/PDF/datasheet/318082.pdf | ||
14 | * | ||
15 | * TODO: The chipset allow checking for PCI Express errors also. Currently, | ||
16 | * the driver covers only memory error errors | ||
17 | * | ||
18 | * This driver uses "csrows" EDAC attribute to represent DIMM slot# | ||
19 | */ | ||
20 | |||
21 | #include <linux/module.h> | ||
22 | #include <linux/init.h> | ||
23 | #include <linux/pci.h> | ||
24 | #include <linux/pci_ids.h> | ||
25 | #include <linux/slab.h> | ||
26 | #include <linux/edac.h> | ||
27 | #include <linux/mmzone.h> | ||
28 | |||
29 | #include "edac_core.h" | ||
30 | |||
31 | /* | ||
32 | * Alter this version for the I7300 module when modifications are made | ||
33 | */ | ||
34 | #define I7300_REVISION " Ver: 1.0.0 " __DATE__ | ||
35 | |||
36 | #define EDAC_MOD_STR "i7300_edac" | ||
37 | |||
38 | #define i7300_printk(level, fmt, arg...) \ | ||
39 | edac_printk(level, "i7300", fmt, ##arg) | ||
40 | |||
41 | #define i7300_mc_printk(mci, level, fmt, arg...) \ | ||
42 | edac_mc_chipset_printk(mci, level, "i7300", fmt, ##arg) | ||
43 | |||
44 | /* | ||
45 | * Memory topology is organized as: | ||
46 | * Branch 0 - 2 channels: channels 0 and 1 (FDB0 PCI dev 21.0) | ||
47 | * Branch 1 - 2 channels: channels 2 and 3 (FDB1 PCI dev 22.0) | ||
48 | * Each channel can have to 8 DIMM sets (called as SLOTS) | ||
49 | * Slots should generally be filled in pairs | ||
50 | * Except on Single Channel mode of operation | ||
51 | * just slot 0/channel0 filled on this mode | ||
52 | * On normal operation mode, the two channels on a branch should be | ||
53 | filled together for the same SLOT# | ||
54 | * When in mirrored mode, Branch 1 replicate memory at Branch 0, so, the four | ||
55 | * channels on both branches should be filled | ||
56 | */ | ||
57 | |||
58 | /* Limits for i7300 */ | ||
59 | #define MAX_SLOTS 8 | ||
60 | #define MAX_BRANCHES 2 | ||
61 | #define MAX_CH_PER_BRANCH 2 | ||
62 | #define MAX_CHANNELS (MAX_CH_PER_BRANCH * MAX_BRANCHES) | ||
63 | #define MAX_MIR 3 | ||
64 | |||
65 | #define to_channel(ch, branch) ((((branch)) << 1) | (ch)) | ||
66 | |||
67 | #define to_csrow(slot, ch, branch) \ | ||
68 | (to_channel(ch, branch) | ((slot) << 2)) | ||
69 | |||
70 | |||
71 | /* Device 16, | ||
72 | * Function 0: System Address (not documented) | ||
73 | * Function 1: Memory Branch Map, Control, Errors Register | ||
74 | * Function 2: FSB Error Registers | ||
75 | * | ||
76 | * All 3 functions of Device 16 (0,1,2) share the SAME DID and | ||
77 | * uses PCI_DEVICE_ID_INTEL_I7300_MCH_ERR for device 16 (0,1,2), | ||
78 | * PCI_DEVICE_ID_INTEL_I7300_MCH_FB0 and PCI_DEVICE_ID_INTEL_I7300_MCH_FB1 | ||
79 | * for device 21 (0,1). | ||
80 | */ | ||
81 | |||
82 | /* OFFSETS for Function 0 */ | ||
83 | #define AMBASE 0x48 /* AMB Mem Mapped Reg Region Base */ | ||
84 | #define MAXCH 0x56 /* Max Channel Number */ | ||
85 | #define MAXDIMMPERCH 0x57 /* Max DIMM PER Channel Number */ | ||
86 | |||
87 | /* OFFSETS for Function 1 */ | ||
88 | #define TOLM 0x6C | ||
89 | #define REDMEMB 0x7C | ||
90 | |||
91 | #define MIR0 0x80 | ||
92 | #define MIR1 0x84 | ||
93 | #define MIR2 0x88 | ||
94 | |||
95 | #if 0 | ||
96 | #define AMIR0 0x8c | ||
97 | #define AMIR1 0x90 | ||
98 | #define AMIR2 0x94 | ||
99 | |||
100 | /*TODO: double check it */ | ||
101 | #define REC_ECC_LOCATOR_ODD(x) ((x) & 0x3fe00) /* bits [17:9] indicate ODD, [8:0] indicate EVEN */ | ||
102 | |||
103 | /* Fatal error registers */ | ||
104 | #define FERR_FAT_FBD 0x98 | ||
105 | |||
106 | /*TODO: double check it */ | ||
107 | #define FERR_FAT_FBDCHAN (3<<28) /* channel index where the highest-order error occurred */ | ||
108 | |||
109 | #define NERR_FAT_FBD 0x9c | ||
110 | #define FERR_NF_FBD 0xa0 | ||
111 | |||
112 | /* Non-fatal error register */ | ||
113 | #define NERR_NF_FBD 0xa4 | ||
114 | |||
115 | /* Enable error mask */ | ||
116 | #define EMASK_FBD 0xa8 | ||
117 | |||
118 | #define ERR0_FBD 0xac | ||
119 | #define ERR1_FBD 0xb0 | ||
120 | #define ERR2_FBD 0xb4 | ||
121 | #define MCERR_FBD 0xb8 | ||
122 | |||
123 | #endif | ||
124 | |||
125 | /* TODO: Dev 16 fn1 allows memory error injection - offsets 0x100-0x10b */ | ||
126 | |||
127 | /* TODO: OFFSETS for Device 16 Function 2 */ | ||
128 | |||
129 | /* | ||
130 | * Device 21, | ||
131 | * Function 0: Memory Map Branch 0 | ||
132 | * | ||
133 | * Device 22, | ||
134 | * Function 0: Memory Map Branch 1 | ||
135 | */ | ||
136 | |||
137 | /* OFFSETS for Function 0 */ | ||
138 | |||
139 | /* | ||
140 | * Note: Other Intel EDAC drivers use AMBPRESENT to identify if the available | ||
141 | * memory. From datasheet item 7.3.1 (FB-DIMM technology & organization), it | ||
142 | * seems that we cannot use this information directly for the same usage. | ||
143 | * Each memory slot may have up to 2 AMB interfaces, one for income and another | ||
144 | * for outcome interface to the next slot. | ||
145 | * For now, the driver just stores the AMB present registers, but rely only at | ||
146 | * the MTR info to detect memory. | ||
147 | * Datasheet is also not clear about how to map each AMBPRESENT registers to | ||
148 | * one of the 4 available channels. | ||
149 | */ | ||
150 | #define AMBPRESENT_0 0x64 | ||
151 | #define AMBPRESENT_1 0x66 | ||
152 | |||
153 | const static u16 mtr_regs [MAX_SLOTS] = { | ||
154 | 0x80, 0x84, 0x88, 0x8c, | ||
155 | 0x82, 0x86, 0x8a, 0x8e | ||
156 | }; | ||
157 | |||
158 | /* Defines to extract the vaious fields from the | ||
159 | * MTRx - Memory Technology Registers | ||
160 | */ | ||
161 | #define MTR_DIMMS_PRESENT(mtr) ((mtr) & (1 << 8)) | ||
162 | #define MTR_DIMMS_ETHROTTLE(mtr) ((mtr) & (1 << 7)) | ||
163 | #define MTR_DRAM_WIDTH(mtr) (((mtr) & (1 << 6)) ? 8 : 4) | ||
164 | #define MTR_DRAM_BANKS(mtr) (((mtr) & (1 << 5)) ? 8 : 4) | ||
165 | #define MTR_DIMM_RANKS(mtr) (((mtr) & (1 << 4)) ? 1 : 0) | ||
166 | #define MTR_DIMM_ROWS(mtr) (((mtr) >> 2) & 0x3) | ||
167 | #define MTR_DRAM_BANKS_ADDR_BITS 2 | ||
168 | #define MTR_DIMM_ROWS_ADDR_BITS(mtr) (MTR_DIMM_ROWS(mtr) + 13) | ||
169 | #define MTR_DIMM_COLS(mtr) ((mtr) & 0x3) | ||
170 | #define MTR_DIMM_COLS_ADDR_BITS(mtr) (MTR_DIMM_COLS(mtr) + 10) | ||
171 | |||
172 | #if 0 | ||
173 | /* OFFSETS for Function 1 */ | ||
174 | |||
175 | /* TODO */ | ||
176 | #define NRECFGLOG 0x74 | ||
177 | #define RECFGLOG 0x78 | ||
178 | #define NRECMEMA 0xbe | ||
179 | #define NRECMEMB 0xc0 | ||
180 | #define NRECFB_DIMMA 0xc4 | ||
181 | #define NRECFB_DIMMB 0xc8 | ||
182 | #define NRECFB_DIMMC 0xcc | ||
183 | #define NRECFB_DIMMD 0xd0 | ||
184 | #define NRECFB_DIMME 0xd4 | ||
185 | #define NRECFB_DIMMF 0xd8 | ||
186 | #define REDMEMA 0xdC | ||
187 | #define RECMEMA 0xf0 | ||
188 | #define RECMEMB 0xf4 | ||
189 | #define RECFB_DIMMA 0xf8 | ||
190 | #define RECFB_DIMMB 0xec | ||
191 | #define RECFB_DIMMC 0xf0 | ||
192 | #define RECFB_DIMMD 0xf4 | ||
193 | #define RECFB_DIMME 0xf8 | ||
194 | #define RECFB_DIMMF 0xfC | ||
195 | |||
196 | /* This applies to FERR_NF_FB-DIMM as well as FERR_FAT_FB-DIMM */ | ||
197 | static inline int extract_fbdchan_indx(u32 x) | ||
198 | { | ||
199 | return (x>>28) & 0x3; | ||
200 | } | ||
201 | #endif | ||
202 | |||
203 | #ifdef CONFIG_EDAC_DEBUG | ||
204 | /* MTR NUMROW */ | ||
205 | static const char *numrow_toString[] = { | ||
206 | "8,192 - 13 rows", | ||
207 | "16,384 - 14 rows", | ||
208 | "32,768 - 15 rows", | ||
209 | "65,536 - 16 rows" | ||
210 | }; | ||
211 | |||
212 | /* MTR NUMCOL */ | ||
213 | static const char *numcol_toString[] = { | ||
214 | "1,024 - 10 columns", | ||
215 | "2,048 - 11 columns", | ||
216 | "4,096 - 12 columns", | ||
217 | "reserved" | ||
218 | }; | ||
219 | #endif | ||
220 | |||
221 | #if 0 | ||
222 | |||
223 | /* | ||
224 | * Error indicator bits and masks | ||
225 | * Error masks are according with Table 5-17 of i7300 datasheet | ||
226 | */ | ||
227 | |||
228 | enum error_mask { | ||
229 | EMASK_M1 = 1<<0, /* Memory Write error on non-redundant retry */ | ||
230 | EMASK_M2 = 1<<1, /* Memory or FB-DIMM configuration CRC read error */ | ||
231 | EMASK_M3 = 1<<2, /* Reserved */ | ||
232 | EMASK_M4 = 1<<3, /* Uncorrectable Data ECC on Replay */ | ||
233 | EMASK_M5 = 1<<4, /* Aliased Uncorrectable Non-Mirrored Demand Data ECC */ | ||
234 | EMASK_M6 = 1<<5, /* Unsupported on i7300 */ | ||
235 | EMASK_M7 = 1<<6, /* Aliased Uncorrectable Resilver- or Spare-Copy Data ECC */ | ||
236 | EMASK_M8 = 1<<7, /* Aliased Uncorrectable Patrol Data ECC */ | ||
237 | EMASK_M9 = 1<<8, /* Non-Aliased Uncorrectable Non-Mirrored Demand Data ECC */ | ||
238 | EMASK_M10 = 1<<9, /* Unsupported on i7300 */ | ||
239 | EMASK_M11 = 1<<10, /* Non-Aliased Uncorrectable Resilver- or Spare-Copy Data ECC */ | ||
240 | EMASK_M12 = 1<<11, /* Non-Aliased Uncorrectable Patrol Data ECC */ | ||
241 | EMASK_M13 = 1<<12, /* Memory Write error on first attempt */ | ||
242 | EMASK_M14 = 1<<13, /* FB-DIMM Configuration Write error on first attempt */ | ||
243 | EMASK_M15 = 1<<14, /* Memory or FB-DIMM configuration CRC read error */ | ||
244 | EMASK_M16 = 1<<15, /* Channel Failed-Over Occurred */ | ||
245 | EMASK_M17 = 1<<16, /* Correctable Non-Mirrored Demand Data ECC */ | ||
246 | EMASK_M18 = 1<<17, /* Unsupported on i7300 */ | ||
247 | EMASK_M19 = 1<<18, /* Correctable Resilver- or Spare-Copy Data ECC */ | ||
248 | EMASK_M20 = 1<<19, /* Correctable Patrol Data ECC */ | ||
249 | EMASK_M21 = 1<<20, /* FB-DIMM Northbound parity error on FB-DIMM Sync Status */ | ||
250 | EMASK_M22 = 1<<21, /* SPD protocol Error */ | ||
251 | EMASK_M23 = 1<<22, /* Non-Redundant Fast Reset Timeout */ | ||
252 | EMASK_M24 = 1<<23, /* Refresh error */ | ||
253 | EMASK_M25 = 1<<24, /* Memory Write error on redundant retry */ | ||
254 | EMASK_M26 = 1<<25, /* Redundant Fast Reset Timeout */ | ||
255 | EMASK_M27 = 1<<26, /* Correctable Counter Threshold Exceeded */ | ||
256 | EMASK_M28 = 1<<27, /* DIMM-Spare Copy Completed */ | ||
257 | EMASK_M29 = 1<<28, /* DIMM-Isolation Completed */ | ||
258 | }; | ||
259 | |||
260 | /* | ||
261 | * Names to translate bit error into something useful | ||
262 | */ | ||
263 | static const char *error_name[] = { | ||
264 | [0] = "Memory Write error on non-redundant retry", | ||
265 | [1] = "Memory or FB-DIMM configuration CRC read error", | ||
266 | /* Reserved */ | ||
267 | [3] = "Uncorrectable Data ECC on Replay", | ||
268 | [4] = "Aliased Uncorrectable Non-Mirrored Demand Data ECC", | ||
269 | /* M6 Unsupported on i7300 */ | ||
270 | [6] = "Aliased Uncorrectable Resilver- or Spare-Copy Data ECC", | ||
271 | [7] = "Aliased Uncorrectable Patrol Data ECC", | ||
272 | [8] = "Non-Aliased Uncorrectable Non-Mirrored Demand Data ECC", | ||
273 | /* M10 Unsupported on i7300 */ | ||
274 | [10] = "Non-Aliased Uncorrectable Resilver- or Spare-Copy Data ECC", | ||
275 | [11] = "Non-Aliased Uncorrectable Patrol Data ECC", | ||
276 | [12] = "Memory Write error on first attempt", | ||
277 | [13] = "FB-DIMM Configuration Write error on first attempt", | ||
278 | [14] = "Memory or FB-DIMM configuration CRC read error", | ||
279 | [15] = "Channel Failed-Over Occurred", | ||
280 | [16] = "Correctable Non-Mirrored Demand Data ECC", | ||
281 | /* M18 Unsupported on i7300 */ | ||
282 | [18] = "Correctable Resilver- or Spare-Copy Data ECC", | ||
283 | [19] = "Correctable Patrol Data ECC", | ||
284 | [20] = "FB-DIMM Northbound parity error on FB-DIMM Sync Status", | ||
285 | [21] = "SPD protocol Error", | ||
286 | [22] = "Non-Redundant Fast Reset Timeout", | ||
287 | [23] = "Refresh error", | ||
288 | [24] = "Memory Write error on redundant retry", | ||
289 | [25] = "Redundant Fast Reset Timeout", | ||
290 | [26] = "Correctable Counter Threshold Exceeded", | ||
291 | [27] = "DIMM-Spare Copy Completed", | ||
292 | [28] = "DIMM-Isolation Completed", | ||
293 | }; | ||
294 | |||
295 | /* Fatal errors */ | ||
296 | #define ERROR_FAT_MASK (EMASK_M1 | \ | ||
297 | EMASK_M2 | \ | ||
298 | EMASK_M23) | ||
299 | |||
300 | /* Correctable errors */ | ||
301 | #define ERROR_NF_CORRECTABLE (EMASK_M27 | \ | ||
302 | EMASK_M20 | \ | ||
303 | EMASK_M19 | \ | ||
304 | EMASK_M18 | \ | ||
305 | EMASK_M17 | \ | ||
306 | EMASK_M16) | ||
307 | #define ERROR_NF_DIMM_SPARE (EMASK_M29 | \ | ||
308 | EMASK_M28) | ||
309 | #define ERROR_NF_SPD_PROTOCOL (EMASK_M22) | ||
310 | #define ERROR_NF_NORTH_CRC (EMASK_M21) | ||
311 | |||
312 | /* Recoverable errors */ | ||
313 | #define ERROR_NF_RECOVERABLE (EMASK_M26 | \ | ||
314 | EMASK_M25 | \ | ||
315 | EMASK_M24 | \ | ||
316 | EMASK_M15 | \ | ||
317 | EMASK_M14 | \ | ||
318 | EMASK_M13 | \ | ||
319 | EMASK_M12 | \ | ||
320 | EMASK_M11 | \ | ||
321 | EMASK_M9 | \ | ||
322 | EMASK_M8 | \ | ||
323 | EMASK_M7 | \ | ||
324 | EMASK_M5) | ||
325 | |||
326 | /* uncorrectable errors */ | ||
327 | #define ERROR_NF_UNCORRECTABLE (EMASK_M4) | ||
328 | |||
329 | /* mask to all non-fatal errors */ | ||
330 | #define ERROR_NF_MASK (ERROR_NF_CORRECTABLE | \ | ||
331 | ERROR_NF_UNCORRECTABLE | \ | ||
332 | ERROR_NF_RECOVERABLE | \ | ||
333 | ERROR_NF_DIMM_SPARE | \ | ||
334 | ERROR_NF_SPD_PROTOCOL | \ | ||
335 | ERROR_NF_NORTH_CRC) | ||
336 | |||
337 | /* | ||
338 | * Define error masks for the several registers | ||
339 | */ | ||
340 | |||
341 | /* Enable all fatal and non fatal errors */ | ||
342 | #define ENABLE_EMASK_ALL (ERROR_FAT_MASK | ERROR_NF_MASK) | ||
343 | |||
344 | /* mask for fatal error registers */ | ||
345 | #define FERR_FAT_MASK ERROR_FAT_MASK | ||
346 | |||
347 | /* masks for non-fatal error register */ | ||
348 | static inline int to_nf_mask(unsigned int mask) | ||
349 | { | ||
350 | return (mask & EMASK_M29) | (mask >> 3); | ||
351 | }; | ||
352 | |||
353 | static inline int from_nf_ferr(unsigned int mask) | ||
354 | { | ||
355 | return (mask & EMASK_M29) | /* Bit 28 */ | ||
356 | (mask & ((1 << 28) - 1) << 3); /* Bits 0 to 27 */ | ||
357 | }; | ||
358 | |||
359 | #define FERR_NF_MASK to_nf_mask(ERROR_NF_MASK) | ||
360 | #define FERR_NF_CORRECTABLE to_nf_mask(ERROR_NF_CORRECTABLE) | ||
361 | #define FERR_NF_DIMM_SPARE to_nf_mask(ERROR_NF_DIMM_SPARE) | ||
362 | #define FERR_NF_SPD_PROTOCOL to_nf_mask(ERROR_NF_SPD_PROTOCOL) | ||
363 | #define FERR_NF_NORTH_CRC to_nf_mask(ERROR_NF_NORTH_CRC) | ||
364 | #define FERR_NF_RECOVERABLE to_nf_mask(ERROR_NF_RECOVERABLE) | ||
365 | #define FERR_NF_UNCORRECTABLE to_nf_mask(ERROR_NF_UNCORRECTABLE) | ||
366 | |||
367 | #endif | ||
368 | |||
369 | /* Device name and register DID (Device ID) */ | ||
370 | struct i7300_dev_info { | ||
371 | const char *ctl_name; /* name for this device */ | ||
372 | u16 fsb_mapping_errors; /* DID for the branchmap,control */ | ||
373 | }; | ||
374 | |||
375 | /* Table of devices attributes supported by this driver */ | ||
376 | static const struct i7300_dev_info i7300_devs[] = { | ||
377 | { | ||
378 | .ctl_name = "I7300", | ||
379 | .fsb_mapping_errors = PCI_DEVICE_ID_INTEL_I7300_MCH_ERR, | ||
380 | }, | ||
381 | }; | ||
382 | |||
383 | struct i7300_dimm_info { | ||
384 | int megabytes; /* size, 0 means not present */ | ||
385 | }; | ||
386 | |||
387 | /* driver private data structure */ | ||
388 | struct i7300_pvt { | ||
389 | struct pci_dev *system_address; /* 16.0 */ | ||
390 | struct pci_dev *branchmap_werrors; /* 16.1 */ | ||
391 | struct pci_dev *fsb_error_regs; /* 16.2 */ | ||
392 | struct pci_dev *branch_pci[MAX_BRANCHES]; /* 21.0 and 22.0 */ | ||
393 | |||
394 | u16 tolm; /* top of low memory */ | ||
395 | u64 ambase; /* AMB BAR */ | ||
396 | |||
397 | u16 mir[MAX_MIR]; | ||
398 | |||
399 | u16 mtr[MAX_SLOTS][MAX_BRANCHES]; /* Memory Technlogy Reg */ | ||
400 | u16 ambpresent[MAX_CHANNELS]; /* AMB present regs */ | ||
401 | |||
402 | /* DIMM information matrix, allocating architecture maximums */ | ||
403 | struct i7300_dimm_info dimm_info[MAX_SLOTS][MAX_CHANNELS]; | ||
404 | }; | ||
405 | |||
406 | #if 0 | ||
407 | /* I7300 MCH error information retrieved from Hardware */ | ||
408 | struct i7300_error_info { | ||
409 | /* These registers are always read from the MC */ | ||
410 | u32 ferr_fat_fbd; /* First Errors Fatal */ | ||
411 | u32 nerr_fat_fbd; /* Next Errors Fatal */ | ||
412 | u32 ferr_nf_fbd; /* First Errors Non-Fatal */ | ||
413 | u32 nerr_nf_fbd; /* Next Errors Non-Fatal */ | ||
414 | |||
415 | /* These registers are input ONLY if there was a Recoverable Error */ | ||
416 | u32 redmemb; /* Recoverable Mem Data Error log B */ | ||
417 | u16 recmema; /* Recoverable Mem Error log A */ | ||
418 | u32 recmemb; /* Recoverable Mem Error log B */ | ||
419 | |||
420 | /* These registers are input ONLY if there was a Non-Rec Error */ | ||
421 | u16 nrecmema; /* Non-Recoverable Mem log A */ | ||
422 | u16 nrecmemb; /* Non-Recoverable Mem log B */ | ||
423 | |||
424 | }; | ||
425 | #endif | ||
426 | |||
427 | /* FIXME: Why do we need to have this static? */ | ||
428 | static struct edac_pci_ctl_info *i7300_pci; | ||
429 | |||
430 | |||
431 | #if 0 | ||
432 | /* note that nrec_rdwr changed from NRECMEMA to NRECMEMB between the 5000 and | ||
433 | 5400 better to use an inline function than a macro in this case */ | ||
434 | static inline int nrec_bank(struct i7300_error_info *info) | ||
435 | { | ||
436 | return ((info->nrecmema) >> 12) & 0x7; | ||
437 | } | ||
438 | static inline int nrec_rank(struct i7300_error_info *info) | ||
439 | { | ||
440 | return ((info->nrecmema) >> 8) & 0xf; | ||
441 | } | ||
442 | static inline int nrec_buf_id(struct i7300_error_info *info) | ||
443 | { | ||
444 | return ((info->nrecmema)) & 0xff; | ||
445 | } | ||
446 | static inline int nrec_rdwr(struct i7300_error_info *info) | ||
447 | { | ||
448 | return (info->nrecmemb) >> 31; | ||
449 | } | ||
450 | /* This applies to both NREC and REC string so it can be used with nrec_rdwr | ||
451 | and rec_rdwr */ | ||
452 | static inline const char *rdwr_str(int rdwr) | ||
453 | { | ||
454 | return rdwr ? "Write" : "Read"; | ||
455 | } | ||
456 | static inline int nrec_cas(struct i7300_error_info *info) | ||
457 | { | ||
458 | return ((info->nrecmemb) >> 16) & 0x1fff; | ||
459 | } | ||
460 | static inline int nrec_ras(struct i7300_error_info *info) | ||
461 | { | ||
462 | return (info->nrecmemb) & 0xffff; | ||
463 | } | ||
464 | static inline int rec_bank(struct i7300_error_info *info) | ||
465 | { | ||
466 | return ((info->recmema) >> 12) & 0x7; | ||
467 | } | ||
468 | static inline int rec_rank(struct i7300_error_info *info) | ||
469 | { | ||
470 | return ((info->recmema) >> 8) & 0xf; | ||
471 | } | ||
472 | static inline int rec_rdwr(struct i7300_error_info *info) | ||
473 | { | ||
474 | return (info->recmemb) >> 31; | ||
475 | } | ||
476 | static inline int rec_cas(struct i7300_error_info *info) | ||
477 | { | ||
478 | return ((info->recmemb) >> 16) & 0x1fff; | ||
479 | } | ||
480 | static inline int rec_ras(struct i7300_error_info *info) | ||
481 | { | ||
482 | return (info->recmemb) & 0xffff; | ||
483 | } | ||
484 | |||
485 | /* | ||
486 | * i7300_get_error_info Retrieve the hardware error information from | ||
487 | * the hardware and cache it in the 'info' | ||
488 | * structure | ||
489 | */ | ||
490 | static void i7300_get_error_info(struct mem_ctl_info *mci, | ||
491 | struct i7300_error_info *info) | ||
492 | { | ||
493 | struct i7300_pvt *pvt; | ||
494 | u32 value; | ||
495 | |||
496 | pvt = mci->pvt_info; | ||
497 | |||
498 | /* read in the 1st FATAL error register */ | ||
499 | pci_read_config_dword(pvt->branchmap_werrors, FERR_FAT_FBD, &value); | ||
500 | |||
501 | /* Mask only the bits that the doc says are valid | ||
502 | */ | ||
503 | value &= (FERR_FAT_FBDCHAN | FERR_FAT_MASK); | ||
504 | |||
505 | /* If there is an error, then read in the | ||
506 | NEXT FATAL error register and the Memory Error Log Register A | ||
507 | */ | ||
508 | if (value & FERR_FAT_MASK) { | ||
509 | info->ferr_fat_fbd = value; | ||
510 | |||
511 | /* harvest the various error data we need */ | ||
512 | pci_read_config_dword(pvt->branchmap_werrors, | ||
513 | NERR_FAT_FBD, &info->nerr_fat_fbd); | ||
514 | pci_read_config_word(pvt->branchmap_werrors, | ||
515 | NRECMEMA, &info->nrecmema); | ||
516 | pci_read_config_word(pvt->branchmap_werrors, | ||
517 | NRECMEMB, &info->nrecmemb); | ||
518 | |||
519 | /* Clear the error bits, by writing them back */ | ||
520 | pci_write_config_dword(pvt->branchmap_werrors, | ||
521 | FERR_FAT_FBD, value); | ||
522 | } else { | ||
523 | info->ferr_fat_fbd = 0; | ||
524 | info->nerr_fat_fbd = 0; | ||
525 | info->nrecmema = 0; | ||
526 | info->nrecmemb = 0; | ||
527 | } | ||
528 | |||
529 | /* read in the 1st NON-FATAL error register */ | ||
530 | pci_read_config_dword(pvt->branchmap_werrors, FERR_NF_FBD, &value); | ||
531 | |||
532 | /* If there is an error, then read in the 1st NON-FATAL error | ||
533 | * register as well */ | ||
534 | if (value & FERR_NF_MASK) { | ||
535 | info->ferr_nf_fbd = value; | ||
536 | |||
537 | /* harvest the various error data we need */ | ||
538 | pci_read_config_dword(pvt->branchmap_werrors, | ||
539 | NERR_NF_FBD, &info->nerr_nf_fbd); | ||
540 | pci_read_config_word(pvt->branchmap_werrors, | ||
541 | RECMEMA, &info->recmema); | ||
542 | pci_read_config_dword(pvt->branchmap_werrors, | ||
543 | RECMEMB, &info->recmemb); | ||
544 | pci_read_config_dword(pvt->branchmap_werrors, | ||
545 | REDMEMB, &info->redmemb); | ||
546 | |||
547 | /* Clear the error bits, by writing them back */ | ||
548 | pci_write_config_dword(pvt->branchmap_werrors, | ||
549 | FERR_NF_FBD, value); | ||
550 | } else { | ||
551 | info->ferr_nf_fbd = 0; | ||
552 | info->nerr_nf_fbd = 0; | ||
553 | info->recmema = 0; | ||
554 | info->recmemb = 0; | ||
555 | info->redmemb = 0; | ||
556 | } | ||
557 | } | ||
558 | |||
559 | /* | ||
560 | * i7300_proccess_non_recoverable_info(struct mem_ctl_info *mci, | ||
561 | * struct i7300_error_info *info, | ||
562 | * int handle_errors); | ||
563 | * | ||
564 | * handle the Intel FATAL and unrecoverable errors, if any | ||
565 | */ | ||
566 | static void i7300_proccess_non_recoverable_info(struct mem_ctl_info *mci, | ||
567 | struct i7300_error_info *info, | ||
568 | unsigned long allErrors) | ||
569 | { | ||
570 | char msg[EDAC_MC_LABEL_LEN + 1 + 90 + 80]; | ||
571 | int branch; | ||
572 | int channel; | ||
573 | int bank; | ||
574 | int buf_id; | ||
575 | int rank; | ||
576 | int rdwr; | ||
577 | int ras, cas; | ||
578 | int errnum; | ||
579 | char *type = NULL; | ||
580 | |||
581 | if (!allErrors) | ||
582 | return; /* if no error, return now */ | ||
583 | |||
584 | if (allErrors & ERROR_FAT_MASK) | ||
585 | type = "FATAL"; | ||
586 | else if (allErrors & FERR_NF_UNCORRECTABLE) | ||
587 | type = "NON-FATAL uncorrected"; | ||
588 | else | ||
589 | type = "NON-FATAL recoverable"; | ||
590 | |||
591 | /* ONLY ONE of the possible error bits will be set, as per the docs */ | ||
592 | |||
593 | branch = extract_fbdchan_indx(info->ferr_fat_fbd); | ||
594 | channel = branch; | ||
595 | |||
596 | /* Use the NON-Recoverable macros to extract data */ | ||
597 | bank = nrec_bank(info); | ||
598 | rank = nrec_rank(info); | ||
599 | buf_id = nrec_buf_id(info); | ||
600 | rdwr = nrec_rdwr(info); | ||
601 | ras = nrec_ras(info); | ||
602 | cas = nrec_cas(info); | ||
603 | |||
604 | debugf0("\t\tCSROW= %d Channels= %d,%d (Branch= %d " | ||
605 | "DRAM Bank= %d Buffer ID = %d rdwr= %s ras= %d cas= %d)\n", | ||
606 | rank, channel, channel + 1, branch >> 1, bank, | ||
607 | buf_id, rdwr_str(rdwr), ras, cas); | ||
608 | |||
609 | /* Only 1 bit will be on */ | ||
610 | errnum = find_first_bit(&allErrors, ARRAY_SIZE(error_name)); | ||
611 | |||
612 | /* Form out message */ | ||
613 | snprintf(msg, sizeof(msg), | ||
614 | "%s (Branch=%d DRAM-Bank=%d Buffer ID = %d RDWR=%s " | ||
615 | "RAS=%d CAS=%d %s Err=0x%lx (%s))", | ||
616 | type, branch >> 1, bank, buf_id, rdwr_str(rdwr), ras, cas, | ||
617 | type, allErrors, error_name[errnum]); | ||
618 | |||
619 | /* Call the helper to output message */ | ||
620 | edac_mc_handle_fbd_ue(mci, rank, channel, channel + 1, msg); | ||
621 | } | ||
622 | |||
623 | /* | ||
624 | * i7300_process_fatal_error_info(struct mem_ctl_info *mci, | ||
625 | * struct i7300_error_info *info, | ||
626 | * int handle_errors); | ||
627 | * | ||
628 | * handle the Intel NON-FATAL errors, if any | ||
629 | */ | ||
630 | static void i7300_process_nonfatal_error_info(struct mem_ctl_info *mci, | ||
631 | struct i7300_error_info *info) | ||
632 | { | ||
633 | char msg[EDAC_MC_LABEL_LEN + 1 + 90 + 80]; | ||
634 | unsigned long allErrors; | ||
635 | int branch; | ||
636 | int channel; | ||
637 | int bank; | ||
638 | int rank; | ||
639 | int rdwr; | ||
640 | int ras, cas; | ||
641 | int errnum; | ||
642 | |||
643 | /* mask off the Error bits that are possible */ | ||
644 | allErrors = from_nf_ferr(info->ferr_nf_fbd & FERR_NF_MASK); | ||
645 | if (!allErrors) | ||
646 | return; /* if no error, return now */ | ||
647 | |||
648 | /* ONLY ONE of the possible error bits will be set, as per the docs */ | ||
649 | |||
650 | if (allErrors & (ERROR_NF_UNCORRECTABLE | ERROR_NF_RECOVERABLE)) { | ||
651 | i7300_proccess_non_recoverable_info(mci, info, allErrors); | ||
652 | return; | ||
653 | } | ||
654 | |||
655 | /* Correctable errors */ | ||
656 | if (allErrors & ERROR_NF_CORRECTABLE) { | ||
657 | debugf0("\tCorrected bits= 0x%lx\n", allErrors); | ||
658 | |||
659 | branch = extract_fbdchan_indx(info->ferr_nf_fbd); | ||
660 | |||
661 | channel = 0; | ||
662 | if (REC_ECC_LOCATOR_ODD(info->redmemb)) | ||
663 | channel = 1; | ||
664 | |||
665 | /* Convert channel to be based from zero, instead of | ||
666 | * from branch base of 0 */ | ||
667 | channel += branch; | ||
668 | |||
669 | bank = rec_bank(info); | ||
670 | rank = rec_rank(info); | ||
671 | rdwr = rec_rdwr(info); | ||
672 | ras = rec_ras(info); | ||
673 | cas = rec_cas(info); | ||
674 | |||
675 | /* Only 1 bit will be on */ | ||
676 | errnum = find_first_bit(&allErrors, ARRAY_SIZE(error_name)); | ||
677 | |||
678 | debugf0("\t\tCSROW= %d Channel= %d (Branch %d " | ||
679 | "DRAM Bank= %d rdwr= %s ras= %d cas= %d)\n", | ||
680 | rank, channel, branch >> 1, bank, | ||
681 | rdwr_str(rdwr), ras, cas); | ||
682 | |||
683 | /* Form out message */ | ||
684 | snprintf(msg, sizeof(msg), | ||
685 | "Corrected error (Branch=%d DRAM-Bank=%d RDWR=%s " | ||
686 | "RAS=%d CAS=%d, CE Err=0x%lx (%s))", | ||
687 | branch >> 1, bank, rdwr_str(rdwr), ras, cas, | ||
688 | allErrors, error_name[errnum]); | ||
689 | |||
690 | /* Call the helper to output message */ | ||
691 | edac_mc_handle_fbd_ce(mci, rank, channel, msg); | ||
692 | |||
693 | return; | ||
694 | } | ||
695 | |||
696 | /* Miscelaneous errors */ | ||
697 | errnum = find_first_bit(&allErrors, ARRAY_SIZE(error_name)); | ||
698 | |||
699 | branch = extract_fbdchan_indx(info->ferr_nf_fbd); | ||
700 | |||
701 | i7300_mc_printk(mci, KERN_EMERG, | ||
702 | "Non-Fatal misc error (Branch=%d Err=%#lx (%s))", | ||
703 | branch >> 1, allErrors, error_name[errnum]); | ||
704 | } | ||
705 | |||
706 | /* | ||
707 | * i7300_process_error_info Process the error info that is | ||
708 | * in the 'info' structure, previously retrieved from hardware | ||
709 | */ | ||
710 | static void i7300_process_error_info(struct mem_ctl_info *mci, | ||
711 | struct i7300_error_info *info) | ||
712 | { u32 allErrors; | ||
713 | |||
714 | /* First handle any fatal errors that occurred */ | ||
715 | allErrors = (info->ferr_fat_fbd & FERR_FAT_MASK); | ||
716 | i7300_proccess_non_recoverable_info(mci, info, allErrors); | ||
717 | |||
718 | /* now handle any non-fatal errors that occurred */ | ||
719 | i7300_process_nonfatal_error_info(mci, info); | ||
720 | } | ||
721 | |||
722 | /* | ||
723 | * i7300_clear_error Retrieve any error from the hardware | ||
724 | * but do NOT process that error. | ||
725 | * Used for 'clearing' out of previous errors | ||
726 | * Called by the Core module. | ||
727 | */ | ||
728 | static void i7300_clear_error(struct mem_ctl_info *mci) | ||
729 | { | ||
730 | struct i7300_error_info info; | ||
731 | |||
732 | i7300_get_error_info(mci, &info); | ||
733 | } | ||
734 | |||
735 | /* | ||
736 | * i7300_check_error Retrieve and process errors reported by the | ||
737 | * hardware. Called by the Core module. | ||
738 | */ | ||
739 | static void i7300_check_error(struct mem_ctl_info *mci) | ||
740 | { | ||
741 | struct i7300_error_info info; | ||
742 | debugf4("MC%d: " __FILE__ ": %s()\n", mci->mc_idx, __func__); | ||
743 | i7300_get_error_info(mci, &info); | ||
744 | i7300_process_error_info(mci, &info); | ||
745 | } | ||
746 | |||
747 | /* | ||
748 | * i7300_enable_error_reporting | ||
749 | * Turn on the memory reporting features of the hardware | ||
750 | */ | ||
751 | static void i7300_enable_error_reporting(struct mem_ctl_info *mci) | ||
752 | { | ||
753 | struct i7300_pvt *pvt; | ||
754 | u32 fbd_error_mask; | ||
755 | |||
756 | pvt = mci->pvt_info; | ||
757 | |||
758 | /* Read the FBD Error Mask Register */ | ||
759 | pci_read_config_dword(pvt->branchmap_werrors, EMASK_FBD, | ||
760 | &fbd_error_mask); | ||
761 | |||
762 | /* Enable with a '0' */ | ||
763 | fbd_error_mask &= ~(ENABLE_EMASK_ALL); | ||
764 | |||
765 | pci_write_config_dword(pvt->branchmap_werrors, EMASK_FBD, | ||
766 | fbd_error_mask); | ||
767 | } | ||
768 | #endif | ||
769 | |||
770 | /* | ||
771 | * determine_mtr(pvt, csrow, channel) | ||
772 | * | ||
773 | * return the proper MTR register as determine by the csrow and desired channel | ||
774 | */ | ||
775 | static int decode_mtr(struct i7300_pvt *pvt, | ||
776 | int slot, int ch, int branch, | ||
777 | struct i7300_dimm_info *dinfo, | ||
778 | struct csrow_info *p_csrow) | ||
779 | { | ||
780 | int mtr, ans, addrBits, channel; | ||
781 | |||
782 | channel = to_channel(ch, branch); | ||
783 | |||
784 | mtr = pvt->mtr[slot][branch]; | ||
785 | ans = MTR_DIMMS_PRESENT(mtr) ? 1 : 0; | ||
786 | |||
787 | debugf2("\tMTR%d CH%d: DIMMs are %s (mtr)\n", | ||
788 | slot, channel, | ||
789 | ans ? "Present" : "NOT Present"); | ||
790 | |||
791 | /* Determine if there is a DIMM present in this DIMM slot */ | ||
792 | |||
793 | #if 0 | ||
794 | if (!amb_present || !ans) | ||
795 | return 0; | ||
796 | #else | ||
797 | if (!ans) | ||
798 | return 0; | ||
799 | #endif | ||
800 | |||
801 | /* Start with the number of bits for a Bank | ||
802 | * on the DRAM */ | ||
803 | addrBits = MTR_DRAM_BANKS_ADDR_BITS; | ||
804 | /* Add thenumber of ROW bits */ | ||
805 | addrBits += MTR_DIMM_ROWS_ADDR_BITS(mtr); | ||
806 | /* add the number of COLUMN bits */ | ||
807 | addrBits += MTR_DIMM_COLS_ADDR_BITS(mtr); | ||
808 | /* add the number of RANK bits */ | ||
809 | addrBits += MTR_DIMM_RANKS(mtr); | ||
810 | |||
811 | addrBits += 6; /* add 64 bits per DIMM */ | ||
812 | addrBits -= 20; /* divide by 2^^20 */ | ||
813 | addrBits -= 3; /* 8 bits per bytes */ | ||
814 | |||
815 | dinfo->megabytes = 1 << addrBits; | ||
816 | |||
817 | debugf2("\t\tWIDTH: x%d\n", MTR_DRAM_WIDTH(mtr)); | ||
818 | |||
819 | debugf2("\t\tELECTRICAL THROTTLING is %s\n", | ||
820 | MTR_DIMMS_ETHROTTLE(mtr) ? "enabled" : "disabled"); | ||
821 | |||
822 | debugf2("\t\tNUMBANK: %d bank(s)\n", MTR_DRAM_BANKS(mtr)); | ||
823 | debugf2("\t\tNUMRANK: %s\n", MTR_DIMM_RANKS(mtr) ? "double" : "single"); | ||
824 | debugf2("\t\tNUMROW: %s\n", numrow_toString[MTR_DIMM_ROWS(mtr)]); | ||
825 | debugf2("\t\tNUMCOL: %s\n", numcol_toString[MTR_DIMM_COLS(mtr)]); | ||
826 | debugf2("\t\tSIZE: %d MB\n", dinfo->megabytes); | ||
827 | |||
828 | p_csrow->grain = 8; | ||
829 | p_csrow->nr_pages = dinfo->megabytes << 8; | ||
830 | p_csrow->mtype = MEM_FB_DDR2; | ||
831 | p_csrow->edac_mode = EDAC_S8ECD8ED; | ||
832 | |||
833 | /* ask what device type on this row */ | ||
834 | if (MTR_DRAM_WIDTH(mtr)) | ||
835 | p_csrow->dtype = DEV_X8; | ||
836 | else | ||
837 | p_csrow->dtype = DEV_X4; | ||
838 | |||
839 | return mtr; | ||
840 | } | ||
841 | |||
842 | /* | ||
843 | * print_dimm_size | ||
844 | * | ||
845 | * also will output a DIMM matrix map, if debug is enabled, for viewing | ||
846 | * how the DIMMs are populated | ||
847 | */ | ||
848 | static void print_dimm_size(struct i7300_pvt *pvt) | ||
849 | { | ||
850 | struct i7300_dimm_info *dinfo; | ||
851 | char *p, *mem_buffer; | ||
852 | int space, n; | ||
853 | int channel, slot; | ||
854 | |||
855 | space = PAGE_SIZE; | ||
856 | mem_buffer = p = kmalloc(space, GFP_KERNEL); | ||
857 | if (p == NULL) { | ||
858 | i7300_printk(KERN_ERR, "MC: %s:%s() kmalloc() failed\n", | ||
859 | __FILE__, __func__); | ||
860 | return; | ||
861 | } | ||
862 | |||
863 | n = snprintf(p, space, " "); | ||
864 | p += n; | ||
865 | space -= n; | ||
866 | for (channel = 0; channel < MAX_CHANNELS; channel++) { | ||
867 | n = snprintf(p, space, "channel %d | ", channel); | ||
868 | p += n; | ||
869 | space -= n; | ||
870 | } | ||
871 | debugf2("%s\n", mem_buffer); | ||
872 | p = mem_buffer; | ||
873 | space = PAGE_SIZE; | ||
874 | n = snprintf(p, space, "-------------------------------" | ||
875 | "------------------------------"); | ||
876 | p += n; | ||
877 | space -= n; | ||
878 | debugf2("%s\n", mem_buffer); | ||
879 | p = mem_buffer; | ||
880 | space = PAGE_SIZE; | ||
881 | |||
882 | for (slot = 0; slot < MAX_SLOTS; slot++) { | ||
883 | n = snprintf(p, space, "csrow/SLOT %d ", slot); | ||
884 | p += n; | ||
885 | space -= n; | ||
886 | |||
887 | for (channel = 0; channel < MAX_CHANNELS; channel++) { | ||
888 | dinfo = &pvt->dimm_info[slot][channel]; | ||
889 | n = snprintf(p, space, "%4d MB | ", dinfo->megabytes); | ||
890 | p += n; | ||
891 | space -= n; | ||
892 | } | ||
893 | |||
894 | debugf2("%s\n", mem_buffer); | ||
895 | p = mem_buffer; | ||
896 | space = PAGE_SIZE; | ||
897 | } | ||
898 | |||
899 | n = snprintf(p, space, "-------------------------------" | ||
900 | "------------------------------"); | ||
901 | p += n; | ||
902 | space -= n; | ||
903 | debugf2("%s\n", mem_buffer); | ||
904 | p = mem_buffer; | ||
905 | space = PAGE_SIZE; | ||
906 | |||
907 | kfree(mem_buffer); | ||
908 | } | ||
909 | |||
910 | /* | ||
911 | * i7300_init_csrows Initialize the 'csrows' table within | ||
912 | * the mci control structure with the | ||
913 | * addressing of memory. | ||
914 | * | ||
915 | * return: | ||
916 | * 0 success | ||
917 | * 1 no actual memory found on this MC | ||
918 | */ | ||
919 | static int i7300_init_csrows(struct mem_ctl_info *mci) | ||
920 | { | ||
921 | struct i7300_pvt *pvt; | ||
922 | struct i7300_dimm_info *dinfo; | ||
923 | struct csrow_info *p_csrow; | ||
924 | int empty; | ||
925 | int mtr; | ||
926 | int ch, branch, slot, channel; | ||
927 | |||
928 | pvt = mci->pvt_info; | ||
929 | |||
930 | empty = 1; /* Assume NO memory */ | ||
931 | |||
932 | debugf2("Memory Technology Registers:\n"); | ||
933 | |||
934 | /* Get the AMB present registers for the four channels */ | ||
935 | for (branch = 0; branch < MAX_BRANCHES; branch++) { | ||
936 | /* Read and dump branch 0's MTRs */ | ||
937 | channel = to_channel(0, branch); | ||
938 | pci_read_config_word(pvt->branch_pci[branch], AMBPRESENT_0, | ||
939 | &pvt->ambpresent[channel]); | ||
940 | debugf2("\t\tAMB-present CH%d = 0x%x:\n", | ||
941 | channel, pvt->ambpresent[channel]); | ||
942 | |||
943 | channel = to_channel(1, branch); | ||
944 | pci_read_config_word(pvt->branch_pci[branch], AMBPRESENT_1, | ||
945 | &pvt->ambpresent[channel]); | ||
946 | debugf2("\t\tAMB-present CH%d = 0x%x:\n", | ||
947 | channel, pvt->ambpresent[channel]); | ||
948 | } | ||
949 | |||
950 | /* Get the set of MTR[0-7] regs by each branch */ | ||
951 | for (slot = 0; slot < MAX_SLOTS; slot++) { | ||
952 | int where = mtr_regs[slot]; | ||
953 | for (branch = 0; branch < MAX_BRANCHES; branch++) { | ||
954 | pci_read_config_word(pvt->branch_pci[branch], | ||
955 | where, | ||
956 | &pvt->mtr[slot][branch]); | ||
957 | for (ch = 0; ch < MAX_BRANCHES; ch++) { | ||
958 | int channel = to_channel(ch, branch); | ||
959 | |||
960 | dinfo = &pvt->dimm_info[slot][channel]; | ||
961 | p_csrow = &mci->csrows[slot]; | ||
962 | |||
963 | mtr = decode_mtr(pvt, slot, ch, branch, | ||
964 | dinfo, p_csrow); | ||
965 | /* if no DIMMS on this row, continue */ | ||
966 | if (!MTR_DIMMS_PRESENT(mtr)) | ||
967 | continue; | ||
968 | |||
969 | p_csrow->csrow_idx = slot; | ||
970 | |||
971 | /* FAKE OUT VALUES, FIXME */ | ||
972 | p_csrow->first_page = 0 + slot * 20; | ||
973 | p_csrow->last_page = 9 + slot * 20; | ||
974 | p_csrow->page_mask = 0xfff; | ||
975 | |||
976 | empty = 0; | ||
977 | } | ||
978 | } | ||
979 | } | ||
980 | |||
981 | return empty; | ||
982 | } | ||
983 | |||
984 | static void decode_mir(int mir_no, u16 mir[MAX_MIR]) | ||
985 | { | ||
986 | if (mir[mir_no] & 3) | ||
987 | debugf2("MIR%d: limit= 0x%x Branch(es) that participate: %s %s\n", | ||
988 | mir_no, | ||
989 | (mir[mir_no] >> 4) & 0xfff, | ||
990 | (mir[mir_no] & 1) ? "B0" : "", | ||
991 | (mir[mir_no] & 2) ? "B1": ""); | ||
992 | } | ||
993 | |||
994 | /* | ||
995 | * i7300_get_mc_regs read in the necessary registers and | ||
996 | * cache locally | ||
997 | * | ||
998 | * Fills in the private data members | ||
999 | */ | ||
1000 | static int i7300_get_mc_regs(struct mem_ctl_info *mci) | ||
1001 | { | ||
1002 | struct i7300_pvt *pvt; | ||
1003 | u32 actual_tolm; | ||
1004 | int i, rc; | ||
1005 | |||
1006 | pvt = mci->pvt_info; | ||
1007 | |||
1008 | pci_read_config_dword(pvt->system_address, AMBASE, | ||
1009 | (u32 *) &pvt->ambase); | ||
1010 | |||
1011 | debugf2("AMBASE= 0x%lx\n", (long unsigned int)pvt->ambase); | ||
1012 | |||
1013 | /* Get the Branch Map regs */ | ||
1014 | pci_read_config_word(pvt->branchmap_werrors, TOLM, &pvt->tolm); | ||
1015 | pvt->tolm >>= 12; | ||
1016 | debugf2("TOLM (number of 256M regions) =%u (0x%x)\n", pvt->tolm, | ||
1017 | pvt->tolm); | ||
1018 | |||
1019 | actual_tolm = (u32) ((1000l * pvt->tolm) >> (30 - 28)); | ||
1020 | debugf2("Actual TOLM byte addr=%u.%03u GB (0x%x)\n", | ||
1021 | actual_tolm/1000, actual_tolm % 1000, pvt->tolm << 28); | ||
1022 | |||
1023 | pci_read_config_word(pvt->branchmap_werrors, MIR0, &pvt->mir[0]); | ||
1024 | pci_read_config_word(pvt->branchmap_werrors, MIR1, &pvt->mir[1]); | ||
1025 | pci_read_config_word(pvt->branchmap_werrors, MIR2, &pvt->mir[2]); | ||
1026 | |||
1027 | /* Decode the MIR regs */ | ||
1028 | for (i = 0; i < MAX_MIR; i++) | ||
1029 | decode_mir(i, pvt->mir); | ||
1030 | |||
1031 | rc = i7300_init_csrows(mci); | ||
1032 | if (rc < 0) | ||
1033 | return rc; | ||
1034 | |||
1035 | /* Go and determine the size of each DIMM and place in an | ||
1036 | * orderly matrix */ | ||
1037 | print_dimm_size(pvt); | ||
1038 | |||
1039 | return 0; | ||
1040 | } | ||
1041 | |||
1042 | /* | ||
1043 | * i7300_put_devices 'put' all the devices that we have | ||
1044 | * reserved via 'get' | ||
1045 | */ | ||
1046 | static void i7300_put_devices(struct mem_ctl_info *mci) | ||
1047 | { | ||
1048 | struct i7300_pvt *pvt; | ||
1049 | int branch; | ||
1050 | |||
1051 | pvt = mci->pvt_info; | ||
1052 | |||
1053 | /* Decrement usage count for devices */ | ||
1054 | for (branch = 0; branch < MAX_CH_PER_BRANCH; branch++) | ||
1055 | pci_dev_put(pvt->branch_pci[branch]); | ||
1056 | pci_dev_put(pvt->fsb_error_regs); | ||
1057 | pci_dev_put(pvt->branchmap_werrors); | ||
1058 | } | ||
1059 | |||
1060 | /* | ||
1061 | * i7300_get_devices Find and perform 'get' operation on the MCH's | ||
1062 | * device/functions we want to reference for this driver | ||
1063 | * | ||
1064 | * Need to 'get' device 16 func 1 and func 2 | ||
1065 | */ | ||
1066 | static int i7300_get_devices(struct mem_ctl_info *mci, int dev_idx) | ||
1067 | { | ||
1068 | struct i7300_pvt *pvt; | ||
1069 | struct pci_dev *pdev; | ||
1070 | |||
1071 | pvt = mci->pvt_info; | ||
1072 | |||
1073 | /* Attempt to 'get' the MCH register we want */ | ||
1074 | pdev = NULL; | ||
1075 | while (!pvt->branchmap_werrors || !pvt->fsb_error_regs) { | ||
1076 | pdev = pci_get_device(PCI_VENDOR_ID_INTEL, | ||
1077 | PCI_DEVICE_ID_INTEL_I7300_MCH_ERR, pdev); | ||
1078 | if (!pdev) { | ||
1079 | /* End of list, leave */ | ||
1080 | i7300_printk(KERN_ERR, | ||
1081 | "'system address,Process Bus' " | ||
1082 | "device not found:" | ||
1083 | "vendor 0x%x device 0x%x ERR funcs " | ||
1084 | "(broken BIOS?)\n", | ||
1085 | PCI_VENDOR_ID_INTEL, | ||
1086 | PCI_DEVICE_ID_INTEL_I7300_MCH_ERR); | ||
1087 | goto error; | ||
1088 | } | ||
1089 | |||
1090 | /* Store device 16 funcs 1 and 2 */ | ||
1091 | switch (PCI_FUNC(pdev->devfn)) { | ||
1092 | case 1: | ||
1093 | pvt->branchmap_werrors = pdev; | ||
1094 | break; | ||
1095 | case 2: | ||
1096 | pvt->fsb_error_regs = pdev; | ||
1097 | break; | ||
1098 | } | ||
1099 | } | ||
1100 | |||
1101 | debugf1("System Address, processor bus- PCI Bus ID: %s %x:%x\n", | ||
1102 | pci_name(pvt->system_address), | ||
1103 | pvt->system_address->vendor, pvt->system_address->device); | ||
1104 | debugf1("Branchmap, control and errors - PCI Bus ID: %s %x:%x\n", | ||
1105 | pci_name(pvt->branchmap_werrors), | ||
1106 | pvt->branchmap_werrors->vendor, pvt->branchmap_werrors->device); | ||
1107 | debugf1("FSB Error Regs - PCI Bus ID: %s %x:%x\n", | ||
1108 | pci_name(pvt->fsb_error_regs), | ||
1109 | pvt->fsb_error_regs->vendor, pvt->fsb_error_regs->device); | ||
1110 | |||
1111 | pvt->branch_pci[0] = pci_get_device(PCI_VENDOR_ID_INTEL, | ||
1112 | PCI_DEVICE_ID_INTEL_I7300_MCH_FB0, | ||
1113 | NULL); | ||
1114 | if (!pvt->branch_pci[0]) { | ||
1115 | i7300_printk(KERN_ERR, | ||
1116 | "MC: 'BRANCH 0' device not found:" | ||
1117 | "vendor 0x%x device 0x%x Func 0 (broken BIOS?)\n", | ||
1118 | PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_I7300_MCH_FB0); | ||
1119 | goto error; | ||
1120 | } | ||
1121 | |||
1122 | pvt->branch_pci[1] = pci_get_device(PCI_VENDOR_ID_INTEL, | ||
1123 | PCI_DEVICE_ID_INTEL_I7300_MCH_FB1, | ||
1124 | NULL); | ||
1125 | if (!pvt->branch_pci[1]) { | ||
1126 | i7300_printk(KERN_ERR, | ||
1127 | "MC: 'BRANCH 1' device not found:" | ||
1128 | "vendor 0x%x device 0x%x Func 0 " | ||
1129 | "(broken BIOS?)\n", | ||
1130 | PCI_VENDOR_ID_INTEL, | ||
1131 | PCI_DEVICE_ID_INTEL_I7300_MCH_FB1); | ||
1132 | goto error; | ||
1133 | } | ||
1134 | |||
1135 | return 0; | ||
1136 | |||
1137 | error: | ||
1138 | i7300_put_devices(mci); | ||
1139 | return -ENODEV; | ||
1140 | } | ||
1141 | |||
1142 | /* | ||
1143 | * i7300_probe1 Probe for ONE instance of device to see if it is | ||
1144 | * present. | ||
1145 | * return: | ||
1146 | * 0 for FOUND a device | ||
1147 | * < 0 for error code | ||
1148 | */ | ||
1149 | static int i7300_probe1(struct pci_dev *pdev, int dev_idx) | ||
1150 | { | ||
1151 | struct mem_ctl_info *mci; | ||
1152 | struct i7300_pvt *pvt; | ||
1153 | int num_channels; | ||
1154 | int num_dimms_per_channel; | ||
1155 | int num_csrows; | ||
1156 | |||
1157 | if (dev_idx >= ARRAY_SIZE(i7300_devs)) | ||
1158 | return -EINVAL; | ||
1159 | |||
1160 | debugf0("MC: " __FILE__ ": %s(), pdev bus %u dev=0x%x fn=0x%x\n", | ||
1161 | __func__, | ||
1162 | pdev->bus->number, | ||
1163 | PCI_SLOT(pdev->devfn), PCI_FUNC(pdev->devfn)); | ||
1164 | |||
1165 | /* We only are looking for func 0 of the set */ | ||
1166 | if (PCI_FUNC(pdev->devfn) != 0) | ||
1167 | return -ENODEV; | ||
1168 | |||
1169 | /* As we don't have a motherboard identification routine to determine | ||
1170 | * actual number of slots/dimms per channel, we thus utilize the | ||
1171 | * resource as specified by the chipset. Thus, we might have | ||
1172 | * have more DIMMs per channel than actually on the mobo, but this | ||
1173 | * allows the driver to support upto the chipset max, without | ||
1174 | * some fancy mobo determination. | ||
1175 | */ | ||
1176 | num_dimms_per_channel = MAX_SLOTS; | ||
1177 | num_channels = MAX_CHANNELS; | ||
1178 | num_csrows = MAX_SLOTS * MAX_CHANNELS; | ||
1179 | |||
1180 | debugf0("MC: %s(): Number of - Channels= %d DIMMS= %d CSROWS= %d\n", | ||
1181 | __func__, num_channels, num_dimms_per_channel, num_csrows); | ||
1182 | |||
1183 | /* allocate a new MC control structure */ | ||
1184 | mci = edac_mc_alloc(sizeof(*pvt), num_csrows, num_channels, 0); | ||
1185 | |||
1186 | if (mci == NULL) | ||
1187 | return -ENOMEM; | ||
1188 | |||
1189 | debugf0("MC: " __FILE__ ": %s(): mci = %p\n", __func__, mci); | ||
1190 | |||
1191 | mci->dev = &pdev->dev; /* record ptr to the generic device */ | ||
1192 | |||
1193 | pvt = mci->pvt_info; | ||
1194 | pvt->system_address = pdev; /* Record this device in our private */ | ||
1195 | |||
1196 | /* 'get' the pci devices we want to reserve for our use */ | ||
1197 | if (i7300_get_devices(mci, dev_idx)) | ||
1198 | goto fail0; | ||
1199 | |||
1200 | mci->mc_idx = 0; | ||
1201 | mci->mtype_cap = MEM_FLAG_FB_DDR2; | ||
1202 | mci->edac_ctl_cap = EDAC_FLAG_NONE; | ||
1203 | mci->edac_cap = EDAC_FLAG_NONE; | ||
1204 | mci->mod_name = "i7300_edac.c"; | ||
1205 | mci->mod_ver = I7300_REVISION; | ||
1206 | mci->ctl_name = i7300_devs[dev_idx].ctl_name; | ||
1207 | mci->dev_name = pci_name(pdev); | ||
1208 | mci->ctl_page_to_phys = NULL; | ||
1209 | |||
1210 | #if 0 | ||
1211 | /* Set the function pointer to an actual operation function */ | ||
1212 | mci->edac_check = i7300_check_error; | ||
1213 | #endif | ||
1214 | |||
1215 | /* initialize the MC control structure 'csrows' table | ||
1216 | * with the mapping and control information */ | ||
1217 | if (i7300_get_mc_regs(mci)) { | ||
1218 | debugf0("MC: Setting mci->edac_cap to EDAC_FLAG_NONE\n" | ||
1219 | " because i7300_init_csrows() returned nonzero " | ||
1220 | "value\n"); | ||
1221 | mci->edac_cap = EDAC_FLAG_NONE; /* no csrows found */ | ||
1222 | } else { | ||
1223 | #if 0 | ||
1224 | debugf1("MC: Enable error reporting now\n"); | ||
1225 | i7300_enable_error_reporting(mci); | ||
1226 | #endif | ||
1227 | } | ||
1228 | |||
1229 | /* add this new MC control structure to EDAC's list of MCs */ | ||
1230 | if (edac_mc_add_mc(mci)) { | ||
1231 | debugf0("MC: " __FILE__ | ||
1232 | ": %s(): failed edac_mc_add_mc()\n", __func__); | ||
1233 | /* FIXME: perhaps some code should go here that disables error | ||
1234 | * reporting if we just enabled it | ||
1235 | */ | ||
1236 | goto fail1; | ||
1237 | } | ||
1238 | |||
1239 | #if 0 | ||
1240 | i7300_clear_error(mci); | ||
1241 | #endif | ||
1242 | |||
1243 | /* allocating generic PCI control info */ | ||
1244 | i7300_pci = edac_pci_create_generic_ctl(&pdev->dev, EDAC_MOD_STR); | ||
1245 | if (!i7300_pci) { | ||
1246 | printk(KERN_WARNING | ||
1247 | "%s(): Unable to create PCI control\n", | ||
1248 | __func__); | ||
1249 | printk(KERN_WARNING | ||
1250 | "%s(): PCI error report via EDAC not setup\n", | ||
1251 | __func__); | ||
1252 | } | ||
1253 | |||
1254 | return 0; | ||
1255 | |||
1256 | /* Error exit unwinding stack */ | ||
1257 | fail1: | ||
1258 | |||
1259 | i7300_put_devices(mci); | ||
1260 | |||
1261 | fail0: | ||
1262 | edac_mc_free(mci); | ||
1263 | return -ENODEV; | ||
1264 | } | ||
1265 | |||
1266 | /* | ||
1267 | * i7300_init_one constructor for one instance of device | ||
1268 | * | ||
1269 | * returns: | ||
1270 | * negative on error | ||
1271 | * count (>= 0) | ||
1272 | */ | ||
1273 | static int __devinit i7300_init_one(struct pci_dev *pdev, | ||
1274 | const struct pci_device_id *id) | ||
1275 | { | ||
1276 | int rc; | ||
1277 | |||
1278 | debugf0("MC: " __FILE__ ": %s()\n", __func__); | ||
1279 | |||
1280 | /* wake up device */ | ||
1281 | rc = pci_enable_device(pdev); | ||
1282 | if (rc == -EIO) | ||
1283 | return rc; | ||
1284 | |||
1285 | /* now probe and enable the device */ | ||
1286 | return i7300_probe1(pdev, id->driver_data); | ||
1287 | } | ||
1288 | |||
1289 | /* | ||
1290 | * i7300_remove_one destructor for one instance of device | ||
1291 | * | ||
1292 | */ | ||
1293 | static void __devexit i7300_remove_one(struct pci_dev *pdev) | ||
1294 | { | ||
1295 | struct mem_ctl_info *mci; | ||
1296 | |||
1297 | debugf0(__FILE__ ": %s()\n", __func__); | ||
1298 | |||
1299 | if (i7300_pci) | ||
1300 | edac_pci_release_generic_ctl(i7300_pci); | ||
1301 | |||
1302 | mci = edac_mc_del_mc(&pdev->dev); | ||
1303 | if (!mci) | ||
1304 | return; | ||
1305 | |||
1306 | /* retrieve references to resources, and free those resources */ | ||
1307 | i7300_put_devices(mci); | ||
1308 | |||
1309 | edac_mc_free(mci); | ||
1310 | } | ||
1311 | |||
1312 | /* | ||
1313 | * pci_device_id table for which devices we are looking for | ||
1314 | * | ||
1315 | * The "E500P" device is the first device supported. | ||
1316 | */ | ||
1317 | static const struct pci_device_id i7300_pci_tbl[] __devinitdata = { | ||
1318 | {PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_I7300_MCH_ERR)}, | ||
1319 | {0,} /* 0 terminated list. */ | ||
1320 | }; | ||
1321 | |||
1322 | MODULE_DEVICE_TABLE(pci, i7300_pci_tbl); | ||
1323 | |||
1324 | /* | ||
1325 | * i7300_driver pci_driver structure for this module | ||
1326 | * | ||
1327 | */ | ||
1328 | static struct pci_driver i7300_driver = { | ||
1329 | .name = "i7300_edac", | ||
1330 | .probe = i7300_init_one, | ||
1331 | .remove = __devexit_p(i7300_remove_one), | ||
1332 | .id_table = i7300_pci_tbl, | ||
1333 | }; | ||
1334 | |||
1335 | /* | ||
1336 | * i7300_init Module entry function | ||
1337 | * Try to initialize this module for its devices | ||
1338 | */ | ||
1339 | static int __init i7300_init(void) | ||
1340 | { | ||
1341 | int pci_rc; | ||
1342 | |||
1343 | debugf2("MC: " __FILE__ ": %s()\n", __func__); | ||
1344 | |||
1345 | /* Ensure that the OPSTATE is set correctly for POLL or NMI */ | ||
1346 | opstate_init(); | ||
1347 | |||
1348 | pci_rc = pci_register_driver(&i7300_driver); | ||
1349 | |||
1350 | return (pci_rc < 0) ? pci_rc : 0; | ||
1351 | } | ||
1352 | |||
1353 | /* | ||
1354 | * i7300_exit() Module exit function | ||
1355 | * Unregister the driver | ||
1356 | */ | ||
1357 | static void __exit i7300_exit(void) | ||
1358 | { | ||
1359 | debugf2("MC: " __FILE__ ": %s()\n", __func__); | ||
1360 | pci_unregister_driver(&i7300_driver); | ||
1361 | } | ||
1362 | |||
1363 | module_init(i7300_init); | ||
1364 | module_exit(i7300_exit); | ||
1365 | |||
1366 | MODULE_LICENSE("GPL"); | ||
1367 | MODULE_AUTHOR("Mauro Carvalho Chehab <mchehab@redhat.com>"); | ||
1368 | MODULE_AUTHOR("Red Hat Inc. (http://www.redhat.com)"); | ||
1369 | MODULE_DESCRIPTION("MC Driver for Intel I7300 memory controllers - " | ||
1370 | I7300_REVISION); | ||
1371 | |||
1372 | module_param(edac_op_state, int, 0444); | ||
1373 | MODULE_PARM_DESC(edac_op_state, "EDAC Error Reporting state: 0=Poll,1=NMI"); | ||