1 // SPDX-License-Identifier: GPL-2.0-only
3 * Intel 7300 class Memory Controllers kernel module (Clarksboro)
5 * Copyright (c) 2010 by:
6 * Mauro Carvalho Chehab
8 * Red Hat Inc. http://www.redhat.com
10 * Intel 7300 Chipset Memory Controller Hub (MCH) - Datasheet
11 * http://www.intel.com/Assets/PDF/datasheet/318082.pdf
13 * TODO: The chipset allow checking for PCI Express errors also. Currently,
14 * the driver covers only memory error errors
16 * This driver uses "csrows" EDAC attribute to represent DIMM slot#
19 #include <linux/module.h>
20 #include <linux/init.h>
21 #include <linux/pci.h>
22 #include <linux/pci_ids.h>
23 #include <linux/slab.h>
24 #include <linux/edac.h>
25 #include <linux/mmzone.h>
27 #include "edac_module.h"
30 * Alter this version for the I7300 module when modifications are made
32 #define I7300_REVISION " Ver: 1.0.0"
34 #define EDAC_MOD_STR "i7300_edac"
36 #define i7300_printk(level, fmt, arg...) \
37 edac_printk(level, "i7300", fmt, ##arg)
39 #define i7300_mc_printk(mci, level, fmt, arg...) \
40 edac_mc_chipset_printk(mci, level, "i7300", fmt, ##arg)
42 /***********************************************
43 * i7300 Limit constants Structs and static vars
44 ***********************************************/
47 * Memory topology is organized as:
48 * Branch 0 - 2 channels: channels 0 and 1 (FDB0 PCI dev 21.0)
49 * Branch 1 - 2 channels: channels 2 and 3 (FDB1 PCI dev 22.0)
50 * Each channel can have to 8 DIMM sets (called as SLOTS)
51 * Slots should generally be filled in pairs
52 * Except on Single Channel mode of operation
53 * just slot 0/channel0 filled on this mode
54 * On normal operation mode, the two channels on a branch should be
55 * filled together for the same SLOT#
56 * When in mirrored mode, Branch 1 replicate memory at Branch 0, so, the four
57 * channels on both branches should be filled
60 /* Limits for i7300 */
62 #define MAX_BRANCHES 2
63 #define MAX_CH_PER_BRANCH 2
64 #define MAX_CHANNELS (MAX_CH_PER_BRANCH * MAX_BRANCHES)
67 #define to_channel(ch, branch) ((((branch)) << 1) | (ch))
69 #define to_csrow(slot, ch, branch) \
70 (to_channel(ch, branch) | ((slot) << 2))
72 /* Device name and register DID (Device ID) */
73 struct i7300_dev_info
{
74 const char *ctl_name
; /* name for this device */
75 u16 fsb_mapping_errors
; /* DID for the branchmap,control */
78 /* Table of devices attributes supported by this driver */
79 static const struct i7300_dev_info i7300_devs
[] = {
82 .fsb_mapping_errors
= PCI_DEVICE_ID_INTEL_I7300_MCH_ERR
,
86 struct i7300_dimm_info
{
87 int megabytes
; /* size, 0 means not present */
90 /* driver private data structure */
92 struct pci_dev
*pci_dev_16_0_fsb_ctlr
; /* 16.0 */
93 struct pci_dev
*pci_dev_16_1_fsb_addr_map
; /* 16.1 */
94 struct pci_dev
*pci_dev_16_2_fsb_err_regs
; /* 16.2 */
95 struct pci_dev
*pci_dev_2x_0_fbd_branch
[MAX_BRANCHES
]; /* 21.0 and 22.0 */
97 u16 tolm
; /* top of low memory */
98 u64 ambase
; /* AMB BAR */
100 u32 mc_settings
; /* Report several settings */
103 u16 mir
[MAX_MIR
]; /* Memory Interleave Reg*/
105 u16 mtr
[MAX_SLOTS
][MAX_BRANCHES
]; /* Memory Technlogy Reg */
106 u16 ambpresent
[MAX_CHANNELS
]; /* AMB present regs */
108 /* DIMM information matrix, allocating architecture maximums */
109 struct i7300_dimm_info dimm_info
[MAX_SLOTS
][MAX_CHANNELS
];
111 /* Temporary buffer for use when preparing error messages */
112 char *tmp_prt_buffer
;
115 /* FIXME: Why do we need to have this static? */
116 static struct edac_pci_ctl_info
*i7300_pci
;
118 /***************************************************
119 * i7300 Register definitions for memory enumeration
120 ***************************************************/
124 * Function 0: System Address (not documented)
125 * Function 1: Memory Branch Map, Control, Errors Register
128 /* OFFSETS for Function 0 */
129 #define AMBASE 0x48 /* AMB Mem Mapped Reg Region Base */
130 #define MAXCH 0x56 /* Max Channel Number */
131 #define MAXDIMMPERCH 0x57 /* Max DIMM PER Channel Number */
133 /* OFFSETS for Function 1 */
134 #define MC_SETTINGS 0x40
135 #define IS_MIRRORED(mc) ((mc) & (1 << 16))
136 #define IS_ECC_ENABLED(mc) ((mc) & (1 << 5))
137 #define IS_RETRY_ENABLED(mc) ((mc) & (1 << 31))
138 #define IS_SCRBALGO_ENHANCED(mc) ((mc) & (1 << 8))
140 #define MC_SETTINGS_A 0x58
141 #define IS_SINGLE_MODE(mca) ((mca) & (1 << 14))
150 * Note: Other Intel EDAC drivers use AMBPRESENT to identify if the available
151 * memory. From datasheet item 7.3.1 (FB-DIMM technology & organization), it
152 * seems that we cannot use this information directly for the same usage.
153 * Each memory slot may have up to 2 AMB interfaces, one for income and another
154 * for outcome interface to the next slot.
155 * For now, the driver just stores the AMB present registers, but rely only at
156 * the MTR info to detect memory.
157 * Datasheet is also not clear about how to map each AMBPRESENT registers to
158 * one of the 4 available channels.
160 #define AMBPRESENT_0 0x64
161 #define AMBPRESENT_1 0x66
163 static const u16 mtr_regs
[MAX_SLOTS
] = {
164 0x80, 0x84, 0x88, 0x8c,
165 0x82, 0x86, 0x8a, 0x8e
169 * Defines to extract the vaious fields from the
170 * MTRx - Memory Technology Registers
172 #define MTR_DIMMS_PRESENT(mtr) ((mtr) & (1 << 8))
173 #define MTR_DIMMS_ETHROTTLE(mtr) ((mtr) & (1 << 7))
174 #define MTR_DRAM_WIDTH(mtr) (((mtr) & (1 << 6)) ? 8 : 4)
175 #define MTR_DRAM_BANKS(mtr) (((mtr) & (1 << 5)) ? 8 : 4)
176 #define MTR_DIMM_RANKS(mtr) (((mtr) & (1 << 4)) ? 1 : 0)
177 #define MTR_DIMM_ROWS(mtr) (((mtr) >> 2) & 0x3)
178 #define MTR_DRAM_BANKS_ADDR_BITS 2
179 #define MTR_DIMM_ROWS_ADDR_BITS(mtr) (MTR_DIMM_ROWS(mtr) + 13)
180 #define MTR_DIMM_COLS(mtr) ((mtr) & 0x3)
181 #define MTR_DIMM_COLS_ADDR_BITS(mtr) (MTR_DIMM_COLS(mtr) + 10)
183 /************************************************
184 * i7300 Register definitions for error detection
185 ************************************************/
188 * Device 16.1: FBD Error Registers
190 #define FERR_FAT_FBD 0x98
191 static const char *ferr_fat_fbd_name
[] = {
192 [22] = "Non-Redundant Fast Reset Timeout",
193 [2] = ">Tmid Thermal event with intelligent throttling disabled",
194 [1] = "Memory or FBD configuration CRC read error",
195 [0] = "Memory Write error on non-redundant retry or "
196 "FBD configuration Write error on retry",
198 #define GET_FBD_FAT_IDX(fbderr) (((fbderr) >> 28) & 3)
199 #define FERR_FAT_FBD_ERR_MASK ((1 << 0) | (1 << 1) | (1 << 2) | (1 << 22))
201 #define FERR_NF_FBD 0xa0
202 static const char *ferr_nf_fbd_name
[] = {
203 [24] = "DIMM-Spare Copy Completed",
204 [23] = "DIMM-Spare Copy Initiated",
205 [22] = "Redundant Fast Reset Timeout",
206 [21] = "Memory Write error on redundant retry",
207 [18] = "SPD protocol Error",
208 [17] = "FBD Northbound parity error on FBD Sync Status",
209 [16] = "Correctable Patrol Data ECC",
210 [15] = "Correctable Resilver- or Spare-Copy Data ECC",
211 [14] = "Correctable Mirrored Demand Data ECC",
212 [13] = "Correctable Non-Mirrored Demand Data ECC",
213 [11] = "Memory or FBD configuration CRC read error",
214 [10] = "FBD Configuration Write error on first attempt",
215 [9] = "Memory Write error on first attempt",
216 [8] = "Non-Aliased Uncorrectable Patrol Data ECC",
217 [7] = "Non-Aliased Uncorrectable Resilver- or Spare-Copy Data ECC",
218 [6] = "Non-Aliased Uncorrectable Mirrored Demand Data ECC",
219 [5] = "Non-Aliased Uncorrectable Non-Mirrored Demand Data ECC",
220 [4] = "Aliased Uncorrectable Patrol Data ECC",
221 [3] = "Aliased Uncorrectable Resilver- or Spare-Copy Data ECC",
222 [2] = "Aliased Uncorrectable Mirrored Demand Data ECC",
223 [1] = "Aliased Uncorrectable Non-Mirrored Demand Data ECC",
224 [0] = "Uncorrectable Data ECC on Replay",
226 #define GET_FBD_NF_IDX(fbderr) (((fbderr) >> 28) & 3)
227 #define FERR_NF_FBD_ERR_MASK ((1 << 24) | (1 << 23) | (1 << 22) | (1 << 21) |\
228 (1 << 18) | (1 << 17) | (1 << 16) | (1 << 15) |\
229 (1 << 14) | (1 << 13) | (1 << 11) | (1 << 10) |\
230 (1 << 9) | (1 << 8) | (1 << 7) | (1 << 6) |\
231 (1 << 5) | (1 << 4) | (1 << 3) | (1 << 2) |\
234 #define EMASK_FBD 0xa8
235 #define EMASK_FBD_ERR_MASK ((1 << 27) | (1 << 26) | (1 << 25) | (1 << 24) |\
236 (1 << 22) | (1 << 21) | (1 << 20) | (1 << 19) |\
237 (1 << 18) | (1 << 17) | (1 << 16) | (1 << 14) |\
238 (1 << 13) | (1 << 12) | (1 << 11) | (1 << 10) |\
239 (1 << 9) | (1 << 8) | (1 << 7) | (1 << 6) |\
240 (1 << 5) | (1 << 4) | (1 << 3) | (1 << 2) |\
244 * Device 16.2: Global Error Registers
247 #define FERR_GLOBAL_HI 0x48
248 static const char *ferr_global_hi_name
[] = {
249 [3] = "FSB 3 Fatal Error",
250 [2] = "FSB 2 Fatal Error",
251 [1] = "FSB 1 Fatal Error",
252 [0] = "FSB 0 Fatal Error",
254 #define ferr_global_hi_is_fatal(errno) 1
256 #define FERR_GLOBAL_LO 0x40
257 static const char *ferr_global_lo_name
[] = {
258 [31] = "Internal MCH Fatal Error",
259 [30] = "Intel QuickData Technology Device Fatal Error",
260 [29] = "FSB1 Fatal Error",
261 [28] = "FSB0 Fatal Error",
262 [27] = "FBD Channel 3 Fatal Error",
263 [26] = "FBD Channel 2 Fatal Error",
264 [25] = "FBD Channel 1 Fatal Error",
265 [24] = "FBD Channel 0 Fatal Error",
266 [23] = "PCI Express Device 7Fatal Error",
267 [22] = "PCI Express Device 6 Fatal Error",
268 [21] = "PCI Express Device 5 Fatal Error",
269 [20] = "PCI Express Device 4 Fatal Error",
270 [19] = "PCI Express Device 3 Fatal Error",
271 [18] = "PCI Express Device 2 Fatal Error",
272 [17] = "PCI Express Device 1 Fatal Error",
273 [16] = "ESI Fatal Error",
274 [15] = "Internal MCH Non-Fatal Error",
275 [14] = "Intel QuickData Technology Device Non Fatal Error",
276 [13] = "FSB1 Non-Fatal Error",
277 [12] = "FSB 0 Non-Fatal Error",
278 [11] = "FBD Channel 3 Non-Fatal Error",
279 [10] = "FBD Channel 2 Non-Fatal Error",
280 [9] = "FBD Channel 1 Non-Fatal Error",
281 [8] = "FBD Channel 0 Non-Fatal Error",
282 [7] = "PCI Express Device 7 Non-Fatal Error",
283 [6] = "PCI Express Device 6 Non-Fatal Error",
284 [5] = "PCI Express Device 5 Non-Fatal Error",
285 [4] = "PCI Express Device 4 Non-Fatal Error",
286 [3] = "PCI Express Device 3 Non-Fatal Error",
287 [2] = "PCI Express Device 2 Non-Fatal Error",
288 [1] = "PCI Express Device 1 Non-Fatal Error",
289 [0] = "ESI Non-Fatal Error",
291 #define ferr_global_lo_is_fatal(errno) ((errno < 16) ? 0 : 1)
293 #define NRECMEMA 0xbe
294 #define NRECMEMA_BANK(v) (((v) >> 12) & 7)
295 #define NRECMEMA_RANK(v) (((v) >> 8) & 15)
297 #define NRECMEMB 0xc0
298 #define NRECMEMB_IS_WR(v) ((v) & (1 << 31))
299 #define NRECMEMB_CAS(v) (((v) >> 16) & 0x1fff)
300 #define NRECMEMB_RAS(v) ((v) & 0xffff)
307 #define RECMEMA_BANK(v) (((v) >> 12) & 7)
308 #define RECMEMA_RANK(v) (((v) >> 8) & 15)
311 #define RECMEMB_IS_WR(v) ((v) & (1 << 31))
312 #define RECMEMB_CAS(v) (((v) >> 16) & 0x1fff)
313 #define RECMEMB_RAS(v) ((v) & 0xffff)
315 /********************************************
316 * i7300 Functions related to error detection
317 ********************************************/
320 * get_err_from_table() - Gets the error message from a table
321 * @table: table name (array of char *)
322 * @size: number of elements at the table
323 * @pos: position of the element to be returned
325 * This is a small routine that gets the pos-th element of a table. If the
326 * element doesn't exist (or it is empty), it returns "reserved".
327 * Instead of calling it directly, the better is to call via the macro
328 * GET_ERR_FROM_TABLE(), that automatically checks the table size via
331 static const char *get_err_from_table(const char *table
[], int size
, int pos
)
333 if (unlikely(pos
>= size
))
336 if (unlikely(!table
[pos
]))
342 #define GET_ERR_FROM_TABLE(table, pos) \
343 get_err_from_table(table, ARRAY_SIZE(table), pos)
346 * i7300_process_error_global() - Retrieve the hardware error information from
347 * the hardware global error registers and
349 * @mci: struct mem_ctl_info pointer
351 static void i7300_process_error_global(struct mem_ctl_info
*mci
)
353 struct i7300_pvt
*pvt
;
354 u32 errnum
, error_reg
;
355 unsigned long errors
;
356 const char *specific
;
361 /* read in the 1st FATAL error register */
362 pci_read_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
363 FERR_GLOBAL_HI
, &error_reg
);
364 if (unlikely(error_reg
)) {
366 errnum
= find_first_bit(&errors
,
367 ARRAY_SIZE(ferr_global_hi_name
));
368 specific
= GET_ERR_FROM_TABLE(ferr_global_hi_name
, errnum
);
369 is_fatal
= ferr_global_hi_is_fatal(errnum
);
371 /* Clear the error bit */
372 pci_write_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
373 FERR_GLOBAL_HI
, error_reg
);
378 pci_read_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
379 FERR_GLOBAL_LO
, &error_reg
);
380 if (unlikely(error_reg
)) {
382 errnum
= find_first_bit(&errors
,
383 ARRAY_SIZE(ferr_global_lo_name
));
384 specific
= GET_ERR_FROM_TABLE(ferr_global_lo_name
, errnum
);
385 is_fatal
= ferr_global_lo_is_fatal(errnum
);
387 /* Clear the error bit */
388 pci_write_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
389 FERR_GLOBAL_LO
, error_reg
);
396 i7300_mc_printk(mci
, KERN_EMERG
, "%s misc error: %s\n",
397 is_fatal
? "Fatal" : "NOT fatal", specific
);
401 * i7300_process_fbd_error() - Retrieve the hardware error information from
402 * the FBD error registers and sends it via
403 * EDAC error API calls
404 * @mci: struct mem_ctl_info pointer
406 static void i7300_process_fbd_error(struct mem_ctl_info
*mci
)
408 struct i7300_pvt
*pvt
;
409 u32 errnum
, value
, error_reg
;
411 unsigned branch
, channel
, bank
, rank
, cas
, ras
;
414 unsigned long errors
;
415 const char *specific
;
420 /* read in the 1st FATAL error register */
421 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
422 FERR_FAT_FBD
, &error_reg
);
423 if (unlikely(error_reg
& FERR_FAT_FBD_ERR_MASK
)) {
424 errors
= error_reg
& FERR_FAT_FBD_ERR_MASK
;
425 errnum
= find_first_bit(&errors
,
426 ARRAY_SIZE(ferr_fat_fbd_name
));
427 specific
= GET_ERR_FROM_TABLE(ferr_fat_fbd_name
, errnum
);
428 branch
= (GET_FBD_FAT_IDX(error_reg
) == 2) ? 1 : 0;
430 pci_read_config_word(pvt
->pci_dev_16_1_fsb_addr_map
,
432 bank
= NRECMEMA_BANK(val16
);
433 rank
= NRECMEMA_RANK(val16
);
435 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
437 is_wr
= NRECMEMB_IS_WR(value
);
438 cas
= NRECMEMB_CAS(value
);
439 ras
= NRECMEMB_RAS(value
);
441 /* Clean the error register */
442 pci_write_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
443 FERR_FAT_FBD
, error_reg
);
445 snprintf(pvt
->tmp_prt_buffer
, PAGE_SIZE
,
446 "Bank=%d RAS=%d CAS=%d Err=0x%lx (%s))",
447 bank
, ras
, cas
, errors
, specific
);
449 edac_mc_handle_error(HW_EVENT_ERR_FATAL
, mci
, 1, 0, 0, 0,
451 is_wr
? "Write error" : "Read error",
452 pvt
->tmp_prt_buffer
);
456 /* read in the 1st NON-FATAL error register */
457 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
458 FERR_NF_FBD
, &error_reg
);
459 if (unlikely(error_reg
& FERR_NF_FBD_ERR_MASK
)) {
460 errors
= error_reg
& FERR_NF_FBD_ERR_MASK
;
461 errnum
= find_first_bit(&errors
,
462 ARRAY_SIZE(ferr_nf_fbd_name
));
463 specific
= GET_ERR_FROM_TABLE(ferr_nf_fbd_name
, errnum
);
464 branch
= (GET_FBD_NF_IDX(error_reg
) == 2) ? 1 : 0;
466 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
469 pci_read_config_word(pvt
->pci_dev_16_1_fsb_addr_map
,
471 bank
= RECMEMA_BANK(val16
);
472 rank
= RECMEMA_RANK(val16
);
474 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
476 is_wr
= RECMEMB_IS_WR(value
);
477 cas
= RECMEMB_CAS(value
);
478 ras
= RECMEMB_RAS(value
);
480 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
482 channel
= (branch
<< 1);
484 /* Second channel ? */
485 channel
+= !!(value
& BIT(17));
487 /* Clear the error bit */
488 pci_write_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
489 FERR_NF_FBD
, error_reg
);
491 /* Form out message */
492 snprintf(pvt
->tmp_prt_buffer
, PAGE_SIZE
,
493 "DRAM-Bank=%d RAS=%d CAS=%d, Err=0x%lx (%s))",
494 bank
, ras
, cas
, errors
, specific
);
496 edac_mc_handle_error(HW_EVENT_ERR_CORRECTED
, mci
, 1, 0, 0,
498 branch
>> 1, channel
% 2, rank
,
499 is_wr
? "Write error" : "Read error",
500 pvt
->tmp_prt_buffer
);
506 * i7300_check_error() - Calls the error checking subroutines
507 * @mci: struct mem_ctl_info pointer
509 static void i7300_check_error(struct mem_ctl_info
*mci
)
511 i7300_process_error_global(mci
);
512 i7300_process_fbd_error(mci
);
516 * i7300_clear_error() - Clears the error registers
517 * @mci: struct mem_ctl_info pointer
519 static void i7300_clear_error(struct mem_ctl_info
*mci
)
521 struct i7300_pvt
*pvt
= mci
->pvt_info
;
524 * All error values are RWC - we need to read and write 1 to the
525 * bit that we want to cleanup
528 /* Clear global error registers */
529 pci_read_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
530 FERR_GLOBAL_HI
, &value
);
531 pci_write_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
532 FERR_GLOBAL_HI
, value
);
534 pci_read_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
535 FERR_GLOBAL_LO
, &value
);
536 pci_write_config_dword(pvt
->pci_dev_16_2_fsb_err_regs
,
537 FERR_GLOBAL_LO
, value
);
539 /* Clear FBD error registers */
540 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
541 FERR_FAT_FBD
, &value
);
542 pci_write_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
543 FERR_FAT_FBD
, value
);
545 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
546 FERR_NF_FBD
, &value
);
547 pci_write_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
552 * i7300_enable_error_reporting() - Enable the memory reporting logic at the
554 * @mci: struct mem_ctl_info pointer
556 static void i7300_enable_error_reporting(struct mem_ctl_info
*mci
)
558 struct i7300_pvt
*pvt
= mci
->pvt_info
;
561 /* Read the FBD Error Mask Register */
562 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
563 EMASK_FBD
, &fbd_error_mask
);
565 /* Enable with a '0' */
566 fbd_error_mask
&= ~(EMASK_FBD_ERR_MASK
);
568 pci_write_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
,
569 EMASK_FBD
, fbd_error_mask
);
572 /************************************************
573 * i7300 Functions related to memory enumberation
574 ************************************************/
577 * decode_mtr() - Decodes the MTR descriptor, filling the edac structs
578 * @pvt: pointer to the private data struct used by i7300 driver
579 * @slot: DIMM slot (0 to 7)
580 * @ch: Channel number within the branch (0 or 1)
581 * @branch: Branch number (0 or 1)
582 * @dinfo: Pointer to DIMM info where dimm size is stored
583 * @dimm: Pointer to the struct dimm_info that corresponds to that element
585 static int decode_mtr(struct i7300_pvt
*pvt
,
586 int slot
, int ch
, int branch
,
587 struct i7300_dimm_info
*dinfo
,
588 struct dimm_info
*dimm
)
590 int mtr
, ans
, addrBits
, channel
;
592 channel
= to_channel(ch
, branch
);
594 mtr
= pvt
->mtr
[slot
][branch
];
595 ans
= MTR_DIMMS_PRESENT(mtr
) ? 1 : 0;
597 edac_dbg(2, "\tMTR%d CH%d: DIMMs are %sPresent (mtr)\n",
598 slot
, channel
, ans
? "" : "NOT ");
600 /* Determine if there is a DIMM present in this DIMM slot */
604 /* Start with the number of bits for a Bank
606 addrBits
= MTR_DRAM_BANKS_ADDR_BITS
;
607 /* Add thenumber of ROW bits */
608 addrBits
+= MTR_DIMM_ROWS_ADDR_BITS(mtr
);
609 /* add the number of COLUMN bits */
610 addrBits
+= MTR_DIMM_COLS_ADDR_BITS(mtr
);
611 /* add the number of RANK bits */
612 addrBits
+= MTR_DIMM_RANKS(mtr
);
614 addrBits
+= 6; /* add 64 bits per DIMM */
615 addrBits
-= 20; /* divide by 2^^20 */
616 addrBits
-= 3; /* 8 bits per bytes */
618 dinfo
->megabytes
= 1 << addrBits
;
620 edac_dbg(2, "\t\tWIDTH: x%d\n", MTR_DRAM_WIDTH(mtr
));
622 edac_dbg(2, "\t\tELECTRICAL THROTTLING is %s\n",
623 MTR_DIMMS_ETHROTTLE(mtr
) ? "enabled" : "disabled");
625 edac_dbg(2, "\t\tNUMBANK: %d bank(s)\n", MTR_DRAM_BANKS(mtr
));
626 edac_dbg(2, "\t\tNUMRANK: %s\n",
627 MTR_DIMM_RANKS(mtr
) ? "double" : "single");
628 edac_dbg(2, "\t\tNUMROW: %s\n",
629 MTR_DIMM_ROWS(mtr
) == 0 ? "8,192 - 13 rows" :
630 MTR_DIMM_ROWS(mtr
) == 1 ? "16,384 - 14 rows" :
631 MTR_DIMM_ROWS(mtr
) == 2 ? "32,768 - 15 rows" :
633 edac_dbg(2, "\t\tNUMCOL: %s\n",
634 MTR_DIMM_COLS(mtr
) == 0 ? "1,024 - 10 columns" :
635 MTR_DIMM_COLS(mtr
) == 1 ? "2,048 - 11 columns" :
636 MTR_DIMM_COLS(mtr
) == 2 ? "4,096 - 12 columns" :
638 edac_dbg(2, "\t\tSIZE: %d MB\n", dinfo
->megabytes
);
641 * The type of error detection actually depends of the
642 * mode of operation. When it is just one single memory chip, at
643 * socket 0, channel 0, it uses 8-byte-over-32-byte SECDED+ code.
644 * In normal or mirrored mode, it uses Lockstep mode,
645 * with the possibility of using an extended algorithm for x8 memories
646 * See datasheet Sections 7.3.6 to 7.3.8
649 dimm
->nr_pages
= MiB_TO_PAGES(dinfo
->megabytes
);
651 dimm
->mtype
= MEM_FB_DDR2
;
652 if (IS_SINGLE_MODE(pvt
->mc_settings_a
)) {
653 dimm
->edac_mode
= EDAC_SECDED
;
654 edac_dbg(2, "\t\tECC code is 8-byte-over-32-byte SECDED+ code\n");
656 edac_dbg(2, "\t\tECC code is on Lockstep mode\n");
657 if (MTR_DRAM_WIDTH(mtr
) == 8)
658 dimm
->edac_mode
= EDAC_S8ECD8ED
;
660 dimm
->edac_mode
= EDAC_S4ECD4ED
;
663 /* ask what device type on this row */
664 if (MTR_DRAM_WIDTH(mtr
) == 8) {
665 edac_dbg(2, "\t\tScrub algorithm for x8 is on %s mode\n",
666 IS_SCRBALGO_ENHANCED(pvt
->mc_settings
) ?
667 "enhanced" : "normal");
669 dimm
->dtype
= DEV_X8
;
671 dimm
->dtype
= DEV_X4
;
677 * print_dimm_size() - Prints dump of the memory organization
678 * @pvt: pointer to the private data struct used by i7300 driver
680 * Useful for debug. If debug is disabled, this routine do nothing
682 static void print_dimm_size(struct i7300_pvt
*pvt
)
684 #ifdef CONFIG_EDAC_DEBUG
685 struct i7300_dimm_info
*dinfo
;
691 p
= pvt
->tmp_prt_buffer
;
693 n
= snprintf(p
, space
, " ");
696 for (channel
= 0; channel
< MAX_CHANNELS
; channel
++) {
697 n
= snprintf(p
, space
, "channel %d | ", channel
);
701 edac_dbg(2, "%s\n", pvt
->tmp_prt_buffer
);
702 p
= pvt
->tmp_prt_buffer
;
704 n
= snprintf(p
, space
, "-------------------------------"
705 "------------------------------");
708 edac_dbg(2, "%s\n", pvt
->tmp_prt_buffer
);
709 p
= pvt
->tmp_prt_buffer
;
712 for (slot
= 0; slot
< MAX_SLOTS
; slot
++) {
713 n
= snprintf(p
, space
, "csrow/SLOT %d ", slot
);
717 for (channel
= 0; channel
< MAX_CHANNELS
; channel
++) {
718 dinfo
= &pvt
->dimm_info
[slot
][channel
];
719 n
= snprintf(p
, space
, "%4d MB | ", dinfo
->megabytes
);
724 edac_dbg(2, "%s\n", pvt
->tmp_prt_buffer
);
725 p
= pvt
->tmp_prt_buffer
;
729 n
= snprintf(p
, space
, "-------------------------------"
730 "------------------------------");
733 edac_dbg(2, "%s\n", pvt
->tmp_prt_buffer
);
734 p
= pvt
->tmp_prt_buffer
;
740 * i7300_init_csrows() - Initialize the 'csrows' table within
741 * the mci control structure with the
742 * addressing of memory.
743 * @mci: struct mem_ctl_info pointer
745 static int i7300_init_csrows(struct mem_ctl_info
*mci
)
747 struct i7300_pvt
*pvt
;
748 struct i7300_dimm_info
*dinfo
;
751 int ch
, branch
, slot
, channel
, max_channel
, max_branch
;
752 struct dimm_info
*dimm
;
756 edac_dbg(2, "Memory Technology Registers:\n");
758 if (IS_SINGLE_MODE(pvt
->mc_settings_a
)) {
762 max_branch
= MAX_BRANCHES
;
763 max_channel
= MAX_CH_PER_BRANCH
;
766 /* Get the AMB present registers for the four channels */
767 for (branch
= 0; branch
< max_branch
; branch
++) {
768 /* Read and dump branch 0's MTRs */
769 channel
= to_channel(0, branch
);
770 pci_read_config_word(pvt
->pci_dev_2x_0_fbd_branch
[branch
],
772 &pvt
->ambpresent
[channel
]);
773 edac_dbg(2, "\t\tAMB-present CH%d = 0x%x:\n",
774 channel
, pvt
->ambpresent
[channel
]);
776 if (max_channel
== 1)
779 channel
= to_channel(1, branch
);
780 pci_read_config_word(pvt
->pci_dev_2x_0_fbd_branch
[branch
],
782 &pvt
->ambpresent
[channel
]);
783 edac_dbg(2, "\t\tAMB-present CH%d = 0x%x:\n",
784 channel
, pvt
->ambpresent
[channel
]);
787 /* Get the set of MTR[0-7] regs by each branch */
788 for (slot
= 0; slot
< MAX_SLOTS
; slot
++) {
789 int where
= mtr_regs
[slot
];
790 for (branch
= 0; branch
< max_branch
; branch
++) {
791 pci_read_config_word(pvt
->pci_dev_2x_0_fbd_branch
[branch
],
793 &pvt
->mtr
[slot
][branch
]);
794 for (ch
= 0; ch
< max_channel
; ch
++) {
795 int channel
= to_channel(ch
, branch
);
797 dimm
= edac_get_dimm(mci
, branch
, ch
, slot
);
799 dinfo
= &pvt
->dimm_info
[slot
][channel
];
801 mtr
= decode_mtr(pvt
, slot
, ch
, branch
,
804 /* if no DIMMS on this row, continue */
805 if (!MTR_DIMMS_PRESENT(mtr
))
818 * decode_mir() - Decodes Memory Interleave Register (MIR) info
819 * @mir_no: number of the MIR register to decode
820 * @mir: array with the MIR data cached on the driver
822 static void decode_mir(int mir_no
, u16 mir
[MAX_MIR
])
825 edac_dbg(2, "MIR%d: limit= 0x%x Branch(es) that participate: %s %s\n",
827 (mir
[mir_no
] >> 4) & 0xfff,
828 (mir
[mir_no
] & 1) ? "B0" : "",
829 (mir
[mir_no
] & 2) ? "B1" : "");
833 * i7300_get_mc_regs() - Get the contents of the MC enumeration registers
834 * @mci: struct mem_ctl_info pointer
836 * Data read is cached internally for its usage when needed
838 static int i7300_get_mc_regs(struct mem_ctl_info
*mci
)
840 struct i7300_pvt
*pvt
;
846 pci_read_config_dword(pvt
->pci_dev_16_0_fsb_ctlr
, AMBASE
,
847 (u32
*) &pvt
->ambase
);
849 edac_dbg(2, "AMBASE= 0x%lx\n", (long unsigned int)pvt
->ambase
);
851 /* Get the Branch Map regs */
852 pci_read_config_word(pvt
->pci_dev_16_1_fsb_addr_map
, TOLM
, &pvt
->tolm
);
854 edac_dbg(2, "TOLM (number of 256M regions) =%u (0x%x)\n",
855 pvt
->tolm
, pvt
->tolm
);
857 actual_tolm
= (u32
) ((1000l * pvt
->tolm
) >> (30 - 28));
858 edac_dbg(2, "Actual TOLM byte addr=%u.%03u GB (0x%x)\n",
859 actual_tolm
/1000, actual_tolm
% 1000, pvt
->tolm
<< 28);
861 /* Get memory controller settings */
862 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
, MC_SETTINGS
,
864 pci_read_config_dword(pvt
->pci_dev_16_1_fsb_addr_map
, MC_SETTINGS_A
,
865 &pvt
->mc_settings_a
);
867 if (IS_SINGLE_MODE(pvt
->mc_settings_a
))
868 edac_dbg(0, "Memory controller operating on single mode\n");
870 edac_dbg(0, "Memory controller operating on %smirrored mode\n",
871 IS_MIRRORED(pvt
->mc_settings
) ? "" : "non-");
873 edac_dbg(0, "Error detection is %s\n",
874 IS_ECC_ENABLED(pvt
->mc_settings
) ? "enabled" : "disabled");
875 edac_dbg(0, "Retry is %s\n",
876 IS_RETRY_ENABLED(pvt
->mc_settings
) ? "enabled" : "disabled");
878 /* Get Memory Interleave Range registers */
879 pci_read_config_word(pvt
->pci_dev_16_1_fsb_addr_map
, MIR0
,
881 pci_read_config_word(pvt
->pci_dev_16_1_fsb_addr_map
, MIR1
,
883 pci_read_config_word(pvt
->pci_dev_16_1_fsb_addr_map
, MIR2
,
886 /* Decode the MIR regs */
887 for (i
= 0; i
< MAX_MIR
; i
++)
888 decode_mir(i
, pvt
->mir
);
890 rc
= i7300_init_csrows(mci
);
894 /* Go and determine the size of each DIMM and place in an
896 print_dimm_size(pvt
);
901 /*************************************************
902 * i7300 Functions related to device probe/release
903 *************************************************/
906 * i7300_put_devices() - Release the PCI devices
907 * @mci: struct mem_ctl_info pointer
909 static void i7300_put_devices(struct mem_ctl_info
*mci
)
911 struct i7300_pvt
*pvt
;
916 /* Decrement usage count for devices */
917 for (branch
= 0; branch
< MAX_CH_PER_BRANCH
; branch
++)
918 pci_dev_put(pvt
->pci_dev_2x_0_fbd_branch
[branch
]);
919 pci_dev_put(pvt
->pci_dev_16_2_fsb_err_regs
);
920 pci_dev_put(pvt
->pci_dev_16_1_fsb_addr_map
);
924 * i7300_get_devices() - Find and perform 'get' operation on the MCH's
925 * device/functions we want to reference for this driver
926 * @mci: struct mem_ctl_info pointer
928 * Access and prepare the several devices for usage:
929 * I7300 devices used by this driver:
930 * Device 16, functions 0,1 and 2: PCI_DEVICE_ID_INTEL_I7300_MCH_ERR
931 * Device 21 function 0: PCI_DEVICE_ID_INTEL_I7300_MCH_FB0
932 * Device 22 function 0: PCI_DEVICE_ID_INTEL_I7300_MCH_FB1
934 static int i7300_get_devices(struct mem_ctl_info
*mci
)
936 struct i7300_pvt
*pvt
;
937 struct pci_dev
*pdev
;
941 /* Attempt to 'get' the MCH register we want */
943 while ((pdev
= pci_get_device(PCI_VENDOR_ID_INTEL
,
944 PCI_DEVICE_ID_INTEL_I7300_MCH_ERR
,
946 /* Store device 16 funcs 1 and 2 */
947 switch (PCI_FUNC(pdev
->devfn
)) {
949 if (!pvt
->pci_dev_16_1_fsb_addr_map
)
950 pvt
->pci_dev_16_1_fsb_addr_map
=
954 if (!pvt
->pci_dev_16_2_fsb_err_regs
)
955 pvt
->pci_dev_16_2_fsb_err_regs
=
961 if (!pvt
->pci_dev_16_1_fsb_addr_map
||
962 !pvt
->pci_dev_16_2_fsb_err_regs
) {
963 /* At least one device was not found */
964 i7300_printk(KERN_ERR
,
965 "'system address,Process Bus' device not found:"
966 "vendor 0x%x device 0x%x ERR funcs (broken BIOS?)\n",
968 PCI_DEVICE_ID_INTEL_I7300_MCH_ERR
);
972 edac_dbg(1, "System Address, processor bus- PCI Bus ID: %s %x:%x\n",
973 pci_name(pvt
->pci_dev_16_0_fsb_ctlr
),
974 pvt
->pci_dev_16_0_fsb_ctlr
->vendor
,
975 pvt
->pci_dev_16_0_fsb_ctlr
->device
);
976 edac_dbg(1, "Branchmap, control and errors - PCI Bus ID: %s %x:%x\n",
977 pci_name(pvt
->pci_dev_16_1_fsb_addr_map
),
978 pvt
->pci_dev_16_1_fsb_addr_map
->vendor
,
979 pvt
->pci_dev_16_1_fsb_addr_map
->device
);
980 edac_dbg(1, "FSB Error Regs - PCI Bus ID: %s %x:%x\n",
981 pci_name(pvt
->pci_dev_16_2_fsb_err_regs
),
982 pvt
->pci_dev_16_2_fsb_err_regs
->vendor
,
983 pvt
->pci_dev_16_2_fsb_err_regs
->device
);
985 pvt
->pci_dev_2x_0_fbd_branch
[0] = pci_get_device(PCI_VENDOR_ID_INTEL
,
986 PCI_DEVICE_ID_INTEL_I7300_MCH_FB0
,
988 if (!pvt
->pci_dev_2x_0_fbd_branch
[0]) {
989 i7300_printk(KERN_ERR
,
990 "MC: 'BRANCH 0' device not found:"
991 "vendor 0x%x device 0x%x Func 0 (broken BIOS?)\n",
992 PCI_VENDOR_ID_INTEL
, PCI_DEVICE_ID_INTEL_I7300_MCH_FB0
);
996 pvt
->pci_dev_2x_0_fbd_branch
[1] = pci_get_device(PCI_VENDOR_ID_INTEL
,
997 PCI_DEVICE_ID_INTEL_I7300_MCH_FB1
,
999 if (!pvt
->pci_dev_2x_0_fbd_branch
[1]) {
1000 i7300_printk(KERN_ERR
,
1001 "MC: 'BRANCH 1' device not found:"
1002 "vendor 0x%x device 0x%x Func 0 "
1004 PCI_VENDOR_ID_INTEL
,
1005 PCI_DEVICE_ID_INTEL_I7300_MCH_FB1
);
1012 i7300_put_devices(mci
);
1017 * i7300_init_one() - Probe for one instance of the device
1018 * @pdev: struct pci_dev pointer
1019 * @id: struct pci_device_id pointer - currently unused
1021 static int i7300_init_one(struct pci_dev
*pdev
, const struct pci_device_id
*id
)
1023 struct mem_ctl_info
*mci
;
1024 struct edac_mc_layer layers
[3];
1025 struct i7300_pvt
*pvt
;
1028 /* wake up device */
1029 rc
= pci_enable_device(pdev
);
1033 edac_dbg(0, "MC: pdev bus %u dev=0x%x fn=0x%x\n",
1035 PCI_SLOT(pdev
->devfn
), PCI_FUNC(pdev
->devfn
));
1037 /* We only are looking for func 0 of the set */
1038 if (PCI_FUNC(pdev
->devfn
) != 0)
1041 /* allocate a new MC control structure */
1042 layers
[0].type
= EDAC_MC_LAYER_BRANCH
;
1043 layers
[0].size
= MAX_BRANCHES
;
1044 layers
[0].is_virt_csrow
= false;
1045 layers
[1].type
= EDAC_MC_LAYER_CHANNEL
;
1046 layers
[1].size
= MAX_CH_PER_BRANCH
;
1047 layers
[1].is_virt_csrow
= true;
1048 layers
[2].type
= EDAC_MC_LAYER_SLOT
;
1049 layers
[2].size
= MAX_SLOTS
;
1050 layers
[2].is_virt_csrow
= true;
1051 mci
= edac_mc_alloc(0, ARRAY_SIZE(layers
), layers
, sizeof(*pvt
));
1055 edac_dbg(0, "MC: mci = %p\n", mci
);
1057 mci
->pdev
= &pdev
->dev
; /* record ptr to the generic device */
1059 pvt
= mci
->pvt_info
;
1060 pvt
->pci_dev_16_0_fsb_ctlr
= pdev
; /* Record this device in our private */
1062 pvt
->tmp_prt_buffer
= kmalloc(PAGE_SIZE
, GFP_KERNEL
);
1063 if (!pvt
->tmp_prt_buffer
) {
1068 /* 'get' the pci devices we want to reserve for our use */
1069 if (i7300_get_devices(mci
))
1073 mci
->mtype_cap
= MEM_FLAG_FB_DDR2
;
1074 mci
->edac_ctl_cap
= EDAC_FLAG_NONE
;
1075 mci
->edac_cap
= EDAC_FLAG_NONE
;
1076 mci
->mod_name
= "i7300_edac.c";
1077 mci
->ctl_name
= i7300_devs
[0].ctl_name
;
1078 mci
->dev_name
= pci_name(pdev
);
1079 mci
->ctl_page_to_phys
= NULL
;
1081 /* Set the function pointer to an actual operation function */
1082 mci
->edac_check
= i7300_check_error
;
1084 /* initialize the MC control structure 'csrows' table
1085 * with the mapping and control information */
1086 if (i7300_get_mc_regs(mci
)) {
1087 edac_dbg(0, "MC: Setting mci->edac_cap to EDAC_FLAG_NONE because i7300_init_csrows() returned nonzero value\n");
1088 mci
->edac_cap
= EDAC_FLAG_NONE
; /* no csrows found */
1090 edac_dbg(1, "MC: Enable error reporting now\n");
1091 i7300_enable_error_reporting(mci
);
1094 /* add this new MC control structure to EDAC's list of MCs */
1095 if (edac_mc_add_mc(mci
)) {
1096 edac_dbg(0, "MC: failed edac_mc_add_mc()\n");
1097 /* FIXME: perhaps some code should go here that disables error
1098 * reporting if we just enabled it
1103 i7300_clear_error(mci
);
1105 /* allocating generic PCI control info */
1106 i7300_pci
= edac_pci_create_generic_ctl(&pdev
->dev
, EDAC_MOD_STR
);
1109 "%s(): Unable to create PCI control\n",
1112 "%s(): PCI error report via EDAC not setup\n",
1118 /* Error exit unwinding stack */
1121 i7300_put_devices(mci
);
1124 kfree(pvt
->tmp_prt_buffer
);
1130 * i7300_remove_one() - Remove the driver
1131 * @pdev: struct pci_dev pointer
1133 static void i7300_remove_one(struct pci_dev
*pdev
)
1135 struct mem_ctl_info
*mci
;
1141 edac_pci_release_generic_ctl(i7300_pci
);
1143 mci
= edac_mc_del_mc(&pdev
->dev
);
1147 tmp
= ((struct i7300_pvt
*)mci
->pvt_info
)->tmp_prt_buffer
;
1149 /* retrieve references to resources, and free those resources */
1150 i7300_put_devices(mci
);
1157 * pci_device_id: table for which devices we are looking for
1159 * Has only 8086:360c PCI ID
1161 static const struct pci_device_id i7300_pci_tbl
[] = {
1162 {PCI_DEVICE(PCI_VENDOR_ID_INTEL
, PCI_DEVICE_ID_INTEL_I7300_MCH_ERR
)},
1163 {0,} /* 0 terminated list. */
1166 MODULE_DEVICE_TABLE(pci
, i7300_pci_tbl
);
1169 * i7300_driver: pci_driver structure for this module
1171 static struct pci_driver i7300_driver
= {
1172 .name
= "i7300_edac",
1173 .probe
= i7300_init_one
,
1174 .remove
= i7300_remove_one
,
1175 .id_table
= i7300_pci_tbl
,
1179 * i7300_init() - Registers the driver
1181 static int __init
i7300_init(void)
1187 /* Ensure that the OPSTATE is set correctly for POLL or NMI */
1190 pci_rc
= pci_register_driver(&i7300_driver
);
1192 return (pci_rc
< 0) ? pci_rc
: 0;
1196 * i7300_init() - Unregisters the driver
1198 static void __exit
i7300_exit(void)
1201 pci_unregister_driver(&i7300_driver
);
1204 module_init(i7300_init
);
1205 module_exit(i7300_exit
);
1207 MODULE_LICENSE("GPL");
1208 MODULE_AUTHOR("Mauro Carvalho Chehab");
1209 MODULE_AUTHOR("Red Hat Inc. (http://www.redhat.com)");
1210 MODULE_DESCRIPTION("MC Driver for Intel I7300 memory controllers - "
1213 module_param(edac_op_state
, int, 0444);
1214 MODULE_PARM_DESC(edac_op_state
, "EDAC Error Reporting state: 0=Poll,1=NMI");