]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blame - drivers/edac/i7300_edac.c
i7300_edac: Properly detect the type of error correction
[mirror_ubuntu-artful-kernel.git] / drivers / edac / i7300_edac.c
CommitLineData
fcaf780b
MCC
1/*
2 * Intel 7300 class Memory Controllers kernel module (Clarksboro)
3 *
4 * This file may be distributed under the terms of the
5 * GNU General Public License version 2 only.
6 *
7 * Copyright (c) 2010 by:
8 * Mauro Carvalho Chehab <mchehab@redhat.com>
9 *
10 * Red Hat Inc. http://www.redhat.com
11 *
12 * Intel 7300 Chipset Memory Controller Hub (MCH) - Datasheet
13 * http://www.intel.com/Assets/PDF/datasheet/318082.pdf
14 *
15 * TODO: The chipset allow checking for PCI Express errors also. Currently,
16 * the driver covers only memory error errors
17 *
18 * This driver uses "csrows" EDAC attribute to represent DIMM slot#
19 */
20
21#include <linux/module.h>
22#include <linux/init.h>
23#include <linux/pci.h>
24#include <linux/pci_ids.h>
25#include <linux/slab.h>
26#include <linux/edac.h>
27#include <linux/mmzone.h>
28
29#include "edac_core.h"
30
31/*
32 * Alter this version for the I7300 module when modifications are made
33 */
34#define I7300_REVISION " Ver: 1.0.0 " __DATE__
35
36#define EDAC_MOD_STR "i7300_edac"
37
38#define i7300_printk(level, fmt, arg...) \
39 edac_printk(level, "i7300", fmt, ##arg)
40
41#define i7300_mc_printk(mci, level, fmt, arg...) \
42 edac_mc_chipset_printk(mci, level, "i7300", fmt, ##arg)
43
44/*
45 * Memory topology is organized as:
46 * Branch 0 - 2 channels: channels 0 and 1 (FDB0 PCI dev 21.0)
47 * Branch 1 - 2 channels: channels 2 and 3 (FDB1 PCI dev 22.0)
48 * Each channel can have to 8 DIMM sets (called as SLOTS)
49 * Slots should generally be filled in pairs
50 * Except on Single Channel mode of operation
51 * just slot 0/channel0 filled on this mode
52 * On normal operation mode, the two channels on a branch should be
c3af2eaf 53 * filled together for the same SLOT#
fcaf780b
MCC
54 * When in mirrored mode, Branch 1 replicate memory at Branch 0, so, the four
55 * channels on both branches should be filled
56 */
57
58/* Limits for i7300 */
59#define MAX_SLOTS 8
60#define MAX_BRANCHES 2
61#define MAX_CH_PER_BRANCH 2
62#define MAX_CHANNELS (MAX_CH_PER_BRANCH * MAX_BRANCHES)
63#define MAX_MIR 3
64
65#define to_channel(ch, branch) ((((branch)) << 1) | (ch))
66
67#define to_csrow(slot, ch, branch) \
68 (to_channel(ch, branch) | ((slot) << 2))
69
c3af2eaf
MCC
70/*
71 * I7300 devices
fcaf780b
MCC
72 * All 3 functions of Device 16 (0,1,2) share the SAME DID and
73 * uses PCI_DEVICE_ID_INTEL_I7300_MCH_ERR for device 16 (0,1,2),
74 * PCI_DEVICE_ID_INTEL_I7300_MCH_FB0 and PCI_DEVICE_ID_INTEL_I7300_MCH_FB1
75 * for device 21 (0,1).
c3af2eaf
MCC
76 */
77
78/****************************************************
79 * i7300 Register definitions for memory enumberation
80 ****************************************************/
81
82/*
83 * Device 16,
84 * Function 0: System Address (not documented)
85 * Function 1: Memory Branch Map, Control, Errors Register
fcaf780b
MCC
86 */
87
88 /* OFFSETS for Function 0 */
af3d8831
MCC
89#define AMBASE 0x48 /* AMB Mem Mapped Reg Region Base */
90#define MAXCH 0x56 /* Max Channel Number */
91#define MAXDIMMPERCH 0x57 /* Max DIMM PER Channel Number */
fcaf780b
MCC
92
93 /* OFFSETS for Function 1 */
af3d8831 94#define MC_SETTINGS 0x40
bb81a216
MCC
95 #define IS_MIRRORED(mc) ((mc) & (1 << 16))
96 #define IS_ECC_ENABLED(mc) ((mc) & (1 << 5))
97 #define IS_RETRY_ENABLED(mc) ((mc) & (1 << 31))
98 #define IS_SCRBALGO_ENHANCED(mc) ((mc) & (1 << 8))
fcaf780b 99
bb81a216
MCC
100#define MC_SETTINGS_A 0x58
101 #define IS_SINGLE_MODE(mca) ((mca) & (1 << 14))
d7de2bdb 102
af3d8831
MCC
103#define TOLM 0x6C
104#define REDMEMB 0x7C
105
106#define MIR0 0x80
107#define MIR1 0x84
108#define MIR2 0x88
fcaf780b 109
fcaf780b
MCC
110/*
111 * Note: Other Intel EDAC drivers use AMBPRESENT to identify if the available
112 * memory. From datasheet item 7.3.1 (FB-DIMM technology & organization), it
113 * seems that we cannot use this information directly for the same usage.
114 * Each memory slot may have up to 2 AMB interfaces, one for income and another
115 * for outcome interface to the next slot.
116 * For now, the driver just stores the AMB present registers, but rely only at
117 * the MTR info to detect memory.
118 * Datasheet is also not clear about how to map each AMBPRESENT registers to
119 * one of the 4 available channels.
120 */
121#define AMBPRESENT_0 0x64
122#define AMBPRESENT_1 0x66
123
124const static u16 mtr_regs [MAX_SLOTS] = {
125 0x80, 0x84, 0x88, 0x8c,
126 0x82, 0x86, 0x8a, 0x8e
127};
128
129/* Defines to extract the vaious fields from the
130 * MTRx - Memory Technology Registers
131 */
132#define MTR_DIMMS_PRESENT(mtr) ((mtr) & (1 << 8))
133#define MTR_DIMMS_ETHROTTLE(mtr) ((mtr) & (1 << 7))
134#define MTR_DRAM_WIDTH(mtr) (((mtr) & (1 << 6)) ? 8 : 4)
135#define MTR_DRAM_BANKS(mtr) (((mtr) & (1 << 5)) ? 8 : 4)
136#define MTR_DIMM_RANKS(mtr) (((mtr) & (1 << 4)) ? 1 : 0)
137#define MTR_DIMM_ROWS(mtr) (((mtr) >> 2) & 0x3)
138#define MTR_DRAM_BANKS_ADDR_BITS 2
139#define MTR_DIMM_ROWS_ADDR_BITS(mtr) (MTR_DIMM_ROWS(mtr) + 13)
140#define MTR_DIMM_COLS(mtr) ((mtr) & 0x3)
141#define MTR_DIMM_COLS_ADDR_BITS(mtr) (MTR_DIMM_COLS(mtr) + 10)
142
fcaf780b
MCC
143#ifdef CONFIG_EDAC_DEBUG
144/* MTR NUMROW */
145static const char *numrow_toString[] = {
146 "8,192 - 13 rows",
147 "16,384 - 14 rows",
148 "32,768 - 15 rows",
149 "65,536 - 16 rows"
150};
151
152/* MTR NUMCOL */
153static const char *numcol_toString[] = {
154 "1,024 - 10 columns",
155 "2,048 - 11 columns",
156 "4,096 - 12 columns",
157 "reserved"
158};
159#endif
160
c3af2eaf
MCC
161/************************************************
162 * i7300 Register definitions for error detection
163 ************************************************/
164/*
165 * Device 16.2: Global Error Registers
166 */
167
5de6e07e
MCC
168#define FERR_GLOBAL_HI 0x48
169static const char *ferr_global_hi_name[] = {
170 [3] = "FSB 3 Fatal Error",
171 [2] = "FSB 2 Fatal Error",
172 [1] = "FSB 1 Fatal Error",
173 [0] = "FSB 0 Fatal Error",
174};
175#define ferr_global_hi_is_fatal(errno) 1
176
c3af2eaf 177#define FERR_GLOBAL_LO 0x40
5de6e07e 178static const char *ferr_global_lo_name[] = {
c3af2eaf
MCC
179 [31] = "Internal MCH Fatal Error",
180 [30] = "Intel QuickData Technology Device Fatal Error",
181 [29] = "FSB1 Fatal Error",
182 [28] = "FSB0 Fatal Error",
183 [27] = "FBD Channel 3 Fatal Error",
184 [26] = "FBD Channel 2 Fatal Error",
185 [25] = "FBD Channel 1 Fatal Error",
186 [24] = "FBD Channel 0 Fatal Error",
187 [23] = "PCI Express Device 7Fatal Error",
188 [22] = "PCI Express Device 6 Fatal Error",
189 [21] = "PCI Express Device 5 Fatal Error",
190 [20] = "PCI Express Device 4 Fatal Error",
191 [19] = "PCI Express Device 3 Fatal Error",
192 [18] = "PCI Express Device 2 Fatal Error",
193 [17] = "PCI Express Device 1 Fatal Error",
194 [16] = "ESI Fatal Error",
195 [15] = "Internal MCH Non-Fatal Error",
196 [14] = "Intel QuickData Technology Device Non Fatal Error",
197 [13] = "FSB1 Non-Fatal Error",
198 [12] = "FSB 0 Non-Fatal Error",
199 [11] = "FBD Channel 3 Non-Fatal Error",
200 [10] = "FBD Channel 2 Non-Fatal Error",
201 [9] = "FBD Channel 1 Non-Fatal Error",
202 [8] = "FBD Channel 0 Non-Fatal Error",
203 [7] = "PCI Express Device 7 Non-Fatal Error",
204 [6] = "PCI Express Device 6 Non-Fatal Error",
205 [5] = "PCI Express Device 5 Non-Fatal Error",
206 [4] = "PCI Express Device 4 Non-Fatal Error",
207 [3] = "PCI Express Device 3 Non-Fatal Error",
208 [2] = "PCI Express Device 2 Non-Fatal Error",
209 [1] = "PCI Express Device 1 Non-Fatal Error",
210 [0] = "ESI Non-Fatal Error",
211};
5de6e07e 212#define ferr_global_lo_is_fatal(errno) ((errno < 16) ? 0 : 1)
fcaf780b
MCC
213
214/* Device name and register DID (Device ID) */
215struct i7300_dev_info {
216 const char *ctl_name; /* name for this device */
217 u16 fsb_mapping_errors; /* DID for the branchmap,control */
218};
219
220/* Table of devices attributes supported by this driver */
221static const struct i7300_dev_info i7300_devs[] = {
222 {
223 .ctl_name = "I7300",
224 .fsb_mapping_errors = PCI_DEVICE_ID_INTEL_I7300_MCH_ERR,
225 },
226};
227
228struct i7300_dimm_info {
229 int megabytes; /* size, 0 means not present */
230};
231
232/* driver private data structure */
233struct i7300_pvt {
3e57eef6
MCC
234 struct pci_dev *pci_dev_16_0_fsb_ctlr; /* 16.0 */
235 struct pci_dev *pci_dev_16_1_fsb_addr_map; /* 16.1 */
236 struct pci_dev *pci_dev_16_2_fsb_err_regs; /* 16.2 */
237 struct pci_dev *pci_dev_2x_0_fbd_branch[MAX_BRANCHES]; /* 21.0 and 22.0 */
fcaf780b
MCC
238
239 u16 tolm; /* top of low memory */
240 u64 ambase; /* AMB BAR */
241
bb81a216
MCC
242 u32 mc_settings; /* Report several settings */
243 u32 mc_settings_a;
244
245 u16 mir[MAX_MIR]; /* Memory Interleave Reg*/
fcaf780b
MCC
246
247 u16 mtr[MAX_SLOTS][MAX_BRANCHES]; /* Memory Technlogy Reg */
248 u16 ambpresent[MAX_CHANNELS]; /* AMB present regs */
249
250 /* DIMM information matrix, allocating architecture maximums */
251 struct i7300_dimm_info dimm_info[MAX_SLOTS][MAX_CHANNELS];
252};
253
fcaf780b
MCC
254/* FIXME: Why do we need to have this static? */
255static struct edac_pci_ctl_info *i7300_pci;
256
5de6e07e
MCC
257/********************************************
258 * i7300 Functions related to error detection
259 ********************************************/
fcaf780b 260
5de6e07e
MCC
261struct i7300_error_info {
262 int dummy; /* FIXME */
263};
264
265const char *get_err_from_table(const char *table[], int size, int pos)
fcaf780b 266{
5de6e07e
MCC
267 if (pos >= size)
268 return "Reserved";
269
270 return table[pos];
fcaf780b
MCC
271}
272
5de6e07e
MCC
273#define GET_ERR_FROM_TABLE(table, pos) \
274 get_err_from_table(table, ARRAY_SIZE(table), pos)
275
fcaf780b
MCC
276/*
277 * i7300_get_error_info Retrieve the hardware error information from
278 * the hardware and cache it in the 'info'
279 * structure
280 */
281static void i7300_get_error_info(struct mem_ctl_info *mci,
282 struct i7300_error_info *info)
283{
fcaf780b
MCC
284}
285
286/*
5de6e07e
MCC
287 * i7300_process_error_global Retrieve the hardware error information from
288 * the hardware and cache it in the 'info'
289 * structure
fcaf780b 290 */
5de6e07e
MCC
291static void i7300_process_error_global(struct mem_ctl_info *mci,
292 struct i7300_error_info *info)
fcaf780b 293{
5de6e07e
MCC
294 struct i7300_pvt *pvt;
295 u32 errnum, value;
296 unsigned long errors;
297 const char *specific;
298 bool is_fatal;
fcaf780b 299
5de6e07e 300 pvt = mci->pvt_info;
fcaf780b 301
5de6e07e
MCC
302 /* read in the 1st FATAL error register */
303 pci_read_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
304 FERR_GLOBAL_HI, &value);
305 if (unlikely(value)) {
306 errors = value;
307 errnum = find_first_bit(&errors,
308 ARRAY_SIZE(ferr_global_hi_name));
309 specific = GET_ERR_FROM_TABLE(ferr_global_hi_name, errnum);
310 is_fatal = ferr_global_hi_is_fatal(errnum);
86002324
MCC
311
312 /* Clear the error bit */
313 pci_write_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
314 FERR_GLOBAL_HI, value);
315
5de6e07e 316 goto error_global;
fcaf780b
MCC
317 }
318
5de6e07e
MCC
319 pci_read_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
320 FERR_GLOBAL_LO, &value);
321 if (unlikely(value)) {
322 errors = value;
323 errnum = find_first_bit(&errors,
324 ARRAY_SIZE(ferr_global_lo_name));
325 specific = GET_ERR_FROM_TABLE(ferr_global_lo_name, errnum);
326 is_fatal = ferr_global_lo_is_fatal(errnum);
86002324
MCC
327
328 /* Clear the error bit */
329 pci_write_config_dword(pvt->pci_dev_16_2_fsb_err_regs,
330 FERR_GLOBAL_LO, value);
331
5de6e07e
MCC
332 goto error_global;
333 }
334 return;
fcaf780b 335
5de6e07e
MCC
336error_global:
337 i7300_mc_printk(mci, KERN_EMERG, "%s misc error: %s\n",
338 is_fatal ? "Fatal" : "NOT fatal", specific);
fcaf780b
MCC
339}
340
341/*
5de6e07e
MCC
342 * i7300_process_error_info Retrieve the hardware error information from
343 * the hardware and cache it in the 'info'
344 * structure
fcaf780b
MCC
345 */
346static void i7300_process_error_info(struct mem_ctl_info *mci,
5de6e07e
MCC
347 struct i7300_error_info *info)
348{
349 i7300_process_error_global(mci, info);
350};
fcaf780b
MCC
351
352/*
353 * i7300_clear_error Retrieve any error from the hardware
354 * but do NOT process that error.
355 * Used for 'clearing' out of previous errors
356 * Called by the Core module.
357 */
358static void i7300_clear_error(struct mem_ctl_info *mci)
359{
360 struct i7300_error_info info;
361
362 i7300_get_error_info(mci, &info);
363}
364
365/*
366 * i7300_check_error Retrieve and process errors reported by the
367 * hardware. Called by the Core module.
368 */
369static void i7300_check_error(struct mem_ctl_info *mci)
370{
371 struct i7300_error_info info;
372 debugf4("MC%d: " __FILE__ ": %s()\n", mci->mc_idx, __func__);
5de6e07e 373
fcaf780b
MCC
374 i7300_get_error_info(mci, &info);
375 i7300_process_error_info(mci, &info);
376}
377
378/*
379 * i7300_enable_error_reporting
380 * Turn on the memory reporting features of the hardware
381 */
382static void i7300_enable_error_reporting(struct mem_ctl_info *mci)
383{
fcaf780b 384}
5de6e07e
MCC
385
386/************************************************
387 * i7300 Functions related to memory enumberation
388 ************************************************/
fcaf780b
MCC
389
390/*
391 * determine_mtr(pvt, csrow, channel)
392 *
393 * return the proper MTR register as determine by the csrow and desired channel
394 */
395static int decode_mtr(struct i7300_pvt *pvt,
396 int slot, int ch, int branch,
397 struct i7300_dimm_info *dinfo,
398 struct csrow_info *p_csrow)
399{
400 int mtr, ans, addrBits, channel;
401
402 channel = to_channel(ch, branch);
403
404 mtr = pvt->mtr[slot][branch];
405 ans = MTR_DIMMS_PRESENT(mtr) ? 1 : 0;
406
407 debugf2("\tMTR%d CH%d: DIMMs are %s (mtr)\n",
408 slot, channel,
409 ans ? "Present" : "NOT Present");
410
411 /* Determine if there is a DIMM present in this DIMM slot */
412
413#if 0
414 if (!amb_present || !ans)
415 return 0;
416#else
417 if (!ans)
418 return 0;
419#endif
420
421 /* Start with the number of bits for a Bank
422 * on the DRAM */
423 addrBits = MTR_DRAM_BANKS_ADDR_BITS;
424 /* Add thenumber of ROW bits */
425 addrBits += MTR_DIMM_ROWS_ADDR_BITS(mtr);
426 /* add the number of COLUMN bits */
427 addrBits += MTR_DIMM_COLS_ADDR_BITS(mtr);
428 /* add the number of RANK bits */
429 addrBits += MTR_DIMM_RANKS(mtr);
430
431 addrBits += 6; /* add 64 bits per DIMM */
432 addrBits -= 20; /* divide by 2^^20 */
433 addrBits -= 3; /* 8 bits per bytes */
434
435 dinfo->megabytes = 1 << addrBits;
436
437 debugf2("\t\tWIDTH: x%d\n", MTR_DRAM_WIDTH(mtr));
438
439 debugf2("\t\tELECTRICAL THROTTLING is %s\n",
440 MTR_DIMMS_ETHROTTLE(mtr) ? "enabled" : "disabled");
441
442 debugf2("\t\tNUMBANK: %d bank(s)\n", MTR_DRAM_BANKS(mtr));
443 debugf2("\t\tNUMRANK: %s\n", MTR_DIMM_RANKS(mtr) ? "double" : "single");
444 debugf2("\t\tNUMROW: %s\n", numrow_toString[MTR_DIMM_ROWS(mtr)]);
445 debugf2("\t\tNUMCOL: %s\n", numcol_toString[MTR_DIMM_COLS(mtr)]);
446 debugf2("\t\tSIZE: %d MB\n", dinfo->megabytes);
447
448 p_csrow->grain = 8;
449 p_csrow->nr_pages = dinfo->megabytes << 8;
450 p_csrow->mtype = MEM_FB_DDR2;
116389ed
MCC
451
452 /*
15154c57 453 * The type of error detection actually depends of the
116389ed 454 * mode of operation. When it is just one single memory chip, at
15154c57
MCC
455 * socket 0, channel 0, it uses 8-byte-over-32-byte SECDED+ code.
456 * In normal or mirrored mode, it uses Lockstep mode,
116389ed
MCC
457 * with the possibility of using an extended algorithm for x8 memories
458 * See datasheet Sections 7.3.6 to 7.3.8
459 */
15154c57
MCC
460
461 if (IS_SINGLE_MODE(pvt->mc_settings_a)) {
462 p_csrow->edac_mode = EDAC_SECDED;
463 debugf0("ECC code is 8-byte-over-32-byte SECDED+ code\n");
464 } else {
465 debugf0("ECC code is on Lockstep mode\n");
466 if (MTR_DRAM_WIDTH(mtr))
467 p_csrow->edac_mode = EDAC_S8ECD8ED;
468 else
469 p_csrow->edac_mode = EDAC_S4ECD4ED;
470 }
fcaf780b
MCC
471
472 /* ask what device type on this row */
d7de2bdb
MCC
473 if (MTR_DRAM_WIDTH(mtr)) {
474 debugf0("Scrub algorithm for x8 is on %s mode\n",
475 IS_SCRBALGO_ENHANCED(pvt->mc_settings) ?
476 "enhanced" : "normal");
477
fcaf780b 478 p_csrow->dtype = DEV_X8;
d7de2bdb 479 } else
fcaf780b
MCC
480 p_csrow->dtype = DEV_X4;
481
482 return mtr;
483}
484
485/*
486 * print_dimm_size
487 *
488 * also will output a DIMM matrix map, if debug is enabled, for viewing
489 * how the DIMMs are populated
490 */
491static void print_dimm_size(struct i7300_pvt *pvt)
492{
493 struct i7300_dimm_info *dinfo;
494 char *p, *mem_buffer;
495 int space, n;
496 int channel, slot;
497
498 space = PAGE_SIZE;
499 mem_buffer = p = kmalloc(space, GFP_KERNEL);
500 if (p == NULL) {
501 i7300_printk(KERN_ERR, "MC: %s:%s() kmalloc() failed\n",
502 __FILE__, __func__);
503 return;
504 }
505
506 n = snprintf(p, space, " ");
507 p += n;
508 space -= n;
509 for (channel = 0; channel < MAX_CHANNELS; channel++) {
510 n = snprintf(p, space, "channel %d | ", channel);
511 p += n;
512 space -= n;
513 }
514 debugf2("%s\n", mem_buffer);
515 p = mem_buffer;
516 space = PAGE_SIZE;
517 n = snprintf(p, space, "-------------------------------"
518 "------------------------------");
519 p += n;
520 space -= n;
521 debugf2("%s\n", mem_buffer);
522 p = mem_buffer;
523 space = PAGE_SIZE;
524
525 for (slot = 0; slot < MAX_SLOTS; slot++) {
526 n = snprintf(p, space, "csrow/SLOT %d ", slot);
527 p += n;
528 space -= n;
529
530 for (channel = 0; channel < MAX_CHANNELS; channel++) {
531 dinfo = &pvt->dimm_info[slot][channel];
532 n = snprintf(p, space, "%4d MB | ", dinfo->megabytes);
533 p += n;
534 space -= n;
535 }
536
537 debugf2("%s\n", mem_buffer);
538 p = mem_buffer;
539 space = PAGE_SIZE;
540 }
541
542 n = snprintf(p, space, "-------------------------------"
543 "------------------------------");
544 p += n;
545 space -= n;
546 debugf2("%s\n", mem_buffer);
547 p = mem_buffer;
548 space = PAGE_SIZE;
549
550 kfree(mem_buffer);
551}
552
553/*
554 * i7300_init_csrows Initialize the 'csrows' table within
555 * the mci control structure with the
556 * addressing of memory.
557 *
558 * return:
559 * 0 success
560 * 1 no actual memory found on this MC
561 */
562static int i7300_init_csrows(struct mem_ctl_info *mci)
563{
564 struct i7300_pvt *pvt;
565 struct i7300_dimm_info *dinfo;
566 struct csrow_info *p_csrow;
567 int empty;
568 int mtr;
569 int ch, branch, slot, channel;
570
571 pvt = mci->pvt_info;
572
573 empty = 1; /* Assume NO memory */
574
575 debugf2("Memory Technology Registers:\n");
576
577 /* Get the AMB present registers for the four channels */
578 for (branch = 0; branch < MAX_BRANCHES; branch++) {
579 /* Read and dump branch 0's MTRs */
580 channel = to_channel(0, branch);
3e57eef6 581 pci_read_config_word(pvt->pci_dev_2x_0_fbd_branch[branch], AMBPRESENT_0,
fcaf780b
MCC
582 &pvt->ambpresent[channel]);
583 debugf2("\t\tAMB-present CH%d = 0x%x:\n",
584 channel, pvt->ambpresent[channel]);
585
586 channel = to_channel(1, branch);
3e57eef6 587 pci_read_config_word(pvt->pci_dev_2x_0_fbd_branch[branch], AMBPRESENT_1,
fcaf780b
MCC
588 &pvt->ambpresent[channel]);
589 debugf2("\t\tAMB-present CH%d = 0x%x:\n",
590 channel, pvt->ambpresent[channel]);
591 }
592
593 /* Get the set of MTR[0-7] regs by each branch */
594 for (slot = 0; slot < MAX_SLOTS; slot++) {
595 int where = mtr_regs[slot];
596 for (branch = 0; branch < MAX_BRANCHES; branch++) {
3e57eef6 597 pci_read_config_word(pvt->pci_dev_2x_0_fbd_branch[branch],
fcaf780b
MCC
598 where,
599 &pvt->mtr[slot][branch]);
600 for (ch = 0; ch < MAX_BRANCHES; ch++) {
601 int channel = to_channel(ch, branch);
602
603 dinfo = &pvt->dimm_info[slot][channel];
604 p_csrow = &mci->csrows[slot];
605
606 mtr = decode_mtr(pvt, slot, ch, branch,
607 dinfo, p_csrow);
608 /* if no DIMMS on this row, continue */
609 if (!MTR_DIMMS_PRESENT(mtr))
610 continue;
611
612 p_csrow->csrow_idx = slot;
613
614 /* FAKE OUT VALUES, FIXME */
615 p_csrow->first_page = 0 + slot * 20;
616 p_csrow->last_page = 9 + slot * 20;
617 p_csrow->page_mask = 0xfff;
618
619 empty = 0;
620 }
621 }
622 }
623
624 return empty;
625}
626
627static void decode_mir(int mir_no, u16 mir[MAX_MIR])
628{
629 if (mir[mir_no] & 3)
630 debugf2("MIR%d: limit= 0x%x Branch(es) that participate: %s %s\n",
631 mir_no,
632 (mir[mir_no] >> 4) & 0xfff,
633 (mir[mir_no] & 1) ? "B0" : "",
634 (mir[mir_no] & 2) ? "B1": "");
635}
636
637/*
638 * i7300_get_mc_regs read in the necessary registers and
639 * cache locally
640 *
641 * Fills in the private data members
642 */
643static int i7300_get_mc_regs(struct mem_ctl_info *mci)
644{
645 struct i7300_pvt *pvt;
646 u32 actual_tolm;
647 int i, rc;
648
649 pvt = mci->pvt_info;
650
3e57eef6 651 pci_read_config_dword(pvt->pci_dev_16_0_fsb_ctlr, AMBASE,
fcaf780b
MCC
652 (u32 *) &pvt->ambase);
653
654 debugf2("AMBASE= 0x%lx\n", (long unsigned int)pvt->ambase);
655
656 /* Get the Branch Map regs */
3e57eef6 657 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, TOLM, &pvt->tolm);
fcaf780b
MCC
658 pvt->tolm >>= 12;
659 debugf2("TOLM (number of 256M regions) =%u (0x%x)\n", pvt->tolm,
660 pvt->tolm);
661
662 actual_tolm = (u32) ((1000l * pvt->tolm) >> (30 - 28));
663 debugf2("Actual TOLM byte addr=%u.%03u GB (0x%x)\n",
664 actual_tolm/1000, actual_tolm % 1000, pvt->tolm << 28);
665
af3d8831 666 /* Get memory controller settings */
3e57eef6 667 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map, MC_SETTINGS,
af3d8831 668 &pvt->mc_settings);
bb81a216
MCC
669 pci_read_config_dword(pvt->pci_dev_16_1_fsb_addr_map, MC_SETTINGS_A,
670 &pvt->mc_settings_a);
d7de2bdb 671
bb81a216
MCC
672 if (IS_SINGLE_MODE(pvt->mc_settings_a))
673 debugf0("Memory controller operating on single mode\n");
674 else
675 debugf0("Memory controller operating on %s mode\n",
d7de2bdb 676 IS_MIRRORED(pvt->mc_settings) ? "mirrored" : "non-mirrored");
bb81a216 677
af3d8831 678 debugf0("Error detection is %s\n",
d7de2bdb
MCC
679 IS_ECC_ENABLED(pvt->mc_settings) ? "enabled" : "disabled");
680 debugf0("Retry is %s\n",
681 IS_RETRY_ENABLED(pvt->mc_settings) ? "enabled" : "disabled");
af3d8831
MCC
682
683 /* Get Memory Interleave Range registers */
3e57eef6
MCC
684 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, MIR0, &pvt->mir[0]);
685 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, MIR1, &pvt->mir[1]);
686 pci_read_config_word(pvt->pci_dev_16_1_fsb_addr_map, MIR2, &pvt->mir[2]);
fcaf780b
MCC
687
688 /* Decode the MIR regs */
689 for (i = 0; i < MAX_MIR; i++)
690 decode_mir(i, pvt->mir);
691
692 rc = i7300_init_csrows(mci);
693 if (rc < 0)
694 return rc;
695
696 /* Go and determine the size of each DIMM and place in an
697 * orderly matrix */
698 print_dimm_size(pvt);
699
700 return 0;
701}
702
5de6e07e
MCC
703/*************************************************
704 * i7300 Functions related to device probe/release
705 *************************************************/
706
fcaf780b
MCC
707/*
708 * i7300_put_devices 'put' all the devices that we have
709 * reserved via 'get'
710 */
711static void i7300_put_devices(struct mem_ctl_info *mci)
712{
713 struct i7300_pvt *pvt;
714 int branch;
715
716 pvt = mci->pvt_info;
717
718 /* Decrement usage count for devices */
719 for (branch = 0; branch < MAX_CH_PER_BRANCH; branch++)
3e57eef6
MCC
720 pci_dev_put(pvt->pci_dev_2x_0_fbd_branch[branch]);
721 pci_dev_put(pvt->pci_dev_16_2_fsb_err_regs);
722 pci_dev_put(pvt->pci_dev_16_1_fsb_addr_map);
fcaf780b
MCC
723}
724
725/*
726 * i7300_get_devices Find and perform 'get' operation on the MCH's
727 * device/functions we want to reference for this driver
728 *
729 * Need to 'get' device 16 func 1 and func 2
730 */
731static int i7300_get_devices(struct mem_ctl_info *mci, int dev_idx)
732{
733 struct i7300_pvt *pvt;
734 struct pci_dev *pdev;
735
736 pvt = mci->pvt_info;
737
738 /* Attempt to 'get' the MCH register we want */
739 pdev = NULL;
3e57eef6 740 while (!pvt->pci_dev_16_1_fsb_addr_map || !pvt->pci_dev_16_2_fsb_err_regs) {
fcaf780b
MCC
741 pdev = pci_get_device(PCI_VENDOR_ID_INTEL,
742 PCI_DEVICE_ID_INTEL_I7300_MCH_ERR, pdev);
743 if (!pdev) {
744 /* End of list, leave */
745 i7300_printk(KERN_ERR,
746 "'system address,Process Bus' "
747 "device not found:"
748 "vendor 0x%x device 0x%x ERR funcs "
749 "(broken BIOS?)\n",
750 PCI_VENDOR_ID_INTEL,
751 PCI_DEVICE_ID_INTEL_I7300_MCH_ERR);
752 goto error;
753 }
754
755 /* Store device 16 funcs 1 and 2 */
756 switch (PCI_FUNC(pdev->devfn)) {
757 case 1:
3e57eef6 758 pvt->pci_dev_16_1_fsb_addr_map = pdev;
fcaf780b
MCC
759 break;
760 case 2:
3e57eef6 761 pvt->pci_dev_16_2_fsb_err_regs = pdev;
fcaf780b
MCC
762 break;
763 }
764 }
765
766 debugf1("System Address, processor bus- PCI Bus ID: %s %x:%x\n",
3e57eef6
MCC
767 pci_name(pvt->pci_dev_16_0_fsb_ctlr),
768 pvt->pci_dev_16_0_fsb_ctlr->vendor, pvt->pci_dev_16_0_fsb_ctlr->device);
fcaf780b 769 debugf1("Branchmap, control and errors - PCI Bus ID: %s %x:%x\n",
3e57eef6
MCC
770 pci_name(pvt->pci_dev_16_1_fsb_addr_map),
771 pvt->pci_dev_16_1_fsb_addr_map->vendor, pvt->pci_dev_16_1_fsb_addr_map->device);
fcaf780b 772 debugf1("FSB Error Regs - PCI Bus ID: %s %x:%x\n",
3e57eef6
MCC
773 pci_name(pvt->pci_dev_16_2_fsb_err_regs),
774 pvt->pci_dev_16_2_fsb_err_regs->vendor, pvt->pci_dev_16_2_fsb_err_regs->device);
fcaf780b 775
3e57eef6 776 pvt->pci_dev_2x_0_fbd_branch[0] = pci_get_device(PCI_VENDOR_ID_INTEL,
fcaf780b
MCC
777 PCI_DEVICE_ID_INTEL_I7300_MCH_FB0,
778 NULL);
3e57eef6 779 if (!pvt->pci_dev_2x_0_fbd_branch[0]) {
fcaf780b
MCC
780 i7300_printk(KERN_ERR,
781 "MC: 'BRANCH 0' device not found:"
782 "vendor 0x%x device 0x%x Func 0 (broken BIOS?)\n",
783 PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_I7300_MCH_FB0);
784 goto error;
785 }
786
3e57eef6 787 pvt->pci_dev_2x_0_fbd_branch[1] = pci_get_device(PCI_VENDOR_ID_INTEL,
fcaf780b
MCC
788 PCI_DEVICE_ID_INTEL_I7300_MCH_FB1,
789 NULL);
3e57eef6 790 if (!pvt->pci_dev_2x_0_fbd_branch[1]) {
fcaf780b
MCC
791 i7300_printk(KERN_ERR,
792 "MC: 'BRANCH 1' device not found:"
793 "vendor 0x%x device 0x%x Func 0 "
794 "(broken BIOS?)\n",
795 PCI_VENDOR_ID_INTEL,
796 PCI_DEVICE_ID_INTEL_I7300_MCH_FB1);
797 goto error;
798 }
799
800 return 0;
801
802error:
803 i7300_put_devices(mci);
804 return -ENODEV;
805}
806
807/*
808 * i7300_probe1 Probe for ONE instance of device to see if it is
809 * present.
810 * return:
811 * 0 for FOUND a device
812 * < 0 for error code
813 */
814static int i7300_probe1(struct pci_dev *pdev, int dev_idx)
815{
816 struct mem_ctl_info *mci;
817 struct i7300_pvt *pvt;
818 int num_channels;
819 int num_dimms_per_channel;
820 int num_csrows;
821
822 if (dev_idx >= ARRAY_SIZE(i7300_devs))
823 return -EINVAL;
824
825 debugf0("MC: " __FILE__ ": %s(), pdev bus %u dev=0x%x fn=0x%x\n",
826 __func__,
827 pdev->bus->number,
828 PCI_SLOT(pdev->devfn), PCI_FUNC(pdev->devfn));
829
830 /* We only are looking for func 0 of the set */
831 if (PCI_FUNC(pdev->devfn) != 0)
832 return -ENODEV;
833
834 /* As we don't have a motherboard identification routine to determine
835 * actual number of slots/dimms per channel, we thus utilize the
836 * resource as specified by the chipset. Thus, we might have
837 * have more DIMMs per channel than actually on the mobo, but this
838 * allows the driver to support upto the chipset max, without
839 * some fancy mobo determination.
840 */
841 num_dimms_per_channel = MAX_SLOTS;
842 num_channels = MAX_CHANNELS;
843 num_csrows = MAX_SLOTS * MAX_CHANNELS;
844
845 debugf0("MC: %s(): Number of - Channels= %d DIMMS= %d CSROWS= %d\n",
846 __func__, num_channels, num_dimms_per_channel, num_csrows);
847
848 /* allocate a new MC control structure */
849 mci = edac_mc_alloc(sizeof(*pvt), num_csrows, num_channels, 0);
850
851 if (mci == NULL)
852 return -ENOMEM;
853
854 debugf0("MC: " __FILE__ ": %s(): mci = %p\n", __func__, mci);
855
856 mci->dev = &pdev->dev; /* record ptr to the generic device */
857
858 pvt = mci->pvt_info;
3e57eef6 859 pvt->pci_dev_16_0_fsb_ctlr = pdev; /* Record this device in our private */
fcaf780b
MCC
860
861 /* 'get' the pci devices we want to reserve for our use */
862 if (i7300_get_devices(mci, dev_idx))
863 goto fail0;
864
865 mci->mc_idx = 0;
866 mci->mtype_cap = MEM_FLAG_FB_DDR2;
867 mci->edac_ctl_cap = EDAC_FLAG_NONE;
868 mci->edac_cap = EDAC_FLAG_NONE;
869 mci->mod_name = "i7300_edac.c";
870 mci->mod_ver = I7300_REVISION;
871 mci->ctl_name = i7300_devs[dev_idx].ctl_name;
872 mci->dev_name = pci_name(pdev);
873 mci->ctl_page_to_phys = NULL;
874
fcaf780b
MCC
875 /* Set the function pointer to an actual operation function */
876 mci->edac_check = i7300_check_error;
fcaf780b
MCC
877
878 /* initialize the MC control structure 'csrows' table
879 * with the mapping and control information */
880 if (i7300_get_mc_regs(mci)) {
881 debugf0("MC: Setting mci->edac_cap to EDAC_FLAG_NONE\n"
882 " because i7300_init_csrows() returned nonzero "
883 "value\n");
884 mci->edac_cap = EDAC_FLAG_NONE; /* no csrows found */
885 } else {
fcaf780b
MCC
886 debugf1("MC: Enable error reporting now\n");
887 i7300_enable_error_reporting(mci);
fcaf780b
MCC
888 }
889
890 /* add this new MC control structure to EDAC's list of MCs */
891 if (edac_mc_add_mc(mci)) {
892 debugf0("MC: " __FILE__
893 ": %s(): failed edac_mc_add_mc()\n", __func__);
894 /* FIXME: perhaps some code should go here that disables error
895 * reporting if we just enabled it
896 */
897 goto fail1;
898 }
899
fcaf780b 900 i7300_clear_error(mci);
fcaf780b
MCC
901
902 /* allocating generic PCI control info */
903 i7300_pci = edac_pci_create_generic_ctl(&pdev->dev, EDAC_MOD_STR);
904 if (!i7300_pci) {
905 printk(KERN_WARNING
906 "%s(): Unable to create PCI control\n",
907 __func__);
908 printk(KERN_WARNING
909 "%s(): PCI error report via EDAC not setup\n",
910 __func__);
911 }
912
913 return 0;
914
915 /* Error exit unwinding stack */
916fail1:
917
918 i7300_put_devices(mci);
919
920fail0:
921 edac_mc_free(mci);
922 return -ENODEV;
923}
924
925/*
926 * i7300_init_one constructor for one instance of device
927 *
928 * returns:
929 * negative on error
930 * count (>= 0)
931 */
932static int __devinit i7300_init_one(struct pci_dev *pdev,
933 const struct pci_device_id *id)
934{
935 int rc;
936
937 debugf0("MC: " __FILE__ ": %s()\n", __func__);
938
939 /* wake up device */
940 rc = pci_enable_device(pdev);
941 if (rc == -EIO)
942 return rc;
943
944 /* now probe and enable the device */
945 return i7300_probe1(pdev, id->driver_data);
946}
947
948/*
949 * i7300_remove_one destructor for one instance of device
950 *
951 */
952static void __devexit i7300_remove_one(struct pci_dev *pdev)
953{
954 struct mem_ctl_info *mci;
955
956 debugf0(__FILE__ ": %s()\n", __func__);
957
958 if (i7300_pci)
959 edac_pci_release_generic_ctl(i7300_pci);
960
961 mci = edac_mc_del_mc(&pdev->dev);
962 if (!mci)
963 return;
964
965 /* retrieve references to resources, and free those resources */
966 i7300_put_devices(mci);
967
968 edac_mc_free(mci);
969}
970
971/*
972 * pci_device_id table for which devices we are looking for
973 *
974 * The "E500P" device is the first device supported.
975 */
976static const struct pci_device_id i7300_pci_tbl[] __devinitdata = {
977 {PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_I7300_MCH_ERR)},
978 {0,} /* 0 terminated list. */
979};
980
981MODULE_DEVICE_TABLE(pci, i7300_pci_tbl);
982
983/*
984 * i7300_driver pci_driver structure for this module
985 *
986 */
987static struct pci_driver i7300_driver = {
988 .name = "i7300_edac",
989 .probe = i7300_init_one,
990 .remove = __devexit_p(i7300_remove_one),
991 .id_table = i7300_pci_tbl,
992};
993
994/*
995 * i7300_init Module entry function
996 * Try to initialize this module for its devices
997 */
998static int __init i7300_init(void)
999{
1000 int pci_rc;
1001
1002 debugf2("MC: " __FILE__ ": %s()\n", __func__);
1003
1004 /* Ensure that the OPSTATE is set correctly for POLL or NMI */
1005 opstate_init();
1006
1007 pci_rc = pci_register_driver(&i7300_driver);
1008
1009 return (pci_rc < 0) ? pci_rc : 0;
1010}
1011
1012/*
1013 * i7300_exit() Module exit function
1014 * Unregister the driver
1015 */
1016static void __exit i7300_exit(void)
1017{
1018 debugf2("MC: " __FILE__ ": %s()\n", __func__);
1019 pci_unregister_driver(&i7300_driver);
1020}
1021
1022module_init(i7300_init);
1023module_exit(i7300_exit);
1024
1025MODULE_LICENSE("GPL");
1026MODULE_AUTHOR("Mauro Carvalho Chehab <mchehab@redhat.com>");
1027MODULE_AUTHOR("Red Hat Inc. (http://www.redhat.com)");
1028MODULE_DESCRIPTION("MC Driver for Intel I7300 memory controllers - "
1029 I7300_REVISION);
1030
1031module_param(edac_op_state, int, 0444);
1032MODULE_PARM_DESC(edac_op_state, "EDAC Error Reporting state: 0=Poll,1=NMI");