Merge branch 'for-next' of git://git.samba.org/sfrench/cifs-2.6
[deliverable/linux.git] / drivers / edac / i5100_edac.c
1 /*
2 * Intel 5100 Memory Controllers kernel module
3 *
4 * This file may be distributed under the terms of the
5 * GNU General Public License.
6 *
7 * This module is based on the following document:
8 *
9 * Intel 5100X Chipset Memory Controller Hub (MCH) - Datasheet
10 * http://download.intel.com/design/chipsets/datashts/318378.pdf
11 *
12 * The intel 5100 has two independent channels. EDAC core currently
13 * can not reflect this configuration so instead the chip-select
14 * rows for each respective channel are laid out one after another,
15 * the first half belonging to channel 0, the second half belonging
16 * to channel 1.
17 *
18 * This driver is for DDR2 DIMMs, and it uses chip select to select among the
19 * several ranks. However, instead of showing memories as ranks, it outputs
20 * them as DIMM's. An internal table creates the association between ranks
21 * and DIMM's.
22 */
23 #include <linux/module.h>
24 #include <linux/init.h>
25 #include <linux/pci.h>
26 #include <linux/pci_ids.h>
27 #include <linux/edac.h>
28 #include <linux/delay.h>
29 #include <linux/mmzone.h>
30 #include <linux/debugfs.h>
31
32 #include "edac_core.h"
33 #include "edac_module.h"
34
35 /* register addresses */
36
37 /* device 16, func 1 */
38 #define I5100_MC 0x40 /* Memory Control Register */
39 #define I5100_MC_SCRBEN_MASK (1 << 7)
40 #define I5100_MC_SCRBDONE_MASK (1 << 4)
41 #define I5100_MS 0x44 /* Memory Status Register */
42 #define I5100_SPDDATA 0x48 /* Serial Presence Detect Status Reg */
43 #define I5100_SPDCMD 0x4c /* Serial Presence Detect Command Reg */
44 #define I5100_TOLM 0x6c /* Top of Low Memory */
45 #define I5100_MIR0 0x80 /* Memory Interleave Range 0 */
46 #define I5100_MIR1 0x84 /* Memory Interleave Range 1 */
47 #define I5100_AMIR_0 0x8c /* Adjusted Memory Interleave Range 0 */
48 #define I5100_AMIR_1 0x90 /* Adjusted Memory Interleave Range 1 */
49 #define I5100_FERR_NF_MEM 0xa0 /* MC First Non Fatal Errors */
50 #define I5100_FERR_NF_MEM_M16ERR_MASK (1 << 16)
51 #define I5100_FERR_NF_MEM_M15ERR_MASK (1 << 15)
52 #define I5100_FERR_NF_MEM_M14ERR_MASK (1 << 14)
53 #define I5100_FERR_NF_MEM_M12ERR_MASK (1 << 12)
54 #define I5100_FERR_NF_MEM_M11ERR_MASK (1 << 11)
55 #define I5100_FERR_NF_MEM_M10ERR_MASK (1 << 10)
56 #define I5100_FERR_NF_MEM_M6ERR_MASK (1 << 6)
57 #define I5100_FERR_NF_MEM_M5ERR_MASK (1 << 5)
58 #define I5100_FERR_NF_MEM_M4ERR_MASK (1 << 4)
59 #define I5100_FERR_NF_MEM_M1ERR_MASK (1 << 1)
60 #define I5100_FERR_NF_MEM_ANY_MASK \
61 (I5100_FERR_NF_MEM_M16ERR_MASK | \
62 I5100_FERR_NF_MEM_M15ERR_MASK | \
63 I5100_FERR_NF_MEM_M14ERR_MASK | \
64 I5100_FERR_NF_MEM_M12ERR_MASK | \
65 I5100_FERR_NF_MEM_M11ERR_MASK | \
66 I5100_FERR_NF_MEM_M10ERR_MASK | \
67 I5100_FERR_NF_MEM_M6ERR_MASK | \
68 I5100_FERR_NF_MEM_M5ERR_MASK | \
69 I5100_FERR_NF_MEM_M4ERR_MASK | \
70 I5100_FERR_NF_MEM_M1ERR_MASK)
71 #define I5100_NERR_NF_MEM 0xa4 /* MC Next Non-Fatal Errors */
72 #define I5100_EMASK_MEM 0xa8 /* MC Error Mask Register */
73 #define I5100_MEM0EINJMSK0 0x200 /* Injection Mask0 Register Channel 0 */
74 #define I5100_MEM1EINJMSK0 0x208 /* Injection Mask0 Register Channel 1 */
75 #define I5100_MEMXEINJMSK0_EINJEN (1 << 27)
76 #define I5100_MEM0EINJMSK1 0x204 /* Injection Mask1 Register Channel 0 */
77 #define I5100_MEM1EINJMSK1 0x206 /* Injection Mask1 Register Channel 1 */
78
79 /* Device 19, Function 0 */
80 #define I5100_DINJ0 0x9a
81
82 /* device 21 and 22, func 0 */
83 #define I5100_MTR_0 0x154 /* Memory Technology Registers 0-3 */
84 #define I5100_DMIR 0x15c /* DIMM Interleave Range */
85 #define I5100_VALIDLOG 0x18c /* Valid Log Markers */
86 #define I5100_NRECMEMA 0x190 /* Non-Recoverable Memory Error Log Reg A */
87 #define I5100_NRECMEMB 0x194 /* Non-Recoverable Memory Error Log Reg B */
88 #define I5100_REDMEMA 0x198 /* Recoverable Memory Data Error Log Reg A */
89 #define I5100_REDMEMB 0x19c /* Recoverable Memory Data Error Log Reg B */
90 #define I5100_RECMEMA 0x1a0 /* Recoverable Memory Error Log Reg A */
91 #define I5100_RECMEMB 0x1a4 /* Recoverable Memory Error Log Reg B */
92 #define I5100_MTR_4 0x1b0 /* Memory Technology Registers 4,5 */
93
94 /* bit field accessors */
95
96 static inline u32 i5100_mc_scrben(u32 mc)
97 {
98 return mc >> 7 & 1;
99 }
100
101 static inline u32 i5100_mc_errdeten(u32 mc)
102 {
103 return mc >> 5 & 1;
104 }
105
106 static inline u32 i5100_mc_scrbdone(u32 mc)
107 {
108 return mc >> 4 & 1;
109 }
110
111 static inline u16 i5100_spddata_rdo(u16 a)
112 {
113 return a >> 15 & 1;
114 }
115
116 static inline u16 i5100_spddata_sbe(u16 a)
117 {
118 return a >> 13 & 1;
119 }
120
121 static inline u16 i5100_spddata_busy(u16 a)
122 {
123 return a >> 12 & 1;
124 }
125
126 static inline u16 i5100_spddata_data(u16 a)
127 {
128 return a & ((1 << 8) - 1);
129 }
130
131 static inline u32 i5100_spdcmd_create(u32 dti, u32 ckovrd, u32 sa, u32 ba,
132 u32 data, u32 cmd)
133 {
134 return ((dti & ((1 << 4) - 1)) << 28) |
135 ((ckovrd & 1) << 27) |
136 ((sa & ((1 << 3) - 1)) << 24) |
137 ((ba & ((1 << 8) - 1)) << 16) |
138 ((data & ((1 << 8) - 1)) << 8) |
139 (cmd & 1);
140 }
141
142 static inline u16 i5100_tolm_tolm(u16 a)
143 {
144 return a >> 12 & ((1 << 4) - 1);
145 }
146
147 static inline u16 i5100_mir_limit(u16 a)
148 {
149 return a >> 4 & ((1 << 12) - 1);
150 }
151
152 static inline u16 i5100_mir_way1(u16 a)
153 {
154 return a >> 1 & 1;
155 }
156
157 static inline u16 i5100_mir_way0(u16 a)
158 {
159 return a & 1;
160 }
161
162 static inline u32 i5100_ferr_nf_mem_chan_indx(u32 a)
163 {
164 return a >> 28 & 1;
165 }
166
167 static inline u32 i5100_ferr_nf_mem_any(u32 a)
168 {
169 return a & I5100_FERR_NF_MEM_ANY_MASK;
170 }
171
172 static inline u32 i5100_nerr_nf_mem_any(u32 a)
173 {
174 return i5100_ferr_nf_mem_any(a);
175 }
176
177 static inline u32 i5100_dmir_limit(u32 a)
178 {
179 return a >> 16 & ((1 << 11) - 1);
180 }
181
182 static inline u32 i5100_dmir_rank(u32 a, u32 i)
183 {
184 return a >> (4 * i) & ((1 << 2) - 1);
185 }
186
187 static inline u16 i5100_mtr_present(u16 a)
188 {
189 return a >> 10 & 1;
190 }
191
192 static inline u16 i5100_mtr_ethrottle(u16 a)
193 {
194 return a >> 9 & 1;
195 }
196
197 static inline u16 i5100_mtr_width(u16 a)
198 {
199 return a >> 8 & 1;
200 }
201
202 static inline u16 i5100_mtr_numbank(u16 a)
203 {
204 return a >> 6 & 1;
205 }
206
207 static inline u16 i5100_mtr_numrow(u16 a)
208 {
209 return a >> 2 & ((1 << 2) - 1);
210 }
211
212 static inline u16 i5100_mtr_numcol(u16 a)
213 {
214 return a & ((1 << 2) - 1);
215 }
216
217
218 static inline u32 i5100_validlog_redmemvalid(u32 a)
219 {
220 return a >> 2 & 1;
221 }
222
223 static inline u32 i5100_validlog_recmemvalid(u32 a)
224 {
225 return a >> 1 & 1;
226 }
227
228 static inline u32 i5100_validlog_nrecmemvalid(u32 a)
229 {
230 return a & 1;
231 }
232
233 static inline u32 i5100_nrecmema_merr(u32 a)
234 {
235 return a >> 15 & ((1 << 5) - 1);
236 }
237
238 static inline u32 i5100_nrecmema_bank(u32 a)
239 {
240 return a >> 12 & ((1 << 3) - 1);
241 }
242
243 static inline u32 i5100_nrecmema_rank(u32 a)
244 {
245 return a >> 8 & ((1 << 3) - 1);
246 }
247
248 static inline u32 i5100_nrecmema_dm_buf_id(u32 a)
249 {
250 return a & ((1 << 8) - 1);
251 }
252
253 static inline u32 i5100_nrecmemb_cas(u32 a)
254 {
255 return a >> 16 & ((1 << 13) - 1);
256 }
257
258 static inline u32 i5100_nrecmemb_ras(u32 a)
259 {
260 return a & ((1 << 16) - 1);
261 }
262
263 static inline u32 i5100_redmemb_ecc_locator(u32 a)
264 {
265 return a & ((1 << 18) - 1);
266 }
267
268 static inline u32 i5100_recmema_merr(u32 a)
269 {
270 return i5100_nrecmema_merr(a);
271 }
272
273 static inline u32 i5100_recmema_bank(u32 a)
274 {
275 return i5100_nrecmema_bank(a);
276 }
277
278 static inline u32 i5100_recmema_rank(u32 a)
279 {
280 return i5100_nrecmema_rank(a);
281 }
282
283 static inline u32 i5100_recmemb_cas(u32 a)
284 {
285 return i5100_nrecmemb_cas(a);
286 }
287
288 static inline u32 i5100_recmemb_ras(u32 a)
289 {
290 return i5100_nrecmemb_ras(a);
291 }
292
293 /* some generic limits */
294 #define I5100_MAX_RANKS_PER_CHAN 6
295 #define I5100_CHANNELS 2
296 #define I5100_MAX_RANKS_PER_DIMM 4
297 #define I5100_DIMM_ADDR_LINES (6 - 3) /* 64 bits / 8 bits per byte */
298 #define I5100_MAX_DIMM_SLOTS_PER_CHAN 4
299 #define I5100_MAX_RANK_INTERLEAVE 4
300 #define I5100_MAX_DMIRS 5
301 #define I5100_SCRUB_REFRESH_RATE (5 * 60 * HZ)
302
303 struct i5100_priv {
304 /* ranks on each dimm -- 0 maps to not present -- obtained via SPD */
305 int dimm_numrank[I5100_CHANNELS][I5100_MAX_DIMM_SLOTS_PER_CHAN];
306
307 /*
308 * mainboard chip select map -- maps i5100 chip selects to
309 * DIMM slot chip selects. In the case of only 4 ranks per
310 * channel, the mapping is fairly obvious but not unique.
311 * we map -1 -> NC and assume both channels use the same
312 * map...
313 *
314 */
315 int dimm_csmap[I5100_MAX_DIMM_SLOTS_PER_CHAN][I5100_MAX_RANKS_PER_DIMM];
316
317 /* memory interleave range */
318 struct {
319 u64 limit;
320 unsigned way[2];
321 } mir[I5100_CHANNELS];
322
323 /* adjusted memory interleave range register */
324 unsigned amir[I5100_CHANNELS];
325
326 /* dimm interleave range */
327 struct {
328 unsigned rank[I5100_MAX_RANK_INTERLEAVE];
329 u64 limit;
330 } dmir[I5100_CHANNELS][I5100_MAX_DMIRS];
331
332 /* memory technology registers... */
333 struct {
334 unsigned present; /* 0 or 1 */
335 unsigned ethrottle; /* 0 or 1 */
336 unsigned width; /* 4 or 8 bits */
337 unsigned numbank; /* 2 or 3 lines */
338 unsigned numrow; /* 13 .. 16 lines */
339 unsigned numcol; /* 11 .. 12 lines */
340 } mtr[I5100_CHANNELS][I5100_MAX_RANKS_PER_CHAN];
341
342 u64 tolm; /* top of low memory in bytes */
343 unsigned ranksperchan; /* number of ranks per channel */
344
345 struct pci_dev *mc; /* device 16 func 1 */
346 struct pci_dev *einj; /* device 19 func 0 */
347 struct pci_dev *ch0mm; /* device 21 func 0 */
348 struct pci_dev *ch1mm; /* device 22 func 0 */
349
350 struct delayed_work i5100_scrubbing;
351 int scrub_enable;
352
353 /* Error injection */
354 u8 inject_channel;
355 u8 inject_hlinesel;
356 u8 inject_deviceptr1;
357 u8 inject_deviceptr2;
358 u16 inject_eccmask1;
359 u16 inject_eccmask2;
360
361 struct dentry *debugfs;
362 };
363
364 static struct dentry *i5100_debugfs;
365
366 /* map a rank/chan to a slot number on the mainboard */
367 static int i5100_rank_to_slot(const struct mem_ctl_info *mci,
368 int chan, int rank)
369 {
370 const struct i5100_priv *priv = mci->pvt_info;
371 int i;
372
373 for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CHAN; i++) {
374 int j;
375 const int numrank = priv->dimm_numrank[chan][i];
376
377 for (j = 0; j < numrank; j++)
378 if (priv->dimm_csmap[i][j] == rank)
379 return i * 2 + chan;
380 }
381
382 return -1;
383 }
384
385 static const char *i5100_err_msg(unsigned err)
386 {
387 static const char *merrs[] = {
388 "unknown", /* 0 */
389 "uncorrectable data ECC on replay", /* 1 */
390 "unknown", /* 2 */
391 "unknown", /* 3 */
392 "aliased uncorrectable demand data ECC", /* 4 */
393 "aliased uncorrectable spare-copy data ECC", /* 5 */
394 "aliased uncorrectable patrol data ECC", /* 6 */
395 "unknown", /* 7 */
396 "unknown", /* 8 */
397 "unknown", /* 9 */
398 "non-aliased uncorrectable demand data ECC", /* 10 */
399 "non-aliased uncorrectable spare-copy data ECC", /* 11 */
400 "non-aliased uncorrectable patrol data ECC", /* 12 */
401 "unknown", /* 13 */
402 "correctable demand data ECC", /* 14 */
403 "correctable spare-copy data ECC", /* 15 */
404 "correctable patrol data ECC", /* 16 */
405 "unknown", /* 17 */
406 "SPD protocol error", /* 18 */
407 "unknown", /* 19 */
408 "spare copy initiated", /* 20 */
409 "spare copy completed", /* 21 */
410 };
411 unsigned i;
412
413 for (i = 0; i < ARRAY_SIZE(merrs); i++)
414 if (1 << i & err)
415 return merrs[i];
416
417 return "none";
418 }
419
420 /* convert csrow index into a rank (per channel -- 0..5) */
421 static int i5100_csrow_to_rank(const struct mem_ctl_info *mci, int csrow)
422 {
423 const struct i5100_priv *priv = mci->pvt_info;
424
425 return csrow % priv->ranksperchan;
426 }
427
428 /* convert csrow index into a channel (0..1) */
429 static int i5100_csrow_to_chan(const struct mem_ctl_info *mci, int csrow)
430 {
431 const struct i5100_priv *priv = mci->pvt_info;
432
433 return csrow / priv->ranksperchan;
434 }
435
436 static void i5100_handle_ce(struct mem_ctl_info *mci,
437 int chan,
438 unsigned bank,
439 unsigned rank,
440 unsigned long syndrome,
441 unsigned cas,
442 unsigned ras,
443 const char *msg)
444 {
445 char detail[80];
446
447 /* Form out message */
448 snprintf(detail, sizeof(detail),
449 "bank %u, cas %u, ras %u\n",
450 bank, cas, ras);
451
452 edac_mc_handle_error(HW_EVENT_ERR_CORRECTED, mci, 1,
453 0, 0, syndrome,
454 chan, rank, -1,
455 msg, detail);
456 }
457
458 static void i5100_handle_ue(struct mem_ctl_info *mci,
459 int chan,
460 unsigned bank,
461 unsigned rank,
462 unsigned long syndrome,
463 unsigned cas,
464 unsigned ras,
465 const char *msg)
466 {
467 char detail[80];
468
469 /* Form out message */
470 snprintf(detail, sizeof(detail),
471 "bank %u, cas %u, ras %u\n",
472 bank, cas, ras);
473
474 edac_mc_handle_error(HW_EVENT_ERR_UNCORRECTED, mci, 1,
475 0, 0, syndrome,
476 chan, rank, -1,
477 msg, detail);
478 }
479
480 static void i5100_read_log(struct mem_ctl_info *mci, int chan,
481 u32 ferr, u32 nerr)
482 {
483 struct i5100_priv *priv = mci->pvt_info;
484 struct pci_dev *pdev = (chan) ? priv->ch1mm : priv->ch0mm;
485 u32 dw;
486 u32 dw2;
487 unsigned syndrome = 0;
488 unsigned ecc_loc = 0;
489 unsigned merr;
490 unsigned bank;
491 unsigned rank;
492 unsigned cas;
493 unsigned ras;
494
495 pci_read_config_dword(pdev, I5100_VALIDLOG, &dw);
496
497 if (i5100_validlog_redmemvalid(dw)) {
498 pci_read_config_dword(pdev, I5100_REDMEMA, &dw2);
499 syndrome = dw2;
500 pci_read_config_dword(pdev, I5100_REDMEMB, &dw2);
501 ecc_loc = i5100_redmemb_ecc_locator(dw2);
502 }
503
504 if (i5100_validlog_recmemvalid(dw)) {
505 const char *msg;
506
507 pci_read_config_dword(pdev, I5100_RECMEMA, &dw2);
508 merr = i5100_recmema_merr(dw2);
509 bank = i5100_recmema_bank(dw2);
510 rank = i5100_recmema_rank(dw2);
511
512 pci_read_config_dword(pdev, I5100_RECMEMB, &dw2);
513 cas = i5100_recmemb_cas(dw2);
514 ras = i5100_recmemb_ras(dw2);
515
516 /* FIXME: not really sure if this is what merr is...
517 */
518 if (!merr)
519 msg = i5100_err_msg(ferr);
520 else
521 msg = i5100_err_msg(nerr);
522
523 i5100_handle_ce(mci, chan, bank, rank, syndrome, cas, ras, msg);
524 }
525
526 if (i5100_validlog_nrecmemvalid(dw)) {
527 const char *msg;
528
529 pci_read_config_dword(pdev, I5100_NRECMEMA, &dw2);
530 merr = i5100_nrecmema_merr(dw2);
531 bank = i5100_nrecmema_bank(dw2);
532 rank = i5100_nrecmema_rank(dw2);
533
534 pci_read_config_dword(pdev, I5100_NRECMEMB, &dw2);
535 cas = i5100_nrecmemb_cas(dw2);
536 ras = i5100_nrecmemb_ras(dw2);
537
538 /* FIXME: not really sure if this is what merr is...
539 */
540 if (!merr)
541 msg = i5100_err_msg(ferr);
542 else
543 msg = i5100_err_msg(nerr);
544
545 i5100_handle_ue(mci, chan, bank, rank, syndrome, cas, ras, msg);
546 }
547
548 pci_write_config_dword(pdev, I5100_VALIDLOG, dw);
549 }
550
551 static void i5100_check_error(struct mem_ctl_info *mci)
552 {
553 struct i5100_priv *priv = mci->pvt_info;
554 u32 dw, dw2;
555
556 pci_read_config_dword(priv->mc, I5100_FERR_NF_MEM, &dw);
557 if (i5100_ferr_nf_mem_any(dw)) {
558
559 pci_read_config_dword(priv->mc, I5100_NERR_NF_MEM, &dw2);
560
561 i5100_read_log(mci, i5100_ferr_nf_mem_chan_indx(dw),
562 i5100_ferr_nf_mem_any(dw),
563 i5100_nerr_nf_mem_any(dw2));
564
565 pci_write_config_dword(priv->mc, I5100_NERR_NF_MEM, dw2);
566 }
567 pci_write_config_dword(priv->mc, I5100_FERR_NF_MEM, dw);
568 }
569
570 /* The i5100 chipset will scrub the entire memory once, then
571 * set a done bit. Continuous scrubbing is achieved by enqueing
572 * delayed work to a workqueue, checking every few minutes if
573 * the scrubbing has completed and if so reinitiating it.
574 */
575
576 static void i5100_refresh_scrubbing(struct work_struct *work)
577 {
578 struct delayed_work *i5100_scrubbing = container_of(work,
579 struct delayed_work,
580 work);
581 struct i5100_priv *priv = container_of(i5100_scrubbing,
582 struct i5100_priv,
583 i5100_scrubbing);
584 u32 dw;
585
586 pci_read_config_dword(priv->mc, I5100_MC, &dw);
587
588 if (priv->scrub_enable) {
589
590 pci_read_config_dword(priv->mc, I5100_MC, &dw);
591
592 if (i5100_mc_scrbdone(dw)) {
593 dw |= I5100_MC_SCRBEN_MASK;
594 pci_write_config_dword(priv->mc, I5100_MC, dw);
595 pci_read_config_dword(priv->mc, I5100_MC, &dw);
596 }
597
598 schedule_delayed_work(&(priv->i5100_scrubbing),
599 I5100_SCRUB_REFRESH_RATE);
600 }
601 }
602 /*
603 * The bandwidth is based on experimentation, feel free to refine it.
604 */
605 static int i5100_set_scrub_rate(struct mem_ctl_info *mci, u32 bandwidth)
606 {
607 struct i5100_priv *priv = mci->pvt_info;
608 u32 dw;
609
610 pci_read_config_dword(priv->mc, I5100_MC, &dw);
611 if (bandwidth) {
612 priv->scrub_enable = 1;
613 dw |= I5100_MC_SCRBEN_MASK;
614 schedule_delayed_work(&(priv->i5100_scrubbing),
615 I5100_SCRUB_REFRESH_RATE);
616 } else {
617 priv->scrub_enable = 0;
618 dw &= ~I5100_MC_SCRBEN_MASK;
619 cancel_delayed_work(&(priv->i5100_scrubbing));
620 }
621 pci_write_config_dword(priv->mc, I5100_MC, dw);
622
623 pci_read_config_dword(priv->mc, I5100_MC, &dw);
624
625 bandwidth = 5900000 * i5100_mc_scrben(dw);
626
627 return bandwidth;
628 }
629
630 static int i5100_get_scrub_rate(struct mem_ctl_info *mci)
631 {
632 struct i5100_priv *priv = mci->pvt_info;
633 u32 dw;
634
635 pci_read_config_dword(priv->mc, I5100_MC, &dw);
636
637 return 5900000 * i5100_mc_scrben(dw);
638 }
639
640 static struct pci_dev *pci_get_device_func(unsigned vendor,
641 unsigned device,
642 unsigned func)
643 {
644 struct pci_dev *ret = NULL;
645
646 while (1) {
647 ret = pci_get_device(vendor, device, ret);
648
649 if (!ret)
650 break;
651
652 if (PCI_FUNC(ret->devfn) == func)
653 break;
654 }
655
656 return ret;
657 }
658
659 static unsigned long i5100_npages(struct mem_ctl_info *mci, int csrow)
660 {
661 struct i5100_priv *priv = mci->pvt_info;
662 const unsigned chan_rank = i5100_csrow_to_rank(mci, csrow);
663 const unsigned chan = i5100_csrow_to_chan(mci, csrow);
664 unsigned addr_lines;
665
666 /* dimm present? */
667 if (!priv->mtr[chan][chan_rank].present)
668 return 0ULL;
669
670 addr_lines =
671 I5100_DIMM_ADDR_LINES +
672 priv->mtr[chan][chan_rank].numcol +
673 priv->mtr[chan][chan_rank].numrow +
674 priv->mtr[chan][chan_rank].numbank;
675
676 return (unsigned long)
677 ((unsigned long long) (1ULL << addr_lines) / PAGE_SIZE);
678 }
679
680 static void i5100_init_mtr(struct mem_ctl_info *mci)
681 {
682 struct i5100_priv *priv = mci->pvt_info;
683 struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
684 int i;
685
686 for (i = 0; i < I5100_CHANNELS; i++) {
687 int j;
688 struct pci_dev *pdev = mms[i];
689
690 for (j = 0; j < I5100_MAX_RANKS_PER_CHAN; j++) {
691 const unsigned addr =
692 (j < 4) ? I5100_MTR_0 + j * 2 :
693 I5100_MTR_4 + (j - 4) * 2;
694 u16 w;
695
696 pci_read_config_word(pdev, addr, &w);
697
698 priv->mtr[i][j].present = i5100_mtr_present(w);
699 priv->mtr[i][j].ethrottle = i5100_mtr_ethrottle(w);
700 priv->mtr[i][j].width = 4 + 4 * i5100_mtr_width(w);
701 priv->mtr[i][j].numbank = 2 + i5100_mtr_numbank(w);
702 priv->mtr[i][j].numrow = 13 + i5100_mtr_numrow(w);
703 priv->mtr[i][j].numcol = 10 + i5100_mtr_numcol(w);
704 }
705 }
706 }
707
708 /*
709 * FIXME: make this into a real i2c adapter (so that dimm-decode
710 * will work)?
711 */
712 static int i5100_read_spd_byte(const struct mem_ctl_info *mci,
713 u8 ch, u8 slot, u8 addr, u8 *byte)
714 {
715 struct i5100_priv *priv = mci->pvt_info;
716 u16 w;
717 unsigned long et;
718
719 pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
720 if (i5100_spddata_busy(w))
721 return -1;
722
723 pci_write_config_dword(priv->mc, I5100_SPDCMD,
724 i5100_spdcmd_create(0xa, 1, ch * 4 + slot, addr,
725 0, 0));
726
727 /* wait up to 100ms */
728 et = jiffies + HZ / 10;
729 udelay(100);
730 while (1) {
731 pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
732 if (!i5100_spddata_busy(w))
733 break;
734 udelay(100);
735 }
736
737 if (!i5100_spddata_rdo(w) || i5100_spddata_sbe(w))
738 return -1;
739
740 *byte = i5100_spddata_data(w);
741
742 return 0;
743 }
744
745 /*
746 * fill dimm chip select map
747 *
748 * FIXME:
749 * o not the only way to may chip selects to dimm slots
750 * o investigate if there is some way to obtain this map from the bios
751 */
752 static void i5100_init_dimm_csmap(struct mem_ctl_info *mci)
753 {
754 struct i5100_priv *priv = mci->pvt_info;
755 int i;
756
757 for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CHAN; i++) {
758 int j;
759
760 for (j = 0; j < I5100_MAX_RANKS_PER_DIMM; j++)
761 priv->dimm_csmap[i][j] = -1; /* default NC */
762 }
763
764 /* only 2 chip selects per slot... */
765 if (priv->ranksperchan == 4) {
766 priv->dimm_csmap[0][0] = 0;
767 priv->dimm_csmap[0][1] = 3;
768 priv->dimm_csmap[1][0] = 1;
769 priv->dimm_csmap[1][1] = 2;
770 priv->dimm_csmap[2][0] = 2;
771 priv->dimm_csmap[3][0] = 3;
772 } else {
773 priv->dimm_csmap[0][0] = 0;
774 priv->dimm_csmap[0][1] = 1;
775 priv->dimm_csmap[1][0] = 2;
776 priv->dimm_csmap[1][1] = 3;
777 priv->dimm_csmap[2][0] = 4;
778 priv->dimm_csmap[2][1] = 5;
779 }
780 }
781
782 static void i5100_init_dimm_layout(struct pci_dev *pdev,
783 struct mem_ctl_info *mci)
784 {
785 struct i5100_priv *priv = mci->pvt_info;
786 int i;
787
788 for (i = 0; i < I5100_CHANNELS; i++) {
789 int j;
790
791 for (j = 0; j < I5100_MAX_DIMM_SLOTS_PER_CHAN; j++) {
792 u8 rank;
793
794 if (i5100_read_spd_byte(mci, i, j, 5, &rank) < 0)
795 priv->dimm_numrank[i][j] = 0;
796 else
797 priv->dimm_numrank[i][j] = (rank & 3) + 1;
798 }
799 }
800
801 i5100_init_dimm_csmap(mci);
802 }
803
804 static void i5100_init_interleaving(struct pci_dev *pdev,
805 struct mem_ctl_info *mci)
806 {
807 u16 w;
808 u32 dw;
809 struct i5100_priv *priv = mci->pvt_info;
810 struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
811 int i;
812
813 pci_read_config_word(pdev, I5100_TOLM, &w);
814 priv->tolm = (u64) i5100_tolm_tolm(w) * 256 * 1024 * 1024;
815
816 pci_read_config_word(pdev, I5100_MIR0, &w);
817 priv->mir[0].limit = (u64) i5100_mir_limit(w) << 28;
818 priv->mir[0].way[1] = i5100_mir_way1(w);
819 priv->mir[0].way[0] = i5100_mir_way0(w);
820
821 pci_read_config_word(pdev, I5100_MIR1, &w);
822 priv->mir[1].limit = (u64) i5100_mir_limit(w) << 28;
823 priv->mir[1].way[1] = i5100_mir_way1(w);
824 priv->mir[1].way[0] = i5100_mir_way0(w);
825
826 pci_read_config_word(pdev, I5100_AMIR_0, &w);
827 priv->amir[0] = w;
828 pci_read_config_word(pdev, I5100_AMIR_1, &w);
829 priv->amir[1] = w;
830
831 for (i = 0; i < I5100_CHANNELS; i++) {
832 int j;
833
834 for (j = 0; j < 5; j++) {
835 int k;
836
837 pci_read_config_dword(mms[i], I5100_DMIR + j * 4, &dw);
838
839 priv->dmir[i][j].limit =
840 (u64) i5100_dmir_limit(dw) << 28;
841 for (k = 0; k < I5100_MAX_RANKS_PER_DIMM; k++)
842 priv->dmir[i][j].rank[k] =
843 i5100_dmir_rank(dw, k);
844 }
845 }
846
847 i5100_init_mtr(mci);
848 }
849
850 static void i5100_init_csrows(struct mem_ctl_info *mci)
851 {
852 int i;
853 struct i5100_priv *priv = mci->pvt_info;
854
855 for (i = 0; i < mci->tot_dimms; i++) {
856 struct dimm_info *dimm;
857 const unsigned long npages = i5100_npages(mci, i);
858 const unsigned chan = i5100_csrow_to_chan(mci, i);
859 const unsigned rank = i5100_csrow_to_rank(mci, i);
860
861 if (!npages)
862 continue;
863
864 dimm = EDAC_DIMM_PTR(mci->layers, mci->dimms, mci->n_layers,
865 chan, rank, 0);
866
867 dimm->nr_pages = npages;
868 dimm->grain = 32;
869 dimm->dtype = (priv->mtr[chan][rank].width == 4) ?
870 DEV_X4 : DEV_X8;
871 dimm->mtype = MEM_RDDR2;
872 dimm->edac_mode = EDAC_SECDED;
873 snprintf(dimm->label, sizeof(dimm->label), "DIMM%u",
874 i5100_rank_to_slot(mci, chan, rank));
875
876 edac_dbg(2, "dimm channel %d, rank %d, size %ld\n",
877 chan, rank, (long)PAGES_TO_MiB(npages));
878 }
879 }
880
881 /****************************************************************************
882 * Error injection routines
883 ****************************************************************************/
884
885 static void i5100_do_inject(struct mem_ctl_info *mci)
886 {
887 struct i5100_priv *priv = mci->pvt_info;
888 u32 mask0;
889 u16 mask1;
890
891 /* MEM[1:0]EINJMSK0
892 * 31 - ADDRMATCHEN
893 * 29:28 - HLINESEL
894 * 00 Reserved
895 * 01 Lower half of cache line
896 * 10 Upper half of cache line
897 * 11 Both upper and lower parts of cache line
898 * 27 - EINJEN
899 * 25:19 - XORMASK1 for deviceptr1
900 * 9:5 - SEC2RAM for deviceptr2
901 * 4:0 - FIR2RAM for deviceptr1
902 */
903 mask0 = ((priv->inject_hlinesel & 0x3) << 28) |
904 I5100_MEMXEINJMSK0_EINJEN |
905 ((priv->inject_eccmask1 & 0xffff) << 10) |
906 ((priv->inject_deviceptr2 & 0x1f) << 5) |
907 (priv->inject_deviceptr1 & 0x1f);
908
909 /* MEM[1:0]EINJMSK1
910 * 15:0 - XORMASK2 for deviceptr2
911 */
912 mask1 = priv->inject_eccmask2;
913
914 if (priv->inject_channel == 0) {
915 pci_write_config_dword(priv->mc, I5100_MEM0EINJMSK0, mask0);
916 pci_write_config_word(priv->mc, I5100_MEM0EINJMSK1, mask1);
917 } else {
918 pci_write_config_dword(priv->mc, I5100_MEM1EINJMSK0, mask0);
919 pci_write_config_word(priv->mc, I5100_MEM1EINJMSK1, mask1);
920 }
921
922 /* Error Injection Response Function
923 * Intel 5100 Memory Controller Hub Chipset (318378) datasheet
924 * hints about this register but carry no data about them. All
925 * data regarding device 19 is based on experimentation and the
926 * Intel 7300 Chipset Memory Controller Hub (318082) datasheet
927 * which appears to be accurate for the i5100 in this area.
928 *
929 * The injection code don't work without setting this register.
930 * The register needs to be flipped off then on else the hardware
931 * will only preform the first injection.
932 *
933 * Stop condition bits 7:4
934 * 1010 - Stop after one injection
935 * 1011 - Never stop injecting faults
936 *
937 * Start condition bits 3:0
938 * 1010 - Never start
939 * 1011 - Start immediately
940 */
941 pci_write_config_byte(priv->einj, I5100_DINJ0, 0xaa);
942 pci_write_config_byte(priv->einj, I5100_DINJ0, 0xab);
943 }
944
945 #define to_mci(k) container_of(k, struct mem_ctl_info, dev)
946 static ssize_t inject_enable_write(struct file *file, const char __user *data,
947 size_t count, loff_t *ppos)
948 {
949 struct device *dev = file->private_data;
950 struct mem_ctl_info *mci = to_mci(dev);
951
952 i5100_do_inject(mci);
953
954 return count;
955 }
956
957 static const struct file_operations i5100_inject_enable_fops = {
958 .open = simple_open,
959 .write = inject_enable_write,
960 .llseek = generic_file_llseek,
961 };
962
963 static int i5100_setup_debugfs(struct mem_ctl_info *mci)
964 {
965 struct i5100_priv *priv = mci->pvt_info;
966
967 if (!i5100_debugfs)
968 return -ENODEV;
969
970 priv->debugfs = edac_debugfs_create_dir_at(mci->bus->name, i5100_debugfs);
971
972 if (!priv->debugfs)
973 return -ENOMEM;
974
975 edac_debugfs_create_x8("inject_channel", S_IRUGO | S_IWUSR, priv->debugfs,
976 &priv->inject_channel);
977 edac_debugfs_create_x8("inject_hlinesel", S_IRUGO | S_IWUSR, priv->debugfs,
978 &priv->inject_hlinesel);
979 edac_debugfs_create_x8("inject_deviceptr1", S_IRUGO | S_IWUSR, priv->debugfs,
980 &priv->inject_deviceptr1);
981 edac_debugfs_create_x8("inject_deviceptr2", S_IRUGO | S_IWUSR, priv->debugfs,
982 &priv->inject_deviceptr2);
983 edac_debugfs_create_x16("inject_eccmask1", S_IRUGO | S_IWUSR, priv->debugfs,
984 &priv->inject_eccmask1);
985 edac_debugfs_create_x16("inject_eccmask2", S_IRUGO | S_IWUSR, priv->debugfs,
986 &priv->inject_eccmask2);
987 edac_debugfs_create_file("inject_enable", S_IWUSR, priv->debugfs,
988 &mci->dev, &i5100_inject_enable_fops);
989
990 return 0;
991
992 }
993
994 static int i5100_init_one(struct pci_dev *pdev, const struct pci_device_id *id)
995 {
996 int rc;
997 struct mem_ctl_info *mci;
998 struct edac_mc_layer layers[2];
999 struct i5100_priv *priv;
1000 struct pci_dev *ch0mm, *ch1mm, *einj;
1001 int ret = 0;
1002 u32 dw;
1003 int ranksperch;
1004
1005 if (PCI_FUNC(pdev->devfn) != 1)
1006 return -ENODEV;
1007
1008 rc = pci_enable_device(pdev);
1009 if (rc < 0) {
1010 ret = rc;
1011 goto bail;
1012 }
1013
1014 /* ECC enabled? */
1015 pci_read_config_dword(pdev, I5100_MC, &dw);
1016 if (!i5100_mc_errdeten(dw)) {
1017 printk(KERN_INFO "i5100_edac: ECC not enabled.\n");
1018 ret = -ENODEV;
1019 goto bail_pdev;
1020 }
1021
1022 /* figure out how many ranks, from strapped state of 48GB_Mode input */
1023 pci_read_config_dword(pdev, I5100_MS, &dw);
1024 ranksperch = !!(dw & (1 << 8)) * 2 + 4;
1025
1026 /* enable error reporting... */
1027 pci_read_config_dword(pdev, I5100_EMASK_MEM, &dw);
1028 dw &= ~I5100_FERR_NF_MEM_ANY_MASK;
1029 pci_write_config_dword(pdev, I5100_EMASK_MEM, dw);
1030
1031 /* device 21, func 0, Channel 0 Memory Map, Error Flag/Mask, etc... */
1032 ch0mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
1033 PCI_DEVICE_ID_INTEL_5100_21, 0);
1034 if (!ch0mm) {
1035 ret = -ENODEV;
1036 goto bail_pdev;
1037 }
1038
1039 rc = pci_enable_device(ch0mm);
1040 if (rc < 0) {
1041 ret = rc;
1042 goto bail_ch0;
1043 }
1044
1045 /* device 22, func 0, Channel 1 Memory Map, Error Flag/Mask, etc... */
1046 ch1mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
1047 PCI_DEVICE_ID_INTEL_5100_22, 0);
1048 if (!ch1mm) {
1049 ret = -ENODEV;
1050 goto bail_disable_ch0;
1051 }
1052
1053 rc = pci_enable_device(ch1mm);
1054 if (rc < 0) {
1055 ret = rc;
1056 goto bail_ch1;
1057 }
1058
1059 layers[0].type = EDAC_MC_LAYER_CHANNEL;
1060 layers[0].size = 2;
1061 layers[0].is_virt_csrow = false;
1062 layers[1].type = EDAC_MC_LAYER_SLOT;
1063 layers[1].size = ranksperch;
1064 layers[1].is_virt_csrow = true;
1065 mci = edac_mc_alloc(0, ARRAY_SIZE(layers), layers,
1066 sizeof(*priv));
1067 if (!mci) {
1068 ret = -ENOMEM;
1069 goto bail_disable_ch1;
1070 }
1071
1072
1073 /* device 19, func 0, Error injection */
1074 einj = pci_get_device_func(PCI_VENDOR_ID_INTEL,
1075 PCI_DEVICE_ID_INTEL_5100_19, 0);
1076 if (!einj) {
1077 ret = -ENODEV;
1078 goto bail_einj;
1079 }
1080
1081 rc = pci_enable_device(einj);
1082 if (rc < 0) {
1083 ret = rc;
1084 goto bail_disable_einj;
1085 }
1086
1087
1088 mci->pdev = &pdev->dev;
1089
1090 priv = mci->pvt_info;
1091 priv->ranksperchan = ranksperch;
1092 priv->mc = pdev;
1093 priv->ch0mm = ch0mm;
1094 priv->ch1mm = ch1mm;
1095 priv->einj = einj;
1096
1097 INIT_DELAYED_WORK(&(priv->i5100_scrubbing), i5100_refresh_scrubbing);
1098
1099 /* If scrubbing was already enabled by the bios, start maintaining it */
1100 pci_read_config_dword(pdev, I5100_MC, &dw);
1101 if (i5100_mc_scrben(dw)) {
1102 priv->scrub_enable = 1;
1103 schedule_delayed_work(&(priv->i5100_scrubbing),
1104 I5100_SCRUB_REFRESH_RATE);
1105 }
1106
1107 i5100_init_dimm_layout(pdev, mci);
1108 i5100_init_interleaving(pdev, mci);
1109
1110 mci->mtype_cap = MEM_FLAG_FB_DDR2;
1111 mci->edac_ctl_cap = EDAC_FLAG_SECDED;
1112 mci->edac_cap = EDAC_FLAG_SECDED;
1113 mci->mod_name = "i5100_edac.c";
1114 mci->mod_ver = "not versioned";
1115 mci->ctl_name = "i5100";
1116 mci->dev_name = pci_name(pdev);
1117 mci->ctl_page_to_phys = NULL;
1118
1119 mci->edac_check = i5100_check_error;
1120 mci->set_sdram_scrub_rate = i5100_set_scrub_rate;
1121 mci->get_sdram_scrub_rate = i5100_get_scrub_rate;
1122
1123 priv->inject_channel = 0;
1124 priv->inject_hlinesel = 0;
1125 priv->inject_deviceptr1 = 0;
1126 priv->inject_deviceptr2 = 0;
1127 priv->inject_eccmask1 = 0;
1128 priv->inject_eccmask2 = 0;
1129
1130 i5100_init_csrows(mci);
1131
1132 /* this strange construction seems to be in every driver, dunno why */
1133 switch (edac_op_state) {
1134 case EDAC_OPSTATE_POLL:
1135 case EDAC_OPSTATE_NMI:
1136 break;
1137 default:
1138 edac_op_state = EDAC_OPSTATE_POLL;
1139 break;
1140 }
1141
1142 if (edac_mc_add_mc(mci)) {
1143 ret = -ENODEV;
1144 goto bail_scrub;
1145 }
1146
1147 i5100_setup_debugfs(mci);
1148
1149 return ret;
1150
1151 bail_scrub:
1152 priv->scrub_enable = 0;
1153 cancel_delayed_work_sync(&(priv->i5100_scrubbing));
1154 edac_mc_free(mci);
1155
1156 bail_disable_einj:
1157 pci_disable_device(einj);
1158
1159 bail_einj:
1160 pci_dev_put(einj);
1161
1162 bail_disable_ch1:
1163 pci_disable_device(ch1mm);
1164
1165 bail_ch1:
1166 pci_dev_put(ch1mm);
1167
1168 bail_disable_ch0:
1169 pci_disable_device(ch0mm);
1170
1171 bail_ch0:
1172 pci_dev_put(ch0mm);
1173
1174 bail_pdev:
1175 pci_disable_device(pdev);
1176
1177 bail:
1178 return ret;
1179 }
1180
1181 static void i5100_remove_one(struct pci_dev *pdev)
1182 {
1183 struct mem_ctl_info *mci;
1184 struct i5100_priv *priv;
1185
1186 mci = edac_mc_del_mc(&pdev->dev);
1187
1188 if (!mci)
1189 return;
1190
1191 priv = mci->pvt_info;
1192
1193 edac_debugfs_remove_recursive(priv->debugfs);
1194
1195 priv->scrub_enable = 0;
1196 cancel_delayed_work_sync(&(priv->i5100_scrubbing));
1197
1198 pci_disable_device(pdev);
1199 pci_disable_device(priv->ch0mm);
1200 pci_disable_device(priv->ch1mm);
1201 pci_disable_device(priv->einj);
1202 pci_dev_put(priv->ch0mm);
1203 pci_dev_put(priv->ch1mm);
1204 pci_dev_put(priv->einj);
1205
1206 edac_mc_free(mci);
1207 }
1208
1209 static const struct pci_device_id i5100_pci_tbl[] = {
1210 /* Device 16, Function 0, Channel 0 Memory Map, Error Flag/Mask, ... */
1211 { PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_5100_16) },
1212 { 0, }
1213 };
1214 MODULE_DEVICE_TABLE(pci, i5100_pci_tbl);
1215
1216 static struct pci_driver i5100_driver = {
1217 .name = KBUILD_BASENAME,
1218 .probe = i5100_init_one,
1219 .remove = i5100_remove_one,
1220 .id_table = i5100_pci_tbl,
1221 };
1222
1223 static int __init i5100_init(void)
1224 {
1225 int pci_rc;
1226
1227 i5100_debugfs = edac_debugfs_create_dir_at("i5100_edac", NULL);
1228
1229 pci_rc = pci_register_driver(&i5100_driver);
1230 return (pci_rc < 0) ? pci_rc : 0;
1231 }
1232
1233 static void __exit i5100_exit(void)
1234 {
1235 edac_debugfs_remove(i5100_debugfs);
1236
1237 pci_unregister_driver(&i5100_driver);
1238 }
1239
1240 module_init(i5100_init);
1241 module_exit(i5100_exit);
1242
1243 MODULE_LICENSE("GPL");
1244 MODULE_AUTHOR
1245 ("Arthur Jones <ajones@riverbed.com>");
1246 MODULE_DESCRIPTION("MC Driver for Intel I5100 memory controllers");
This page took 0.070997 seconds and 5 git commands to generate.