i5100_edac.c 26 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093
  1. /*
  2. * Intel 5100 Memory Controllers kernel module
  3. *
  4. * This file may be distributed under the terms of the
  5. * GNU General Public License.
  6. *
  7. * This module is based on the following document:
  8. *
  9. * Intel 5100X Chipset Memory Controller Hub (MCH) - Datasheet
  10. * http://download.intel.com/design/chipsets/datashts/318378.pdf
  11. *
  12. * The intel 5100 has two independent channels. EDAC core currently
  13. * can not reflect this configuration so instead the chip-select
  14. * rows for each respective channel are layed out one after another,
  15. * the first half belonging to channel 0, the second half belonging
  16. * to channel 1.
  17. */
  18. #include <linux/module.h>
  19. #include <linux/init.h>
  20. #include <linux/pci.h>
  21. #include <linux/pci_ids.h>
  22. #include <linux/slab.h>
  23. #include <linux/edac.h>
  24. #include <linux/delay.h>
  25. #include <linux/mmzone.h>
  26. #include "edac_core.h"
  27. /* register addresses */
  28. /* device 16, func 1 */
  29. #define I5100_MC 0x40 /* Memory Control Register */
  30. #define I5100_MC_SCRBEN_MASK (1 << 7)
  31. #define I5100_MC_SCRBDONE_MASK (1 << 4)
  32. #define I5100_MS 0x44 /* Memory Status Register */
  33. #define I5100_SPDDATA 0x48 /* Serial Presence Detect Status Reg */
  34. #define I5100_SPDCMD 0x4c /* Serial Presence Detect Command Reg */
  35. #define I5100_TOLM 0x6c /* Top of Low Memory */
  36. #define I5100_MIR0 0x80 /* Memory Interleave Range 0 */
  37. #define I5100_MIR1 0x84 /* Memory Interleave Range 1 */
  38. #define I5100_AMIR_0 0x8c /* Adjusted Memory Interleave Range 0 */
  39. #define I5100_AMIR_1 0x90 /* Adjusted Memory Interleave Range 1 */
  40. #define I5100_FERR_NF_MEM 0xa0 /* MC First Non Fatal Errors */
  41. #define I5100_FERR_NF_MEM_M16ERR_MASK (1 << 16)
  42. #define I5100_FERR_NF_MEM_M15ERR_MASK (1 << 15)
  43. #define I5100_FERR_NF_MEM_M14ERR_MASK (1 << 14)
  44. #define I5100_FERR_NF_MEM_M12ERR_MASK (1 << 12)
  45. #define I5100_FERR_NF_MEM_M11ERR_MASK (1 << 11)
  46. #define I5100_FERR_NF_MEM_M10ERR_MASK (1 << 10)
  47. #define I5100_FERR_NF_MEM_M6ERR_MASK (1 << 6)
  48. #define I5100_FERR_NF_MEM_M5ERR_MASK (1 << 5)
  49. #define I5100_FERR_NF_MEM_M4ERR_MASK (1 << 4)
  50. #define I5100_FERR_NF_MEM_M1ERR_MASK 1
  51. #define I5100_FERR_NF_MEM_ANY_MASK \
  52. (I5100_FERR_NF_MEM_M16ERR_MASK | \
  53. I5100_FERR_NF_MEM_M15ERR_MASK | \
  54. I5100_FERR_NF_MEM_M14ERR_MASK | \
  55. I5100_FERR_NF_MEM_M12ERR_MASK | \
  56. I5100_FERR_NF_MEM_M11ERR_MASK | \
  57. I5100_FERR_NF_MEM_M10ERR_MASK | \
  58. I5100_FERR_NF_MEM_M6ERR_MASK | \
  59. I5100_FERR_NF_MEM_M5ERR_MASK | \
  60. I5100_FERR_NF_MEM_M4ERR_MASK | \
  61. I5100_FERR_NF_MEM_M1ERR_MASK)
  62. #define I5100_NERR_NF_MEM 0xa4 /* MC Next Non-Fatal Errors */
  63. #define I5100_EMASK_MEM 0xa8 /* MC Error Mask Register */
  64. /* device 21 and 22, func 0 */
  65. #define I5100_MTR_0 0x154 /* Memory Technology Registers 0-3 */
  66. #define I5100_DMIR 0x15c /* DIMM Interleave Range */
  67. #define I5100_VALIDLOG 0x18c /* Valid Log Markers */
  68. #define I5100_NRECMEMA 0x190 /* Non-Recoverable Memory Error Log Reg A */
  69. #define I5100_NRECMEMB 0x194 /* Non-Recoverable Memory Error Log Reg B */
  70. #define I5100_REDMEMA 0x198 /* Recoverable Memory Data Error Log Reg A */
  71. #define I5100_REDMEMB 0x19c /* Recoverable Memory Data Error Log Reg B */
  72. #define I5100_RECMEMA 0x1a0 /* Recoverable Memory Error Log Reg A */
  73. #define I5100_RECMEMB 0x1a4 /* Recoverable Memory Error Log Reg B */
  74. #define I5100_MTR_4 0x1b0 /* Memory Technology Registers 4,5 */
  75. /* bit field accessors */
  76. static inline u32 i5100_mc_scrben(u32 mc)
  77. {
  78. return mc >> 7 & 1;
  79. }
  80. static inline u32 i5100_mc_errdeten(u32 mc)
  81. {
  82. return mc >> 5 & 1;
  83. }
  84. static inline u32 i5100_mc_scrbdone(u32 mc)
  85. {
  86. return mc >> 4 & 1;
  87. }
  88. static inline u16 i5100_spddata_rdo(u16 a)
  89. {
  90. return a >> 15 & 1;
  91. }
  92. static inline u16 i5100_spddata_sbe(u16 a)
  93. {
  94. return a >> 13 & 1;
  95. }
  96. static inline u16 i5100_spddata_busy(u16 a)
  97. {
  98. return a >> 12 & 1;
  99. }
  100. static inline u16 i5100_spddata_data(u16 a)
  101. {
  102. return a & ((1 << 8) - 1);
  103. }
  104. static inline u32 i5100_spdcmd_create(u32 dti, u32 ckovrd, u32 sa, u32 ba,
  105. u32 data, u32 cmd)
  106. {
  107. return ((dti & ((1 << 4) - 1)) << 28) |
  108. ((ckovrd & 1) << 27) |
  109. ((sa & ((1 << 3) - 1)) << 24) |
  110. ((ba & ((1 << 8) - 1)) << 16) |
  111. ((data & ((1 << 8) - 1)) << 8) |
  112. (cmd & 1);
  113. }
  114. static inline u16 i5100_tolm_tolm(u16 a)
  115. {
  116. return a >> 12 & ((1 << 4) - 1);
  117. }
  118. static inline u16 i5100_mir_limit(u16 a)
  119. {
  120. return a >> 4 & ((1 << 12) - 1);
  121. }
  122. static inline u16 i5100_mir_way1(u16 a)
  123. {
  124. return a >> 1 & 1;
  125. }
  126. static inline u16 i5100_mir_way0(u16 a)
  127. {
  128. return a & 1;
  129. }
  130. static inline u32 i5100_ferr_nf_mem_chan_indx(u32 a)
  131. {
  132. return a >> 28 & 1;
  133. }
  134. static inline u32 i5100_ferr_nf_mem_any(u32 a)
  135. {
  136. return a & I5100_FERR_NF_MEM_ANY_MASK;
  137. }
  138. static inline u32 i5100_nerr_nf_mem_any(u32 a)
  139. {
  140. return i5100_ferr_nf_mem_any(a);
  141. }
  142. static inline u32 i5100_dmir_limit(u32 a)
  143. {
  144. return a >> 16 & ((1 << 11) - 1);
  145. }
  146. static inline u32 i5100_dmir_rank(u32 a, u32 i)
  147. {
  148. return a >> (4 * i) & ((1 << 2) - 1);
  149. }
  150. static inline u16 i5100_mtr_present(u16 a)
  151. {
  152. return a >> 10 & 1;
  153. }
  154. static inline u16 i5100_mtr_ethrottle(u16 a)
  155. {
  156. return a >> 9 & 1;
  157. }
  158. static inline u16 i5100_mtr_width(u16 a)
  159. {
  160. return a >> 8 & 1;
  161. }
  162. static inline u16 i5100_mtr_numbank(u16 a)
  163. {
  164. return a >> 6 & 1;
  165. }
  166. static inline u16 i5100_mtr_numrow(u16 a)
  167. {
  168. return a >> 2 & ((1 << 2) - 1);
  169. }
  170. static inline u16 i5100_mtr_numcol(u16 a)
  171. {
  172. return a & ((1 << 2) - 1);
  173. }
  174. static inline u32 i5100_validlog_redmemvalid(u32 a)
  175. {
  176. return a >> 2 & 1;
  177. }
  178. static inline u32 i5100_validlog_recmemvalid(u32 a)
  179. {
  180. return a >> 1 & 1;
  181. }
  182. static inline u32 i5100_validlog_nrecmemvalid(u32 a)
  183. {
  184. return a & 1;
  185. }
  186. static inline u32 i5100_nrecmema_merr(u32 a)
  187. {
  188. return a >> 15 & ((1 << 5) - 1);
  189. }
  190. static inline u32 i5100_nrecmema_bank(u32 a)
  191. {
  192. return a >> 12 & ((1 << 3) - 1);
  193. }
  194. static inline u32 i5100_nrecmema_rank(u32 a)
  195. {
  196. return a >> 8 & ((1 << 3) - 1);
  197. }
  198. static inline u32 i5100_nrecmema_dm_buf_id(u32 a)
  199. {
  200. return a & ((1 << 8) - 1);
  201. }
  202. static inline u32 i5100_nrecmemb_cas(u32 a)
  203. {
  204. return a >> 16 & ((1 << 13) - 1);
  205. }
  206. static inline u32 i5100_nrecmemb_ras(u32 a)
  207. {
  208. return a & ((1 << 16) - 1);
  209. }
  210. static inline u32 i5100_redmemb_ecc_locator(u32 a)
  211. {
  212. return a & ((1 << 18) - 1);
  213. }
  214. static inline u32 i5100_recmema_merr(u32 a)
  215. {
  216. return i5100_nrecmema_merr(a);
  217. }
  218. static inline u32 i5100_recmema_bank(u32 a)
  219. {
  220. return i5100_nrecmema_bank(a);
  221. }
  222. static inline u32 i5100_recmema_rank(u32 a)
  223. {
  224. return i5100_nrecmema_rank(a);
  225. }
  226. static inline u32 i5100_recmema_dm_buf_id(u32 a)
  227. {
  228. return i5100_nrecmema_dm_buf_id(a);
  229. }
  230. static inline u32 i5100_recmemb_cas(u32 a)
  231. {
  232. return i5100_nrecmemb_cas(a);
  233. }
  234. static inline u32 i5100_recmemb_ras(u32 a)
  235. {
  236. return i5100_nrecmemb_ras(a);
  237. }
  238. /* some generic limits */
  239. #define I5100_MAX_RANKS_PER_CHAN 6
  240. #define I5100_CHANNELS 2
  241. #define I5100_MAX_RANKS_PER_DIMM 4
  242. #define I5100_DIMM_ADDR_LINES (6 - 3) /* 64 bits / 8 bits per byte */
  243. #define I5100_MAX_DIMM_SLOTS_PER_CHAN 4
  244. #define I5100_MAX_RANK_INTERLEAVE 4
  245. #define I5100_MAX_DMIRS 5
  246. #define I5100_SCRUB_REFRESH_RATE (5 * 60 * HZ)
  247. struct i5100_priv {
  248. /* ranks on each dimm -- 0 maps to not present -- obtained via SPD */
  249. int dimm_numrank[I5100_CHANNELS][I5100_MAX_DIMM_SLOTS_PER_CHAN];
  250. /*
  251. * mainboard chip select map -- maps i5100 chip selects to
  252. * DIMM slot chip selects. In the case of only 4 ranks per
  253. * channel, the mapping is fairly obvious but not unique.
  254. * we map -1 -> NC and assume both channels use the same
  255. * map...
  256. *
  257. */
  258. int dimm_csmap[I5100_MAX_DIMM_SLOTS_PER_CHAN][I5100_MAX_RANKS_PER_DIMM];
  259. /* memory interleave range */
  260. struct {
  261. u64 limit;
  262. unsigned way[2];
  263. } mir[I5100_CHANNELS];
  264. /* adjusted memory interleave range register */
  265. unsigned amir[I5100_CHANNELS];
  266. /* dimm interleave range */
  267. struct {
  268. unsigned rank[I5100_MAX_RANK_INTERLEAVE];
  269. u64 limit;
  270. } dmir[I5100_CHANNELS][I5100_MAX_DMIRS];
  271. /* memory technology registers... */
  272. struct {
  273. unsigned present; /* 0 or 1 */
  274. unsigned ethrottle; /* 0 or 1 */
  275. unsigned width; /* 4 or 8 bits */
  276. unsigned numbank; /* 2 or 3 lines */
  277. unsigned numrow; /* 13 .. 16 lines */
  278. unsigned numcol; /* 11 .. 12 lines */
  279. } mtr[I5100_CHANNELS][I5100_MAX_RANKS_PER_CHAN];
  280. u64 tolm; /* top of low memory in bytes */
  281. unsigned ranksperchan; /* number of ranks per channel */
  282. struct pci_dev *mc; /* device 16 func 1 */
  283. struct pci_dev *ch0mm; /* device 21 func 0 */
  284. struct pci_dev *ch1mm; /* device 22 func 0 */
  285. struct delayed_work i5100_scrubbing;
  286. int scrub_enable;
  287. };
  288. /* map a rank/chan to a slot number on the mainboard */
  289. static int i5100_rank_to_slot(const struct mem_ctl_info *mci,
  290. int chan, int rank)
  291. {
  292. const struct i5100_priv *priv = mci->pvt_info;
  293. int i;
  294. for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CHAN; i++) {
  295. int j;
  296. const int numrank = priv->dimm_numrank[chan][i];
  297. for (j = 0; j < numrank; j++)
  298. if (priv->dimm_csmap[i][j] == rank)
  299. return i * 2 + chan;
  300. }
  301. return -1;
  302. }
  303. static const char *i5100_err_msg(unsigned err)
  304. {
  305. static const char *merrs[] = {
  306. "unknown", /* 0 */
  307. "uncorrectable data ECC on replay", /* 1 */
  308. "unknown", /* 2 */
  309. "unknown", /* 3 */
  310. "aliased uncorrectable demand data ECC", /* 4 */
  311. "aliased uncorrectable spare-copy data ECC", /* 5 */
  312. "aliased uncorrectable patrol data ECC", /* 6 */
  313. "unknown", /* 7 */
  314. "unknown", /* 8 */
  315. "unknown", /* 9 */
  316. "non-aliased uncorrectable demand data ECC", /* 10 */
  317. "non-aliased uncorrectable spare-copy data ECC", /* 11 */
  318. "non-aliased uncorrectable patrol data ECC", /* 12 */
  319. "unknown", /* 13 */
  320. "correctable demand data ECC", /* 14 */
  321. "correctable spare-copy data ECC", /* 15 */
  322. "correctable patrol data ECC", /* 16 */
  323. "unknown", /* 17 */
  324. "SPD protocol error", /* 18 */
  325. "unknown", /* 19 */
  326. "spare copy initiated", /* 20 */
  327. "spare copy completed", /* 21 */
  328. };
  329. unsigned i;
  330. for (i = 0; i < ARRAY_SIZE(merrs); i++)
  331. if (1 << i & err)
  332. return merrs[i];
  333. return "none";
  334. }
  335. /* convert csrow index into a rank (per channel -- 0..5) */
  336. static int i5100_csrow_to_rank(const struct mem_ctl_info *mci, int csrow)
  337. {
  338. const struct i5100_priv *priv = mci->pvt_info;
  339. return csrow % priv->ranksperchan;
  340. }
  341. /* convert csrow index into a channel (0..1) */
  342. static int i5100_csrow_to_chan(const struct mem_ctl_info *mci, int csrow)
  343. {
  344. const struct i5100_priv *priv = mci->pvt_info;
  345. return csrow / priv->ranksperchan;
  346. }
  347. static unsigned i5100_rank_to_csrow(const struct mem_ctl_info *mci,
  348. int chan, int rank)
  349. {
  350. const struct i5100_priv *priv = mci->pvt_info;
  351. return chan * priv->ranksperchan + rank;
  352. }
  353. static void i5100_handle_ce(struct mem_ctl_info *mci,
  354. int chan,
  355. unsigned bank,
  356. unsigned rank,
  357. unsigned long syndrome,
  358. unsigned cas,
  359. unsigned ras,
  360. const char *msg)
  361. {
  362. const int csrow = i5100_rank_to_csrow(mci, chan, rank);
  363. printk(KERN_ERR
  364. "CE chan %d, bank %u, rank %u, syndrome 0x%lx, "
  365. "cas %u, ras %u, csrow %u, label \"%s\": %s\n",
  366. chan, bank, rank, syndrome, cas, ras,
  367. csrow, mci->csrows[csrow].channels[0].label, msg);
  368. mci->ce_count++;
  369. mci->csrows[csrow].ce_count++;
  370. mci->csrows[csrow].channels[0].ce_count++;
  371. }
  372. static void i5100_handle_ue(struct mem_ctl_info *mci,
  373. int chan,
  374. unsigned bank,
  375. unsigned rank,
  376. unsigned long syndrome,
  377. unsigned cas,
  378. unsigned ras,
  379. const char *msg)
  380. {
  381. const int csrow = i5100_rank_to_csrow(mci, chan, rank);
  382. printk(KERN_ERR
  383. "UE chan %d, bank %u, rank %u, syndrome 0x%lx, "
  384. "cas %u, ras %u, csrow %u, label \"%s\": %s\n",
  385. chan, bank, rank, syndrome, cas, ras,
  386. csrow, mci->csrows[csrow].channels[0].label, msg);
  387. mci->ue_count++;
  388. mci->csrows[csrow].ue_count++;
  389. }
  390. static void i5100_read_log(struct mem_ctl_info *mci, int chan,
  391. u32 ferr, u32 nerr)
  392. {
  393. struct i5100_priv *priv = mci->pvt_info;
  394. struct pci_dev *pdev = (chan) ? priv->ch1mm : priv->ch0mm;
  395. u32 dw;
  396. u32 dw2;
  397. unsigned syndrome = 0;
  398. unsigned ecc_loc = 0;
  399. unsigned merr;
  400. unsigned bank;
  401. unsigned rank;
  402. unsigned cas;
  403. unsigned ras;
  404. pci_read_config_dword(pdev, I5100_VALIDLOG, &dw);
  405. if (i5100_validlog_redmemvalid(dw)) {
  406. pci_read_config_dword(pdev, I5100_REDMEMA, &dw2);
  407. syndrome = dw2;
  408. pci_read_config_dword(pdev, I5100_REDMEMB, &dw2);
  409. ecc_loc = i5100_redmemb_ecc_locator(dw2);
  410. }
  411. if (i5100_validlog_recmemvalid(dw)) {
  412. const char *msg;
  413. pci_read_config_dword(pdev, I5100_RECMEMA, &dw2);
  414. merr = i5100_recmema_merr(dw2);
  415. bank = i5100_recmema_bank(dw2);
  416. rank = i5100_recmema_rank(dw2);
  417. pci_read_config_dword(pdev, I5100_RECMEMB, &dw2);
  418. cas = i5100_recmemb_cas(dw2);
  419. ras = i5100_recmemb_ras(dw2);
  420. /* FIXME: not really sure if this is what merr is...
  421. */
  422. if (!merr)
  423. msg = i5100_err_msg(ferr);
  424. else
  425. msg = i5100_err_msg(nerr);
  426. i5100_handle_ce(mci, chan, bank, rank, syndrome, cas, ras, msg);
  427. }
  428. if (i5100_validlog_nrecmemvalid(dw)) {
  429. const char *msg;
  430. pci_read_config_dword(pdev, I5100_NRECMEMA, &dw2);
  431. merr = i5100_nrecmema_merr(dw2);
  432. bank = i5100_nrecmema_bank(dw2);
  433. rank = i5100_nrecmema_rank(dw2);
  434. pci_read_config_dword(pdev, I5100_NRECMEMB, &dw2);
  435. cas = i5100_nrecmemb_cas(dw2);
  436. ras = i5100_nrecmemb_ras(dw2);
  437. /* FIXME: not really sure if this is what merr is...
  438. */
  439. if (!merr)
  440. msg = i5100_err_msg(ferr);
  441. else
  442. msg = i5100_err_msg(nerr);
  443. i5100_handle_ue(mci, chan, bank, rank, syndrome, cas, ras, msg);
  444. }
  445. pci_write_config_dword(pdev, I5100_VALIDLOG, dw);
  446. }
  447. static void i5100_check_error(struct mem_ctl_info *mci)
  448. {
  449. struct i5100_priv *priv = mci->pvt_info;
  450. u32 dw;
  451. pci_read_config_dword(priv->mc, I5100_FERR_NF_MEM, &dw);
  452. if (i5100_ferr_nf_mem_any(dw)) {
  453. u32 dw2;
  454. pci_read_config_dword(priv->mc, I5100_NERR_NF_MEM, &dw2);
  455. if (dw2)
  456. pci_write_config_dword(priv->mc, I5100_NERR_NF_MEM,
  457. dw2);
  458. pci_write_config_dword(priv->mc, I5100_FERR_NF_MEM, dw);
  459. i5100_read_log(mci, i5100_ferr_nf_mem_chan_indx(dw),
  460. i5100_ferr_nf_mem_any(dw),
  461. i5100_nerr_nf_mem_any(dw2));
  462. }
  463. }
  464. /* The i5100 chipset will scrub the entire memory once, then
  465. * set a done bit. Continuous scrubbing is achieved by enqueing
  466. * delayed work to a workqueue, checking every few minutes if
  467. * the scrubbing has completed and if so reinitiating it.
  468. */
  469. static void i5100_refresh_scrubbing(struct work_struct *work)
  470. {
  471. struct delayed_work *i5100_scrubbing = container_of(work,
  472. struct delayed_work,
  473. work);
  474. struct i5100_priv *priv = container_of(i5100_scrubbing,
  475. struct i5100_priv,
  476. i5100_scrubbing);
  477. u32 dw;
  478. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  479. if (priv->scrub_enable) {
  480. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  481. if (i5100_mc_scrbdone(dw)) {
  482. dw |= I5100_MC_SCRBEN_MASK;
  483. pci_write_config_dword(priv->mc, I5100_MC, dw);
  484. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  485. }
  486. schedule_delayed_work(&(priv->i5100_scrubbing),
  487. I5100_SCRUB_REFRESH_RATE);
  488. }
  489. }
  490. /*
  491. * The bandwidth is based on experimentation, feel free to refine it.
  492. */
  493. static int i5100_set_scrub_rate(struct mem_ctl_info *mci,
  494. u32 *bandwidth)
  495. {
  496. struct i5100_priv *priv = mci->pvt_info;
  497. u32 dw;
  498. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  499. if (*bandwidth) {
  500. priv->scrub_enable = 1;
  501. dw |= I5100_MC_SCRBEN_MASK;
  502. schedule_delayed_work(&(priv->i5100_scrubbing),
  503. I5100_SCRUB_REFRESH_RATE);
  504. } else {
  505. priv->scrub_enable = 0;
  506. dw &= ~I5100_MC_SCRBEN_MASK;
  507. cancel_delayed_work(&(priv->i5100_scrubbing));
  508. }
  509. pci_write_config_dword(priv->mc, I5100_MC, dw);
  510. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  511. *bandwidth = 5900000 * i5100_mc_scrben(dw);
  512. return 0;
  513. }
  514. static int i5100_get_scrub_rate(struct mem_ctl_info *mci,
  515. u32 *bandwidth)
  516. {
  517. struct i5100_priv *priv = mci->pvt_info;
  518. u32 dw;
  519. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  520. *bandwidth = 5900000 * i5100_mc_scrben(dw);
  521. return 0;
  522. }
  523. static struct pci_dev *pci_get_device_func(unsigned vendor,
  524. unsigned device,
  525. unsigned func)
  526. {
  527. struct pci_dev *ret = NULL;
  528. while (1) {
  529. ret = pci_get_device(vendor, device, ret);
  530. if (!ret)
  531. break;
  532. if (PCI_FUNC(ret->devfn) == func)
  533. break;
  534. }
  535. return ret;
  536. }
  537. static unsigned long __devinit i5100_npages(struct mem_ctl_info *mci,
  538. int csrow)
  539. {
  540. struct i5100_priv *priv = mci->pvt_info;
  541. const unsigned chan_rank = i5100_csrow_to_rank(mci, csrow);
  542. const unsigned chan = i5100_csrow_to_chan(mci, csrow);
  543. unsigned addr_lines;
  544. /* dimm present? */
  545. if (!priv->mtr[chan][chan_rank].present)
  546. return 0ULL;
  547. addr_lines =
  548. I5100_DIMM_ADDR_LINES +
  549. priv->mtr[chan][chan_rank].numcol +
  550. priv->mtr[chan][chan_rank].numrow +
  551. priv->mtr[chan][chan_rank].numbank;
  552. return (unsigned long)
  553. ((unsigned long long) (1ULL << addr_lines) / PAGE_SIZE);
  554. }
  555. static void __devinit i5100_init_mtr(struct mem_ctl_info *mci)
  556. {
  557. struct i5100_priv *priv = mci->pvt_info;
  558. struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
  559. int i;
  560. for (i = 0; i < I5100_CHANNELS; i++) {
  561. int j;
  562. struct pci_dev *pdev = mms[i];
  563. for (j = 0; j < I5100_MAX_RANKS_PER_CHAN; j++) {
  564. const unsigned addr =
  565. (j < 4) ? I5100_MTR_0 + j * 2 :
  566. I5100_MTR_4 + (j - 4) * 2;
  567. u16 w;
  568. pci_read_config_word(pdev, addr, &w);
  569. priv->mtr[i][j].present = i5100_mtr_present(w);
  570. priv->mtr[i][j].ethrottle = i5100_mtr_ethrottle(w);
  571. priv->mtr[i][j].width = 4 + 4 * i5100_mtr_width(w);
  572. priv->mtr[i][j].numbank = 2 + i5100_mtr_numbank(w);
  573. priv->mtr[i][j].numrow = 13 + i5100_mtr_numrow(w);
  574. priv->mtr[i][j].numcol = 10 + i5100_mtr_numcol(w);
  575. }
  576. }
  577. }
  578. /*
  579. * FIXME: make this into a real i2c adapter (so that dimm-decode
  580. * will work)?
  581. */
  582. static int i5100_read_spd_byte(const struct mem_ctl_info *mci,
  583. u8 ch, u8 slot, u8 addr, u8 *byte)
  584. {
  585. struct i5100_priv *priv = mci->pvt_info;
  586. u16 w;
  587. unsigned long et;
  588. pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
  589. if (i5100_spddata_busy(w))
  590. return -1;
  591. pci_write_config_dword(priv->mc, I5100_SPDCMD,
  592. i5100_spdcmd_create(0xa, 1, ch * 4 + slot, addr,
  593. 0, 0));
  594. /* wait up to 100ms */
  595. et = jiffies + HZ / 10;
  596. udelay(100);
  597. while (1) {
  598. pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
  599. if (!i5100_spddata_busy(w))
  600. break;
  601. udelay(100);
  602. }
  603. if (!i5100_spddata_rdo(w) || i5100_spddata_sbe(w))
  604. return -1;
  605. *byte = i5100_spddata_data(w);
  606. return 0;
  607. }
  608. /*
  609. * fill dimm chip select map
  610. *
  611. * FIXME:
  612. * o not the only way to may chip selects to dimm slots
  613. * o investigate if there is some way to obtain this map from the bios
  614. */
  615. static void __devinit i5100_init_dimm_csmap(struct mem_ctl_info *mci)
  616. {
  617. struct i5100_priv *priv = mci->pvt_info;
  618. int i;
  619. for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CHAN; i++) {
  620. int j;
  621. for (j = 0; j < I5100_MAX_RANKS_PER_DIMM; j++)
  622. priv->dimm_csmap[i][j] = -1; /* default NC */
  623. }
  624. /* only 2 chip selects per slot... */
  625. if (priv->ranksperchan == 4) {
  626. priv->dimm_csmap[0][0] = 0;
  627. priv->dimm_csmap[0][1] = 3;
  628. priv->dimm_csmap[1][0] = 1;
  629. priv->dimm_csmap[1][1] = 2;
  630. priv->dimm_csmap[2][0] = 2;
  631. priv->dimm_csmap[3][0] = 3;
  632. } else {
  633. priv->dimm_csmap[0][0] = 0;
  634. priv->dimm_csmap[0][1] = 1;
  635. priv->dimm_csmap[1][0] = 2;
  636. priv->dimm_csmap[1][1] = 3;
  637. priv->dimm_csmap[2][0] = 4;
  638. priv->dimm_csmap[2][1] = 5;
  639. }
  640. }
  641. static void __devinit i5100_init_dimm_layout(struct pci_dev *pdev,
  642. struct mem_ctl_info *mci)
  643. {
  644. struct i5100_priv *priv = mci->pvt_info;
  645. int i;
  646. for (i = 0; i < I5100_CHANNELS; i++) {
  647. int j;
  648. for (j = 0; j < I5100_MAX_DIMM_SLOTS_PER_CHAN; j++) {
  649. u8 rank;
  650. if (i5100_read_spd_byte(mci, i, j, 5, &rank) < 0)
  651. priv->dimm_numrank[i][j] = 0;
  652. else
  653. priv->dimm_numrank[i][j] = (rank & 3) + 1;
  654. }
  655. }
  656. i5100_init_dimm_csmap(mci);
  657. }
  658. static void __devinit i5100_init_interleaving(struct pci_dev *pdev,
  659. struct mem_ctl_info *mci)
  660. {
  661. u16 w;
  662. u32 dw;
  663. struct i5100_priv *priv = mci->pvt_info;
  664. struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
  665. int i;
  666. pci_read_config_word(pdev, I5100_TOLM, &w);
  667. priv->tolm = (u64) i5100_tolm_tolm(w) * 256 * 1024 * 1024;
  668. pci_read_config_word(pdev, I5100_MIR0, &w);
  669. priv->mir[0].limit = (u64) i5100_mir_limit(w) << 28;
  670. priv->mir[0].way[1] = i5100_mir_way1(w);
  671. priv->mir[0].way[0] = i5100_mir_way0(w);
  672. pci_read_config_word(pdev, I5100_MIR1, &w);
  673. priv->mir[1].limit = (u64) i5100_mir_limit(w) << 28;
  674. priv->mir[1].way[1] = i5100_mir_way1(w);
  675. priv->mir[1].way[0] = i5100_mir_way0(w);
  676. pci_read_config_word(pdev, I5100_AMIR_0, &w);
  677. priv->amir[0] = w;
  678. pci_read_config_word(pdev, I5100_AMIR_1, &w);
  679. priv->amir[1] = w;
  680. for (i = 0; i < I5100_CHANNELS; i++) {
  681. int j;
  682. for (j = 0; j < 5; j++) {
  683. int k;
  684. pci_read_config_dword(mms[i], I5100_DMIR + j * 4, &dw);
  685. priv->dmir[i][j].limit =
  686. (u64) i5100_dmir_limit(dw) << 28;
  687. for (k = 0; k < I5100_MAX_RANKS_PER_DIMM; k++)
  688. priv->dmir[i][j].rank[k] =
  689. i5100_dmir_rank(dw, k);
  690. }
  691. }
  692. i5100_init_mtr(mci);
  693. }
  694. static void __devinit i5100_init_csrows(struct mem_ctl_info *mci)
  695. {
  696. int i;
  697. unsigned long total_pages = 0UL;
  698. struct i5100_priv *priv = mci->pvt_info;
  699. for (i = 0; i < mci->nr_csrows; i++) {
  700. const unsigned long npages = i5100_npages(mci, i);
  701. const unsigned chan = i5100_csrow_to_chan(mci, i);
  702. const unsigned rank = i5100_csrow_to_rank(mci, i);
  703. if (!npages)
  704. continue;
  705. /*
  706. * FIXME: these two are totally bogus -- I don't see how to
  707. * map them correctly to this structure...
  708. */
  709. mci->csrows[i].first_page = total_pages;
  710. mci->csrows[i].last_page = total_pages + npages - 1;
  711. mci->csrows[i].page_mask = 0UL;
  712. mci->csrows[i].nr_pages = npages;
  713. mci->csrows[i].grain = 32;
  714. mci->csrows[i].csrow_idx = i;
  715. mci->csrows[i].dtype =
  716. (priv->mtr[chan][rank].width == 4) ? DEV_X4 : DEV_X8;
  717. mci->csrows[i].ue_count = 0;
  718. mci->csrows[i].ce_count = 0;
  719. mci->csrows[i].mtype = MEM_RDDR2;
  720. mci->csrows[i].edac_mode = EDAC_SECDED;
  721. mci->csrows[i].mci = mci;
  722. mci->csrows[i].nr_channels = 1;
  723. mci->csrows[i].channels[0].chan_idx = 0;
  724. mci->csrows[i].channels[0].ce_count = 0;
  725. mci->csrows[i].channels[0].csrow = mci->csrows + i;
  726. snprintf(mci->csrows[i].channels[0].label,
  727. sizeof(mci->csrows[i].channels[0].label),
  728. "DIMM%u", i5100_rank_to_slot(mci, chan, rank));
  729. total_pages += npages;
  730. }
  731. }
  732. static int __devinit i5100_init_one(struct pci_dev *pdev,
  733. const struct pci_device_id *id)
  734. {
  735. int rc;
  736. struct mem_ctl_info *mci;
  737. struct i5100_priv *priv;
  738. struct pci_dev *ch0mm, *ch1mm;
  739. int ret = 0;
  740. u32 dw;
  741. int ranksperch;
  742. if (PCI_FUNC(pdev->devfn) != 1)
  743. return -ENODEV;
  744. rc = pci_enable_device(pdev);
  745. if (rc < 0) {
  746. ret = rc;
  747. goto bail;
  748. }
  749. /* ECC enabled? */
  750. pci_read_config_dword(pdev, I5100_MC, &dw);
  751. if (!i5100_mc_errdeten(dw)) {
  752. printk(KERN_INFO "i5100_edac: ECC not enabled.\n");
  753. ret = -ENODEV;
  754. goto bail_pdev;
  755. }
  756. /* figure out how many ranks, from strapped state of 48GB_Mode input */
  757. pci_read_config_dword(pdev, I5100_MS, &dw);
  758. ranksperch = !!(dw & (1 << 8)) * 2 + 4;
  759. /* enable error reporting... */
  760. pci_read_config_dword(pdev, I5100_EMASK_MEM, &dw);
  761. dw &= ~I5100_FERR_NF_MEM_ANY_MASK;
  762. pci_write_config_dword(pdev, I5100_EMASK_MEM, dw);
  763. /* device 21, func 0, Channel 0 Memory Map, Error Flag/Mask, etc... */
  764. ch0mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
  765. PCI_DEVICE_ID_INTEL_5100_21, 0);
  766. if (!ch0mm) {
  767. ret = -ENODEV;
  768. goto bail_pdev;
  769. }
  770. rc = pci_enable_device(ch0mm);
  771. if (rc < 0) {
  772. ret = rc;
  773. goto bail_ch0;
  774. }
  775. /* device 22, func 0, Channel 1 Memory Map, Error Flag/Mask, etc... */
  776. ch1mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
  777. PCI_DEVICE_ID_INTEL_5100_22, 0);
  778. if (!ch1mm) {
  779. ret = -ENODEV;
  780. goto bail_disable_ch0;
  781. }
  782. rc = pci_enable_device(ch1mm);
  783. if (rc < 0) {
  784. ret = rc;
  785. goto bail_ch1;
  786. }
  787. mci = edac_mc_alloc(sizeof(*priv), ranksperch * 2, 1, 0);
  788. if (!mci) {
  789. ret = -ENOMEM;
  790. goto bail_disable_ch1;
  791. }
  792. mci->dev = &pdev->dev;
  793. priv = mci->pvt_info;
  794. priv->ranksperchan = ranksperch;
  795. priv->mc = pdev;
  796. priv->ch0mm = ch0mm;
  797. priv->ch1mm = ch1mm;
  798. INIT_DELAYED_WORK(&(priv->i5100_scrubbing), i5100_refresh_scrubbing);
  799. /* If scrubbing was already enabled by the bios, start maintaining it */
  800. pci_read_config_dword(pdev, I5100_MC, &dw);
  801. if (i5100_mc_scrben(dw)) {
  802. priv->scrub_enable = 1;
  803. schedule_delayed_work(&(priv->i5100_scrubbing),
  804. I5100_SCRUB_REFRESH_RATE);
  805. }
  806. i5100_init_dimm_layout(pdev, mci);
  807. i5100_init_interleaving(pdev, mci);
  808. mci->mtype_cap = MEM_FLAG_FB_DDR2;
  809. mci->edac_ctl_cap = EDAC_FLAG_SECDED;
  810. mci->edac_cap = EDAC_FLAG_SECDED;
  811. mci->mod_name = "i5100_edac.c";
  812. mci->mod_ver = "not versioned";
  813. mci->ctl_name = "i5100";
  814. mci->dev_name = pci_name(pdev);
  815. mci->ctl_page_to_phys = NULL;
  816. mci->edac_check = i5100_check_error;
  817. mci->set_sdram_scrub_rate = i5100_set_scrub_rate;
  818. mci->get_sdram_scrub_rate = i5100_get_scrub_rate;
  819. i5100_init_csrows(mci);
  820. /* this strange construction seems to be in every driver, dunno why */
  821. switch (edac_op_state) {
  822. case EDAC_OPSTATE_POLL:
  823. case EDAC_OPSTATE_NMI:
  824. break;
  825. default:
  826. edac_op_state = EDAC_OPSTATE_POLL;
  827. break;
  828. }
  829. if (edac_mc_add_mc(mci)) {
  830. ret = -ENODEV;
  831. goto bail_scrub;
  832. }
  833. return ret;
  834. bail_scrub:
  835. priv->scrub_enable = 0;
  836. cancel_delayed_work_sync(&(priv->i5100_scrubbing));
  837. edac_mc_free(mci);
  838. bail_disable_ch1:
  839. pci_disable_device(ch1mm);
  840. bail_ch1:
  841. pci_dev_put(ch1mm);
  842. bail_disable_ch0:
  843. pci_disable_device(ch0mm);
  844. bail_ch0:
  845. pci_dev_put(ch0mm);
  846. bail_pdev:
  847. pci_disable_device(pdev);
  848. bail:
  849. return ret;
  850. }
  851. static void __devexit i5100_remove_one(struct pci_dev *pdev)
  852. {
  853. struct mem_ctl_info *mci;
  854. struct i5100_priv *priv;
  855. mci = edac_mc_del_mc(&pdev->dev);
  856. if (!mci)
  857. return;
  858. priv = mci->pvt_info;
  859. priv->scrub_enable = 0;
  860. cancel_delayed_work_sync(&(priv->i5100_scrubbing));
  861. pci_disable_device(pdev);
  862. pci_disable_device(priv->ch0mm);
  863. pci_disable_device(priv->ch1mm);
  864. pci_dev_put(priv->ch0mm);
  865. pci_dev_put(priv->ch1mm);
  866. edac_mc_free(mci);
  867. }
  868. static const struct pci_device_id i5100_pci_tbl[] __devinitdata = {
  869. /* Device 16, Function 0, Channel 0 Memory Map, Error Flag/Mask, ... */
  870. { PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_5100_16) },
  871. { 0, }
  872. };
  873. MODULE_DEVICE_TABLE(pci, i5100_pci_tbl);
  874. static struct pci_driver i5100_driver = {
  875. .name = KBUILD_BASENAME,
  876. .probe = i5100_init_one,
  877. .remove = __devexit_p(i5100_remove_one),
  878. .id_table = i5100_pci_tbl,
  879. };
  880. static int __init i5100_init(void)
  881. {
  882. int pci_rc;
  883. pci_rc = pci_register_driver(&i5100_driver);
  884. return (pci_rc < 0) ? pci_rc : 0;
  885. }
  886. static void __exit i5100_exit(void)
  887. {
  888. pci_unregister_driver(&i5100_driver);
  889. }
  890. module_init(i5100_init);
  891. module_exit(i5100_exit);
  892. MODULE_LICENSE("GPL");
  893. MODULE_AUTHOR
  894. ("Arthur Jones <ajones@riverbed.com>");
  895. MODULE_DESCRIPTION("MC Driver for Intel I5100 memory controllers");