i5100_edac.c 23 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855
  1. /*
  2. * Intel 5100 Memory Controllers kernel module
  3. *
  4. * This file may be distributed under the terms of the
  5. * GNU General Public License.
  6. *
  7. * This module is based on the following document:
  8. *
  9. * Intel 5100X Chipset Memory Controller Hub (MCH) - Datasheet
  10. * http://download.intel.com/design/chipsets/datashts/318378.pdf
  11. *
  12. */
  13. #include <linux/module.h>
  14. #include <linux/init.h>
  15. #include <linux/pci.h>
  16. #include <linux/pci_ids.h>
  17. #include <linux/slab.h>
  18. #include <linux/edac.h>
  19. #include <linux/delay.h>
  20. #include <linux/mmzone.h>
  21. #include "edac_core.h"
  22. /* register addresses and bit field accessors... */
  23. /* device 16, func 1 */
  24. #define I5100_MC 0x40 /* Memory Control Register */
  25. #define I5100_MC_ERRDETEN(a) ((a) >> 5 & 1)
  26. #define I5100_MS 0x44 /* Memory Status Register */
  27. #define I5100_SPDDATA 0x48 /* Serial Presence Detect Status Reg */
  28. #define I5100_SPDDATA_RDO(a) ((a) >> 15 & 1)
  29. #define I5100_SPDDATA_SBE(a) ((a) >> 13 & 1)
  30. #define I5100_SPDDATA_BUSY(a) ((a) >> 12 & 1)
  31. #define I5100_SPDDATA_DATA(a) ((a) & ((1 << 8) - 1))
  32. #define I5100_SPDCMD 0x4c /* Serial Presence Detect Command Reg */
  33. #define I5100_SPDCMD_DTI(a) (((a) & ((1 << 4) - 1)) << 28)
  34. #define I5100_SPDCMD_CKOVRD(a) (((a) & 1) << 27)
  35. #define I5100_SPDCMD_SA(a) (((a) & ((1 << 3) - 1)) << 24)
  36. #define I5100_SPDCMD_BA(a) (((a) & ((1 << 8) - 1)) << 16)
  37. #define I5100_SPDCMD_DATA(a) (((a) & ((1 << 8) - 1)) << 8)
  38. #define I5100_SPDCMD_CMD(a) ((a) & 1)
  39. #define I5100_TOLM 0x6c /* Top of Low Memory */
  40. #define I5100_TOLM_TOLM(a) ((a) >> 12 & ((1 << 4) - 1))
  41. #define I5100_MIR0 0x80 /* Memory Interleave Range 0 */
  42. #define I5100_MIR1 0x84 /* Memory Interleave Range 1 */
  43. #define I5100_AMIR_0 0x8c /* Adjusted Memory Interleave Range 0 */
  44. #define I5100_AMIR_1 0x90 /* Adjusted Memory Interleave Range 1 */
  45. #define I5100_MIR_LIMIT(a) ((a) >> 4 & ((1 << 12) - 1))
  46. #define I5100_MIR_WAY1(a) ((a) >> 1 & 1)
  47. #define I5100_MIR_WAY0(a) ((a) & 1)
  48. #define I5100_FERR_NF_MEM 0xa0 /* MC First Non Fatal Errors */
  49. #define I5100_FERR_NF_MEM_CHAN_INDX(a) ((a) >> 28 & 1)
  50. #define I5100_FERR_NF_MEM_SPD_MASK (1 << 18)
  51. #define I5100_FERR_NF_MEM_M16ERR_MASK (1 << 16)
  52. #define I5100_FERR_NF_MEM_M15ERR_MASK (1 << 15)
  53. #define I5100_FERR_NF_MEM_M14ERR_MASK (1 << 14)
  54. #define I5100_FERR_NF_MEM_M12ERR_MASK (1 << 12)
  55. #define I5100_FERR_NF_MEM_M11ERR_MASK (1 << 11)
  56. #define I5100_FERR_NF_MEM_M10ERR_MASK (1 << 10)
  57. #define I5100_FERR_NF_MEM_M6ERR_MASK (1 << 6)
  58. #define I5100_FERR_NF_MEM_M5ERR_MASK (1 << 5)
  59. #define I5100_FERR_NF_MEM_M4ERR_MASK (1 << 4)
  60. #define I5100_FERR_NF_MEM_M1ERR_MASK 1
  61. #define I5100_FERR_NF_MEM_ANY_MASK \
  62. (I5100_FERR_NF_MEM_M16ERR_MASK | \
  63. I5100_FERR_NF_MEM_M15ERR_MASK | \
  64. I5100_FERR_NF_MEM_M14ERR_MASK | \
  65. I5100_FERR_NF_MEM_M12ERR_MASK | \
  66. I5100_FERR_NF_MEM_M11ERR_MASK | \
  67. I5100_FERR_NF_MEM_M10ERR_MASK | \
  68. I5100_FERR_NF_MEM_M6ERR_MASK | \
  69. I5100_FERR_NF_MEM_M5ERR_MASK | \
  70. I5100_FERR_NF_MEM_M4ERR_MASK | \
  71. I5100_FERR_NF_MEM_M1ERR_MASK)
  72. #define I5100_FERR_NF_MEM_ANY(a) ((a) & I5100_FERR_NF_MEM_ANY_MASK)
  73. #define I5100_NERR_NF_MEM 0xa4 /* MC Next Non-Fatal Errors */
  74. #define I5100_NERR_NF_MEM_ANY(a) I5100_FERR_NF_MEM_ANY(a)
  75. #define I5100_EMASK_MEM 0xa8 /* MC Error Mask Register */
  76. /* device 21 and 22, func 0 */
  77. #define I5100_MTR_0 0x154 /* Memory Technology Registers 0-3 */
  78. #define I5100_DMIR 0x15c /* DIMM Interleave Range */
  79. #define I5100_DMIR_LIMIT(a) ((a) >> 16 & ((1 << 11) - 1))
  80. #define I5100_DMIR_RANK(a, i) ((a) >> (4 * i) & ((1 << 2) - 1))
  81. #define I5100_MTR_4 0x1b0 /* Memory Technology Registers 4,5 */
  82. #define I5100_MTR_PRESENT(a) ((a) >> 10 & 1)
  83. #define I5100_MTR_ETHROTTLE(a) ((a) >> 9 & 1)
  84. #define I5100_MTR_WIDTH(a) ((a) >> 8 & 1)
  85. #define I5100_MTR_NUMBANK(a) ((a) >> 6 & 1)
  86. #define I5100_MTR_NUMROW(a) ((a) >> 2 & ((1 << 2) - 1))
  87. #define I5100_MTR_NUMCOL(a) ((a) & ((1 << 2) - 1))
  88. #define I5100_VALIDLOG 0x18c /* Valid Log Markers */
  89. #define I5100_VALIDLOG_REDMEMVALID(a) ((a) >> 2 & 1)
  90. #define I5100_VALIDLOG_RECMEMVALID(a) ((a) >> 1 & 1)
  91. #define I5100_VALIDLOG_NRECMEMVALID(a) ((a) & 1)
  92. #define I5100_NRECMEMA 0x190 /* Non-Recoverable Memory Error Log Reg A */
  93. #define I5100_NRECMEMA_MERR(a) ((a) >> 15 & ((1 << 5) - 1))
  94. #define I5100_NRECMEMA_BANK(a) ((a) >> 12 & ((1 << 3) - 1))
  95. #define I5100_NRECMEMA_RANK(a) ((a) >> 8 & ((1 << 3) - 1))
  96. #define I5100_NRECMEMA_DM_BUF_ID(a) ((a) & ((1 << 8) - 1))
  97. #define I5100_NRECMEMB 0x194 /* Non-Recoverable Memory Error Log Reg B */
  98. #define I5100_NRECMEMB_CAS(a) ((a) >> 16 & ((1 << 13) - 1))
  99. #define I5100_NRECMEMB_RAS(a) ((a) & ((1 << 16) - 1))
  100. #define I5100_REDMEMA 0x198 /* Recoverable Memory Data Error Log Reg A */
  101. #define I5100_REDMEMA_SYNDROME(a) (a)
  102. #define I5100_REDMEMB 0x19c /* Recoverable Memory Data Error Log Reg B */
  103. #define I5100_REDMEMB_ECC_LOCATOR(a) ((a) & ((1 << 18) - 1))
  104. #define I5100_RECMEMA 0x1a0 /* Recoverable Memory Error Log Reg A */
  105. #define I5100_RECMEMA_MERR(a) I5100_NRECMEMA_MERR(a)
  106. #define I5100_RECMEMA_BANK(a) I5100_NRECMEMA_BANK(a)
  107. #define I5100_RECMEMA_RANK(a) I5100_NRECMEMA_RANK(a)
  108. #define I5100_RECMEMA_DM_BUF_ID(a) I5100_NRECMEMA_DM_BUF_ID(a)
  109. #define I5100_RECMEMB 0x1a4 /* Recoverable Memory Error Log Reg B */
  110. #define I5100_RECMEMB_CAS(a) I5100_NRECMEMB_CAS(a)
  111. #define I5100_RECMEMB_RAS(a) I5100_NRECMEMB_RAS(a)
  112. /* some generic limits */
  113. #define I5100_MAX_RANKS_PER_CTLR 6
  114. #define I5100_MAX_CTLRS 2
  115. #define I5100_MAX_RANKS_PER_DIMM 4
  116. #define I5100_DIMM_ADDR_LINES (6 - 3) /* 64 bits / 8 bits per byte */
  117. #define I5100_MAX_DIMM_SLOTS_PER_CTLR 4
  118. #define I5100_MAX_RANK_INTERLEAVE 4
  119. #define I5100_MAX_DMIRS 5
  120. struct i5100_priv {
  121. /* ranks on each dimm -- 0 maps to not present -- obtained via SPD */
  122. int dimm_numrank[I5100_MAX_CTLRS][I5100_MAX_DIMM_SLOTS_PER_CTLR];
  123. /*
  124. * mainboard chip select map -- maps i5100 chip selects to
  125. * DIMM slot chip selects. In the case of only 4 ranks per
  126. * controller, the mapping is fairly obvious but not unique.
  127. * we map -1 -> NC and assume both controllers use the same
  128. * map...
  129. *
  130. */
  131. int dimm_csmap[I5100_MAX_DIMM_SLOTS_PER_CTLR][I5100_MAX_RANKS_PER_DIMM];
  132. /* memory interleave range */
  133. struct {
  134. u64 limit;
  135. unsigned way[2];
  136. } mir[I5100_MAX_CTLRS];
  137. /* adjusted memory interleave range register */
  138. unsigned amir[I5100_MAX_CTLRS];
  139. /* dimm interleave range */
  140. struct {
  141. unsigned rank[I5100_MAX_RANK_INTERLEAVE];
  142. u64 limit;
  143. } dmir[I5100_MAX_CTLRS][I5100_MAX_DMIRS];
  144. /* memory technology registers... */
  145. struct {
  146. unsigned present; /* 0 or 1 */
  147. unsigned ethrottle; /* 0 or 1 */
  148. unsigned width; /* 4 or 8 bits */
  149. unsigned numbank; /* 2 or 3 lines */
  150. unsigned numrow; /* 13 .. 16 lines */
  151. unsigned numcol; /* 11 .. 12 lines */
  152. } mtr[I5100_MAX_CTLRS][I5100_MAX_RANKS_PER_CTLR];
  153. u64 tolm; /* top of low memory in bytes */
  154. unsigned ranksperctlr; /* number of ranks per controller */
  155. struct pci_dev *mc; /* device 16 func 1 */
  156. struct pci_dev *ch0mm; /* device 21 func 0 */
  157. struct pci_dev *ch1mm; /* device 22 func 0 */
  158. };
  159. /* map a rank/ctlr to a slot number on the mainboard */
  160. static int i5100_rank_to_slot(const struct mem_ctl_info *mci,
  161. int ctlr, int rank)
  162. {
  163. const struct i5100_priv *priv = mci->pvt_info;
  164. int i;
  165. for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CTLR; i++) {
  166. int j;
  167. const int numrank = priv->dimm_numrank[ctlr][i];
  168. for (j = 0; j < numrank; j++)
  169. if (priv->dimm_csmap[i][j] == rank)
  170. return i * 2 + ctlr;
  171. }
  172. return -1;
  173. }
  174. /*
  175. * The processor bus memory addresses are broken into three
  176. * pieces, whereas the controller addresses are contiguous.
  177. *
  178. * here we map from the controller address space to the
  179. * processor address space:
  180. *
  181. * Processor Address Space
  182. * +-----------------------------+
  183. * | |
  184. * | "high" memory addresses |
  185. * | |
  186. * +-----------------------------+ <- 4GB on the i5100
  187. * | |
  188. * | other non-memory addresses |
  189. * | |
  190. * +-----------------------------+ <- top of low memory
  191. * | |
  192. * | "low" memory addresses |
  193. * | |
  194. * +-----------------------------+
  195. */
  196. static unsigned long i5100_ctl_page_to_phys(struct mem_ctl_info *mci,
  197. unsigned long cntlr_addr)
  198. {
  199. const struct i5100_priv *priv = mci->pvt_info;
  200. if (cntlr_addr < priv->tolm)
  201. return cntlr_addr;
  202. return (1ULL << 32) + (cntlr_addr - priv->tolm);
  203. }
  204. static const char *i5100_err_msg(unsigned err)
  205. {
  206. const char *merrs[] = {
  207. "unknown", /* 0 */
  208. "uncorrectable data ECC on replay", /* 1 */
  209. "unknown", /* 2 */
  210. "unknown", /* 3 */
  211. "aliased uncorrectable demand data ECC", /* 4 */
  212. "aliased uncorrectable spare-copy data ECC", /* 5 */
  213. "aliased uncorrectable patrol data ECC", /* 6 */
  214. "unknown", /* 7 */
  215. "unknown", /* 8 */
  216. "unknown", /* 9 */
  217. "non-aliased uncorrectable demand data ECC", /* 10 */
  218. "non-aliased uncorrectable spare-copy data ECC", /* 11 */
  219. "non-aliased uncorrectable patrol data ECC", /* 12 */
  220. "unknown", /* 13 */
  221. "correctable demand data ECC", /* 14 */
  222. "correctable spare-copy data ECC", /* 15 */
  223. "correctable patrol data ECC", /* 16 */
  224. "unknown", /* 17 */
  225. "SPD protocol error", /* 18 */
  226. "unknown", /* 19 */
  227. "spare copy initiated", /* 20 */
  228. "spare copy completed", /* 21 */
  229. };
  230. unsigned i;
  231. for (i = 0; i < ARRAY_SIZE(merrs); i++)
  232. if (1 << i & err)
  233. return merrs[i];
  234. return "none";
  235. }
  236. /* convert csrow index into a rank (per controller -- 0..5) */
  237. static int i5100_csrow_to_rank(const struct mem_ctl_info *mci, int csrow)
  238. {
  239. const struct i5100_priv *priv = mci->pvt_info;
  240. return csrow % priv->ranksperctlr;
  241. }
  242. /* convert csrow index into a controller (0..1) */
  243. static int i5100_csrow_to_cntlr(const struct mem_ctl_info *mci, int csrow)
  244. {
  245. const struct i5100_priv *priv = mci->pvt_info;
  246. return csrow / priv->ranksperctlr;
  247. }
  248. static unsigned i5100_rank_to_csrow(const struct mem_ctl_info *mci,
  249. int ctlr, int rank)
  250. {
  251. const struct i5100_priv *priv = mci->pvt_info;
  252. return ctlr * priv->ranksperctlr + rank;
  253. }
  254. static void i5100_handle_ce(struct mem_ctl_info *mci,
  255. int ctlr,
  256. unsigned bank,
  257. unsigned rank,
  258. unsigned long syndrome,
  259. unsigned cas,
  260. unsigned ras,
  261. const char *msg)
  262. {
  263. const int csrow = i5100_rank_to_csrow(mci, ctlr, rank);
  264. printk(KERN_ERR
  265. "CE ctlr %d, bank %u, rank %u, syndrome 0x%lx, "
  266. "cas %u, ras %u, csrow %u, label \"%s\": %s\n",
  267. ctlr, bank, rank, syndrome, cas, ras,
  268. csrow, mci->csrows[csrow].channels[0].label, msg);
  269. mci->ce_count++;
  270. mci->csrows[csrow].ce_count++;
  271. mci->csrows[csrow].channels[0].ce_count++;
  272. }
  273. static void i5100_handle_ue(struct mem_ctl_info *mci,
  274. int ctlr,
  275. unsigned bank,
  276. unsigned rank,
  277. unsigned long syndrome,
  278. unsigned cas,
  279. unsigned ras,
  280. const char *msg)
  281. {
  282. const int csrow = i5100_rank_to_csrow(mci, ctlr, rank);
  283. printk(KERN_ERR
  284. "UE ctlr %d, bank %u, rank %u, syndrome 0x%lx, "
  285. "cas %u, ras %u, csrow %u, label \"%s\": %s\n",
  286. ctlr, bank, rank, syndrome, cas, ras,
  287. csrow, mci->csrows[csrow].channels[0].label, msg);
  288. mci->ue_count++;
  289. mci->csrows[csrow].ue_count++;
  290. }
  291. static void i5100_read_log(struct mem_ctl_info *mci, int ctlr,
  292. u32 ferr, u32 nerr)
  293. {
  294. struct i5100_priv *priv = mci->pvt_info;
  295. struct pci_dev *pdev = (ctlr) ? priv->ch1mm : priv->ch0mm;
  296. u32 dw;
  297. u32 dw2;
  298. unsigned syndrome = 0;
  299. unsigned ecc_loc = 0;
  300. unsigned merr;
  301. unsigned bank;
  302. unsigned rank;
  303. unsigned cas;
  304. unsigned ras;
  305. pci_read_config_dword(pdev, I5100_VALIDLOG, &dw);
  306. if (I5100_VALIDLOG_REDMEMVALID(dw)) {
  307. pci_read_config_dword(pdev, I5100_REDMEMA, &dw2);
  308. syndrome = I5100_REDMEMA_SYNDROME(dw2);
  309. pci_read_config_dword(pdev, I5100_REDMEMB, &dw2);
  310. ecc_loc = I5100_REDMEMB_ECC_LOCATOR(dw2);
  311. }
  312. if (I5100_VALIDLOG_RECMEMVALID(dw)) {
  313. const char *msg;
  314. pci_read_config_dword(pdev, I5100_RECMEMA, &dw2);
  315. merr = I5100_RECMEMA_MERR(dw2);
  316. bank = I5100_RECMEMA_BANK(dw2);
  317. rank = I5100_RECMEMA_RANK(dw2);
  318. pci_read_config_dword(pdev, I5100_RECMEMB, &dw2);
  319. cas = I5100_RECMEMB_CAS(dw2);
  320. ras = I5100_RECMEMB_RAS(dw2);
  321. /* FIXME: not really sure if this is what merr is...
  322. */
  323. if (!merr)
  324. msg = i5100_err_msg(ferr);
  325. else
  326. msg = i5100_err_msg(nerr);
  327. i5100_handle_ce(mci, ctlr, bank, rank, syndrome, cas, ras, msg);
  328. }
  329. if (I5100_VALIDLOG_NRECMEMVALID(dw)) {
  330. const char *msg;
  331. pci_read_config_dword(pdev, I5100_NRECMEMA, &dw2);
  332. merr = I5100_NRECMEMA_MERR(dw2);
  333. bank = I5100_NRECMEMA_BANK(dw2);
  334. rank = I5100_NRECMEMA_RANK(dw2);
  335. pci_read_config_dword(pdev, I5100_NRECMEMB, &dw2);
  336. cas = I5100_NRECMEMB_CAS(dw2);
  337. ras = I5100_NRECMEMB_RAS(dw2);
  338. /* FIXME: not really sure if this is what merr is...
  339. */
  340. if (!merr)
  341. msg = i5100_err_msg(ferr);
  342. else
  343. msg = i5100_err_msg(nerr);
  344. i5100_handle_ue(mci, ctlr, bank, rank, syndrome, cas, ras, msg);
  345. }
  346. pci_write_config_dword(pdev, I5100_VALIDLOG, dw);
  347. }
  348. static void i5100_check_error(struct mem_ctl_info *mci)
  349. {
  350. struct i5100_priv *priv = mci->pvt_info;
  351. u32 dw;
  352. pci_read_config_dword(priv->mc, I5100_FERR_NF_MEM, &dw);
  353. if (I5100_FERR_NF_MEM_ANY(dw)) {
  354. u32 dw2;
  355. pci_read_config_dword(priv->mc, I5100_NERR_NF_MEM, &dw2);
  356. if (dw2)
  357. pci_write_config_dword(priv->mc, I5100_NERR_NF_MEM,
  358. dw2);
  359. pci_write_config_dword(priv->mc, I5100_FERR_NF_MEM, dw);
  360. i5100_read_log(mci, I5100_FERR_NF_MEM_CHAN_INDX(dw),
  361. I5100_FERR_NF_MEM_ANY(dw),
  362. I5100_NERR_NF_MEM_ANY(dw2));
  363. }
  364. }
  365. static struct pci_dev *pci_get_device_func(unsigned vendor,
  366. unsigned device,
  367. unsigned func)
  368. {
  369. struct pci_dev *ret = NULL;
  370. while (1) {
  371. ret = pci_get_device(vendor, device, ret);
  372. if (!ret)
  373. break;
  374. if (PCI_FUNC(ret->devfn) == func)
  375. break;
  376. }
  377. return ret;
  378. }
  379. static unsigned long __devinit i5100_npages(struct mem_ctl_info *mci,
  380. int csrow)
  381. {
  382. struct i5100_priv *priv = mci->pvt_info;
  383. const unsigned ctlr_rank = i5100_csrow_to_rank(mci, csrow);
  384. const unsigned ctlr = i5100_csrow_to_cntlr(mci, csrow);
  385. unsigned addr_lines;
  386. /* dimm present? */
  387. if (!priv->mtr[ctlr][ctlr_rank].present)
  388. return 0ULL;
  389. addr_lines =
  390. I5100_DIMM_ADDR_LINES +
  391. priv->mtr[ctlr][ctlr_rank].numcol +
  392. priv->mtr[ctlr][ctlr_rank].numrow +
  393. priv->mtr[ctlr][ctlr_rank].numbank;
  394. return (unsigned long)
  395. ((unsigned long long) (1ULL << addr_lines) / PAGE_SIZE);
  396. }
  397. static void __devinit i5100_init_mtr(struct mem_ctl_info *mci)
  398. {
  399. struct i5100_priv *priv = mci->pvt_info;
  400. struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
  401. int i;
  402. for (i = 0; i < I5100_MAX_CTLRS; i++) {
  403. int j;
  404. struct pci_dev *pdev = mms[i];
  405. for (j = 0; j < I5100_MAX_RANKS_PER_CTLR; j++) {
  406. const unsigned addr =
  407. (j < 4) ? I5100_MTR_0 + j * 2 :
  408. I5100_MTR_4 + (j - 4) * 2;
  409. u16 w;
  410. pci_read_config_word(pdev, addr, &w);
  411. priv->mtr[i][j].present = I5100_MTR_PRESENT(w);
  412. priv->mtr[i][j].ethrottle = I5100_MTR_ETHROTTLE(w);
  413. priv->mtr[i][j].width = 4 + 4 * I5100_MTR_WIDTH(w);
  414. priv->mtr[i][j].numbank = 2 + I5100_MTR_NUMBANK(w);
  415. priv->mtr[i][j].numrow = 13 + I5100_MTR_NUMROW(w);
  416. priv->mtr[i][j].numcol = 10 + I5100_MTR_NUMCOL(w);
  417. }
  418. }
  419. }
  420. /*
  421. * FIXME: make this into a real i2c adapter (so that dimm-decode
  422. * will work)?
  423. */
  424. static int i5100_read_spd_byte(const struct mem_ctl_info *mci,
  425. u8 ch, u8 slot, u8 addr, u8 *byte)
  426. {
  427. struct i5100_priv *priv = mci->pvt_info;
  428. u16 w;
  429. u32 dw;
  430. unsigned long et;
  431. pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
  432. if (I5100_SPDDATA_BUSY(w))
  433. return -1;
  434. dw = I5100_SPDCMD_DTI(0xa) |
  435. I5100_SPDCMD_CKOVRD(1) |
  436. I5100_SPDCMD_SA(ch * 4 + slot) |
  437. I5100_SPDCMD_BA(addr) |
  438. I5100_SPDCMD_DATA(0) |
  439. I5100_SPDCMD_CMD(0);
  440. pci_write_config_dword(priv->mc, I5100_SPDCMD, dw);
  441. /* wait up to 100ms */
  442. et = jiffies + HZ / 10;
  443. udelay(100);
  444. while (1) {
  445. pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
  446. if (!I5100_SPDDATA_BUSY(w))
  447. break;
  448. udelay(100);
  449. }
  450. if (!I5100_SPDDATA_RDO(w) || I5100_SPDDATA_SBE(w))
  451. return -1;
  452. *byte = I5100_SPDDATA_DATA(w);
  453. return 0;
  454. }
  455. /*
  456. * fill dimm chip select map
  457. *
  458. * FIXME:
  459. * o only valid for 4 ranks per controller
  460. * o not the only way to may chip selects to dimm slots
  461. * o investigate if there is some way to obtain this map from the bios
  462. */
  463. static void __devinit i5100_init_dimm_csmap(struct mem_ctl_info *mci)
  464. {
  465. struct i5100_priv *priv = mci->pvt_info;
  466. int i;
  467. WARN_ON(priv->ranksperctlr != 4);
  468. for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CTLR; i++) {
  469. int j;
  470. for (j = 0; j < I5100_MAX_RANKS_PER_DIMM; j++)
  471. priv->dimm_csmap[i][j] = -1; /* default NC */
  472. }
  473. /* only 2 chip selects per slot... */
  474. priv->dimm_csmap[0][0] = 0;
  475. priv->dimm_csmap[0][1] = 3;
  476. priv->dimm_csmap[1][0] = 1;
  477. priv->dimm_csmap[1][1] = 2;
  478. priv->dimm_csmap[2][0] = 2;
  479. priv->dimm_csmap[3][0] = 3;
  480. }
  481. static void __devinit i5100_init_dimm_layout(struct pci_dev *pdev,
  482. struct mem_ctl_info *mci)
  483. {
  484. struct i5100_priv *priv = mci->pvt_info;
  485. int i;
  486. for (i = 0; i < I5100_MAX_CTLRS; i++) {
  487. int j;
  488. for (j = 0; j < I5100_MAX_DIMM_SLOTS_PER_CTLR; j++) {
  489. u8 rank;
  490. if (i5100_read_spd_byte(mci, i, j, 5, &rank) < 0)
  491. priv->dimm_numrank[i][j] = 0;
  492. else
  493. priv->dimm_numrank[i][j] = (rank & 3) + 1;
  494. }
  495. }
  496. i5100_init_dimm_csmap(mci);
  497. }
  498. static void __devinit i5100_init_interleaving(struct pci_dev *pdev,
  499. struct mem_ctl_info *mci)
  500. {
  501. u16 w;
  502. u32 dw;
  503. struct i5100_priv *priv = mci->pvt_info;
  504. struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
  505. int i;
  506. pci_read_config_word(pdev, I5100_TOLM, &w);
  507. priv->tolm = (u64) I5100_TOLM_TOLM(w) * 256 * 1024 * 1024;
  508. pci_read_config_word(pdev, I5100_MIR0, &w);
  509. priv->mir[0].limit = (u64) I5100_MIR_LIMIT(w) << 28;
  510. priv->mir[0].way[1] = I5100_MIR_WAY1(w);
  511. priv->mir[0].way[0] = I5100_MIR_WAY0(w);
  512. pci_read_config_word(pdev, I5100_MIR1, &w);
  513. priv->mir[1].limit = (u64) I5100_MIR_LIMIT(w) << 28;
  514. priv->mir[1].way[1] = I5100_MIR_WAY1(w);
  515. priv->mir[1].way[0] = I5100_MIR_WAY0(w);
  516. pci_read_config_word(pdev, I5100_AMIR_0, &w);
  517. priv->amir[0] = w;
  518. pci_read_config_word(pdev, I5100_AMIR_1, &w);
  519. priv->amir[1] = w;
  520. for (i = 0; i < I5100_MAX_CTLRS; i++) {
  521. int j;
  522. for (j = 0; j < 5; j++) {
  523. int k;
  524. pci_read_config_dword(mms[i], I5100_DMIR + j * 4, &dw);
  525. priv->dmir[i][j].limit =
  526. (u64) I5100_DMIR_LIMIT(dw) << 28;
  527. for (k = 0; k < I5100_MAX_RANKS_PER_DIMM; k++)
  528. priv->dmir[i][j].rank[k] =
  529. I5100_DMIR_RANK(dw, k);
  530. }
  531. }
  532. i5100_init_mtr(mci);
  533. }
  534. static void __devinit i5100_init_csrows(struct mem_ctl_info *mci)
  535. {
  536. int i;
  537. unsigned long total_pages = 0UL;
  538. struct i5100_priv *priv = mci->pvt_info;
  539. for (i = 0; i < mci->nr_csrows; i++) {
  540. const unsigned long npages = i5100_npages(mci, i);
  541. const unsigned cntlr = i5100_csrow_to_cntlr(mci, i);
  542. const unsigned rank = i5100_csrow_to_rank(mci, i);
  543. if (!npages)
  544. continue;
  545. /*
  546. * FIXME: these two are totally bogus -- I don't see how to
  547. * map them correctly to this structure...
  548. */
  549. mci->csrows[i].first_page = total_pages;
  550. mci->csrows[i].last_page = total_pages + npages - 1;
  551. mci->csrows[i].page_mask = 0UL;
  552. mci->csrows[i].nr_pages = npages;
  553. mci->csrows[i].grain = 32;
  554. mci->csrows[i].csrow_idx = i;
  555. mci->csrows[i].dtype =
  556. (priv->mtr[cntlr][rank].width == 4) ? DEV_X4 : DEV_X8;
  557. mci->csrows[i].ue_count = 0;
  558. mci->csrows[i].ce_count = 0;
  559. mci->csrows[i].mtype = MEM_RDDR2;
  560. mci->csrows[i].edac_mode = EDAC_SECDED;
  561. mci->csrows[i].mci = mci;
  562. mci->csrows[i].nr_channels = 1;
  563. mci->csrows[i].channels[0].chan_idx = 0;
  564. mci->csrows[i].channels[0].ce_count = 0;
  565. mci->csrows[i].channels[0].csrow = mci->csrows + i;
  566. snprintf(mci->csrows[i].channels[0].label,
  567. sizeof(mci->csrows[i].channels[0].label),
  568. "DIMM%u", i5100_rank_to_slot(mci, cntlr, rank));
  569. total_pages += npages;
  570. }
  571. }
  572. static int __devinit i5100_init_one(struct pci_dev *pdev,
  573. const struct pci_device_id *id)
  574. {
  575. int rc;
  576. struct mem_ctl_info *mci;
  577. struct i5100_priv *priv;
  578. struct pci_dev *ch0mm, *ch1mm;
  579. int ret = 0;
  580. u32 dw;
  581. int ranksperch;
  582. if (PCI_FUNC(pdev->devfn) != 1)
  583. return -ENODEV;
  584. rc = pci_enable_device(pdev);
  585. if (rc < 0) {
  586. ret = rc;
  587. goto bail;
  588. }
  589. /* ECC enabled? */
  590. pci_read_config_dword(pdev, I5100_MC, &dw);
  591. if (!I5100_MC_ERRDETEN(dw)) {
  592. printk(KERN_INFO "i5100_edac: ECC not enabled.\n");
  593. ret = -ENODEV;
  594. goto bail;
  595. }
  596. /* figure out how many ranks, from strapped state of 48GB_Mode input */
  597. pci_read_config_dword(pdev, I5100_MS, &dw);
  598. ranksperch = !!(dw & (1 << 8)) * 2 + 4;
  599. if (ranksperch != 4) {
  600. /* FIXME: get 6 ranks / controller to work - need hw... */
  601. printk(KERN_INFO "i5100_edac: unsupported configuration.\n");
  602. ret = -ENODEV;
  603. goto bail;
  604. }
  605. /* enable error reporting... */
  606. pci_read_config_dword(pdev, I5100_EMASK_MEM, &dw);
  607. dw &= ~I5100_FERR_NF_MEM_ANY_MASK;
  608. pci_write_config_dword(pdev, I5100_EMASK_MEM, dw);
  609. /* device 21, func 0, Channel 0 Memory Map, Error Flag/Mask, etc... */
  610. ch0mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
  611. PCI_DEVICE_ID_INTEL_5100_21, 0);
  612. if (!ch0mm)
  613. return -ENODEV;
  614. rc = pci_enable_device(ch0mm);
  615. if (rc < 0) {
  616. ret = rc;
  617. goto bail_ch0;
  618. }
  619. /* device 22, func 0, Channel 1 Memory Map, Error Flag/Mask, etc... */
  620. ch1mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
  621. PCI_DEVICE_ID_INTEL_5100_22, 0);
  622. if (!ch1mm) {
  623. ret = -ENODEV;
  624. goto bail_ch0;
  625. }
  626. rc = pci_enable_device(ch1mm);
  627. if (rc < 0) {
  628. ret = rc;
  629. goto bail_ch1;
  630. }
  631. mci = edac_mc_alloc(sizeof(*priv), ranksperch * 2, 1, 0);
  632. if (!mci) {
  633. ret = -ENOMEM;
  634. goto bail_ch1;
  635. }
  636. mci->dev = &pdev->dev;
  637. priv = mci->pvt_info;
  638. priv->ranksperctlr = ranksperch;
  639. priv->mc = pdev;
  640. priv->ch0mm = ch0mm;
  641. priv->ch1mm = ch1mm;
  642. i5100_init_dimm_layout(pdev, mci);
  643. i5100_init_interleaving(pdev, mci);
  644. mci->mtype_cap = MEM_FLAG_FB_DDR2;
  645. mci->edac_ctl_cap = EDAC_FLAG_SECDED;
  646. mci->edac_cap = EDAC_FLAG_SECDED;
  647. mci->mod_name = "i5100_edac.c";
  648. mci->mod_ver = "not versioned";
  649. mci->ctl_name = "i5100";
  650. mci->dev_name = pci_name(pdev);
  651. mci->ctl_page_to_phys = i5100_ctl_page_to_phys;
  652. mci->edac_check = i5100_check_error;
  653. i5100_init_csrows(mci);
  654. /* this strange construction seems to be in every driver, dunno why */
  655. switch (edac_op_state) {
  656. case EDAC_OPSTATE_POLL:
  657. case EDAC_OPSTATE_NMI:
  658. break;
  659. default:
  660. edac_op_state = EDAC_OPSTATE_POLL;
  661. break;
  662. }
  663. if (edac_mc_add_mc(mci)) {
  664. ret = -ENODEV;
  665. goto bail_mc;
  666. }
  667. goto bail;
  668. bail_mc:
  669. edac_mc_free(mci);
  670. bail_ch1:
  671. pci_dev_put(ch1mm);
  672. bail_ch0:
  673. pci_dev_put(ch0mm);
  674. bail:
  675. return ret;
  676. }
  677. static void __devexit i5100_remove_one(struct pci_dev *pdev)
  678. {
  679. struct mem_ctl_info *mci;
  680. struct i5100_priv *priv;
  681. mci = edac_mc_del_mc(&pdev->dev);
  682. if (!mci)
  683. return;
  684. priv = mci->pvt_info;
  685. pci_dev_put(priv->ch0mm);
  686. pci_dev_put(priv->ch1mm);
  687. edac_mc_free(mci);
  688. }
  689. static const struct pci_device_id i5100_pci_tbl[] __devinitdata = {
  690. /* Device 16, Function 0, Channel 0 Memory Map, Error Flag/Mask, ... */
  691. { PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_5100_16) },
  692. { 0, }
  693. };
  694. MODULE_DEVICE_TABLE(pci, i5100_pci_tbl);
  695. static struct pci_driver i5100_driver = {
  696. .name = KBUILD_BASENAME,
  697. .probe = i5100_init_one,
  698. .remove = __devexit_p(i5100_remove_one),
  699. .id_table = i5100_pci_tbl,
  700. };
  701. static int __init i5100_init(void)
  702. {
  703. int pci_rc;
  704. pci_rc = pci_register_driver(&i5100_driver);
  705. return (pci_rc < 0) ? pci_rc : 0;
  706. }
  707. static void __exit i5100_exit(void)
  708. {
  709. pci_unregister_driver(&i5100_driver);
  710. }
  711. module_init(i5100_init);
  712. module_exit(i5100_exit);
  713. MODULE_LICENSE("GPL");
  714. MODULE_AUTHOR
  715. ("Arthur Jones <ajones@riverbed.com>");
  716. MODULE_DESCRIPTION("MC Driver for Intel I5100 memory controllers");