i5100_edac.c 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086
  1. /*
  2. * Intel 5100 Memory Controllers kernel module
  3. *
  4. * This file may be distributed under the terms of the
  5. * GNU General Public License.
  6. *
  7. * This module is based on the following document:
  8. *
  9. * Intel 5100X Chipset Memory Controller Hub (MCH) - Datasheet
  10. * http://download.intel.com/design/chipsets/datashts/318378.pdf
  11. *
  12. * The intel 5100 has two independent channels. EDAC core currently
  13. * can not reflect this configuration so instead the chip-select
  14. * rows for each respective channel are laid out one after another,
  15. * the first half belonging to channel 0, the second half belonging
  16. * to channel 1.
  17. */
  18. #include <linux/module.h>
  19. #include <linux/init.h>
  20. #include <linux/pci.h>
  21. #include <linux/pci_ids.h>
  22. #include <linux/edac.h>
  23. #include <linux/delay.h>
  24. #include <linux/mmzone.h>
  25. #include "edac_core.h"
  26. /* register addresses */
  27. /* device 16, func 1 */
  28. #define I5100_MC 0x40 /* Memory Control Register */
  29. #define I5100_MC_SCRBEN_MASK (1 << 7)
  30. #define I5100_MC_SCRBDONE_MASK (1 << 4)
  31. #define I5100_MS 0x44 /* Memory Status Register */
  32. #define I5100_SPDDATA 0x48 /* Serial Presence Detect Status Reg */
  33. #define I5100_SPDCMD 0x4c /* Serial Presence Detect Command Reg */
  34. #define I5100_TOLM 0x6c /* Top of Low Memory */
  35. #define I5100_MIR0 0x80 /* Memory Interleave Range 0 */
  36. #define I5100_MIR1 0x84 /* Memory Interleave Range 1 */
  37. #define I5100_AMIR_0 0x8c /* Adjusted Memory Interleave Range 0 */
  38. #define I5100_AMIR_1 0x90 /* Adjusted Memory Interleave Range 1 */
  39. #define I5100_FERR_NF_MEM 0xa0 /* MC First Non Fatal Errors */
  40. #define I5100_FERR_NF_MEM_M16ERR_MASK (1 << 16)
  41. #define I5100_FERR_NF_MEM_M15ERR_MASK (1 << 15)
  42. #define I5100_FERR_NF_MEM_M14ERR_MASK (1 << 14)
  43. #define I5100_FERR_NF_MEM_M12ERR_MASK (1 << 12)
  44. #define I5100_FERR_NF_MEM_M11ERR_MASK (1 << 11)
  45. #define I5100_FERR_NF_MEM_M10ERR_MASK (1 << 10)
  46. #define I5100_FERR_NF_MEM_M6ERR_MASK (1 << 6)
  47. #define I5100_FERR_NF_MEM_M5ERR_MASK (1 << 5)
  48. #define I5100_FERR_NF_MEM_M4ERR_MASK (1 << 4)
  49. #define I5100_FERR_NF_MEM_M1ERR_MASK (1 << 1)
  50. #define I5100_FERR_NF_MEM_ANY_MASK \
  51. (I5100_FERR_NF_MEM_M16ERR_MASK | \
  52. I5100_FERR_NF_MEM_M15ERR_MASK | \
  53. I5100_FERR_NF_MEM_M14ERR_MASK | \
  54. I5100_FERR_NF_MEM_M12ERR_MASK | \
  55. I5100_FERR_NF_MEM_M11ERR_MASK | \
  56. I5100_FERR_NF_MEM_M10ERR_MASK | \
  57. I5100_FERR_NF_MEM_M6ERR_MASK | \
  58. I5100_FERR_NF_MEM_M5ERR_MASK | \
  59. I5100_FERR_NF_MEM_M4ERR_MASK | \
  60. I5100_FERR_NF_MEM_M1ERR_MASK)
  61. #define I5100_NERR_NF_MEM 0xa4 /* MC Next Non-Fatal Errors */
  62. #define I5100_EMASK_MEM 0xa8 /* MC Error Mask Register */
  63. /* device 21 and 22, func 0 */
  64. #define I5100_MTR_0 0x154 /* Memory Technology Registers 0-3 */
  65. #define I5100_DMIR 0x15c /* DIMM Interleave Range */
  66. #define I5100_VALIDLOG 0x18c /* Valid Log Markers */
  67. #define I5100_NRECMEMA 0x190 /* Non-Recoverable Memory Error Log Reg A */
  68. #define I5100_NRECMEMB 0x194 /* Non-Recoverable Memory Error Log Reg B */
  69. #define I5100_REDMEMA 0x198 /* Recoverable Memory Data Error Log Reg A */
  70. #define I5100_REDMEMB 0x19c /* Recoverable Memory Data Error Log Reg B */
  71. #define I5100_RECMEMA 0x1a0 /* Recoverable Memory Error Log Reg A */
  72. #define I5100_RECMEMB 0x1a4 /* Recoverable Memory Error Log Reg B */
  73. #define I5100_MTR_4 0x1b0 /* Memory Technology Registers 4,5 */
  74. /* bit field accessors */
  75. static inline u32 i5100_mc_scrben(u32 mc)
  76. {
  77. return mc >> 7 & 1;
  78. }
  79. static inline u32 i5100_mc_errdeten(u32 mc)
  80. {
  81. return mc >> 5 & 1;
  82. }
  83. static inline u32 i5100_mc_scrbdone(u32 mc)
  84. {
  85. return mc >> 4 & 1;
  86. }
  87. static inline u16 i5100_spddata_rdo(u16 a)
  88. {
  89. return a >> 15 & 1;
  90. }
  91. static inline u16 i5100_spddata_sbe(u16 a)
  92. {
  93. return a >> 13 & 1;
  94. }
  95. static inline u16 i5100_spddata_busy(u16 a)
  96. {
  97. return a >> 12 & 1;
  98. }
  99. static inline u16 i5100_spddata_data(u16 a)
  100. {
  101. return a & ((1 << 8) - 1);
  102. }
  103. static inline u32 i5100_spdcmd_create(u32 dti, u32 ckovrd, u32 sa, u32 ba,
  104. u32 data, u32 cmd)
  105. {
  106. return ((dti & ((1 << 4) - 1)) << 28) |
  107. ((ckovrd & 1) << 27) |
  108. ((sa & ((1 << 3) - 1)) << 24) |
  109. ((ba & ((1 << 8) - 1)) << 16) |
  110. ((data & ((1 << 8) - 1)) << 8) |
  111. (cmd & 1);
  112. }
  113. static inline u16 i5100_tolm_tolm(u16 a)
  114. {
  115. return a >> 12 & ((1 << 4) - 1);
  116. }
  117. static inline u16 i5100_mir_limit(u16 a)
  118. {
  119. return a >> 4 & ((1 << 12) - 1);
  120. }
  121. static inline u16 i5100_mir_way1(u16 a)
  122. {
  123. return a >> 1 & 1;
  124. }
  125. static inline u16 i5100_mir_way0(u16 a)
  126. {
  127. return a & 1;
  128. }
  129. static inline u32 i5100_ferr_nf_mem_chan_indx(u32 a)
  130. {
  131. return a >> 28 & 1;
  132. }
  133. static inline u32 i5100_ferr_nf_mem_any(u32 a)
  134. {
  135. return a & I5100_FERR_NF_MEM_ANY_MASK;
  136. }
  137. static inline u32 i5100_nerr_nf_mem_any(u32 a)
  138. {
  139. return i5100_ferr_nf_mem_any(a);
  140. }
  141. static inline u32 i5100_dmir_limit(u32 a)
  142. {
  143. return a >> 16 & ((1 << 11) - 1);
  144. }
  145. static inline u32 i5100_dmir_rank(u32 a, u32 i)
  146. {
  147. return a >> (4 * i) & ((1 << 2) - 1);
  148. }
  149. static inline u16 i5100_mtr_present(u16 a)
  150. {
  151. return a >> 10 & 1;
  152. }
  153. static inline u16 i5100_mtr_ethrottle(u16 a)
  154. {
  155. return a >> 9 & 1;
  156. }
  157. static inline u16 i5100_mtr_width(u16 a)
  158. {
  159. return a >> 8 & 1;
  160. }
  161. static inline u16 i5100_mtr_numbank(u16 a)
  162. {
  163. return a >> 6 & 1;
  164. }
  165. static inline u16 i5100_mtr_numrow(u16 a)
  166. {
  167. return a >> 2 & ((1 << 2) - 1);
  168. }
  169. static inline u16 i5100_mtr_numcol(u16 a)
  170. {
  171. return a & ((1 << 2) - 1);
  172. }
  173. static inline u32 i5100_validlog_redmemvalid(u32 a)
  174. {
  175. return a >> 2 & 1;
  176. }
  177. static inline u32 i5100_validlog_recmemvalid(u32 a)
  178. {
  179. return a >> 1 & 1;
  180. }
  181. static inline u32 i5100_validlog_nrecmemvalid(u32 a)
  182. {
  183. return a & 1;
  184. }
  185. static inline u32 i5100_nrecmema_merr(u32 a)
  186. {
  187. return a >> 15 & ((1 << 5) - 1);
  188. }
  189. static inline u32 i5100_nrecmema_bank(u32 a)
  190. {
  191. return a >> 12 & ((1 << 3) - 1);
  192. }
  193. static inline u32 i5100_nrecmema_rank(u32 a)
  194. {
  195. return a >> 8 & ((1 << 3) - 1);
  196. }
  197. static inline u32 i5100_nrecmema_dm_buf_id(u32 a)
  198. {
  199. return a & ((1 << 8) - 1);
  200. }
  201. static inline u32 i5100_nrecmemb_cas(u32 a)
  202. {
  203. return a >> 16 & ((1 << 13) - 1);
  204. }
  205. static inline u32 i5100_nrecmemb_ras(u32 a)
  206. {
  207. return a & ((1 << 16) - 1);
  208. }
  209. static inline u32 i5100_redmemb_ecc_locator(u32 a)
  210. {
  211. return a & ((1 << 18) - 1);
  212. }
  213. static inline u32 i5100_recmema_merr(u32 a)
  214. {
  215. return i5100_nrecmema_merr(a);
  216. }
  217. static inline u32 i5100_recmema_bank(u32 a)
  218. {
  219. return i5100_nrecmema_bank(a);
  220. }
  221. static inline u32 i5100_recmema_rank(u32 a)
  222. {
  223. return i5100_nrecmema_rank(a);
  224. }
  225. static inline u32 i5100_recmema_dm_buf_id(u32 a)
  226. {
  227. return i5100_nrecmema_dm_buf_id(a);
  228. }
  229. static inline u32 i5100_recmemb_cas(u32 a)
  230. {
  231. return i5100_nrecmemb_cas(a);
  232. }
  233. static inline u32 i5100_recmemb_ras(u32 a)
  234. {
  235. return i5100_nrecmemb_ras(a);
  236. }
  237. /* some generic limits */
  238. #define I5100_MAX_RANKS_PER_CHAN 6
  239. #define I5100_CHANNELS 2
  240. #define I5100_MAX_RANKS_PER_DIMM 4
  241. #define I5100_DIMM_ADDR_LINES (6 - 3) /* 64 bits / 8 bits per byte */
  242. #define I5100_MAX_DIMM_SLOTS_PER_CHAN 4
  243. #define I5100_MAX_RANK_INTERLEAVE 4
  244. #define I5100_MAX_DMIRS 5
  245. #define I5100_SCRUB_REFRESH_RATE (5 * 60 * HZ)
  246. struct i5100_priv {
  247. /* ranks on each dimm -- 0 maps to not present -- obtained via SPD */
  248. int dimm_numrank[I5100_CHANNELS][I5100_MAX_DIMM_SLOTS_PER_CHAN];
  249. /*
  250. * mainboard chip select map -- maps i5100 chip selects to
  251. * DIMM slot chip selects. In the case of only 4 ranks per
  252. * channel, the mapping is fairly obvious but not unique.
  253. * we map -1 -> NC and assume both channels use the same
  254. * map...
  255. *
  256. */
  257. int dimm_csmap[I5100_MAX_DIMM_SLOTS_PER_CHAN][I5100_MAX_RANKS_PER_DIMM];
  258. /* memory interleave range */
  259. struct {
  260. u64 limit;
  261. unsigned way[2];
  262. } mir[I5100_CHANNELS];
  263. /* adjusted memory interleave range register */
  264. unsigned amir[I5100_CHANNELS];
  265. /* dimm interleave range */
  266. struct {
  267. unsigned rank[I5100_MAX_RANK_INTERLEAVE];
  268. u64 limit;
  269. } dmir[I5100_CHANNELS][I5100_MAX_DMIRS];
  270. /* memory technology registers... */
  271. struct {
  272. unsigned present; /* 0 or 1 */
  273. unsigned ethrottle; /* 0 or 1 */
  274. unsigned width; /* 4 or 8 bits */
  275. unsigned numbank; /* 2 or 3 lines */
  276. unsigned numrow; /* 13 .. 16 lines */
  277. unsigned numcol; /* 11 .. 12 lines */
  278. } mtr[I5100_CHANNELS][I5100_MAX_RANKS_PER_CHAN];
  279. u64 tolm; /* top of low memory in bytes */
  280. unsigned ranksperchan; /* number of ranks per channel */
  281. struct pci_dev *mc; /* device 16 func 1 */
  282. struct pci_dev *ch0mm; /* device 21 func 0 */
  283. struct pci_dev *ch1mm; /* device 22 func 0 */
  284. struct delayed_work i5100_scrubbing;
  285. int scrub_enable;
  286. };
  287. /* map a rank/chan to a slot number on the mainboard */
  288. static int i5100_rank_to_slot(const struct mem_ctl_info *mci,
  289. int chan, int rank)
  290. {
  291. const struct i5100_priv *priv = mci->pvt_info;
  292. int i;
  293. for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CHAN; i++) {
  294. int j;
  295. const int numrank = priv->dimm_numrank[chan][i];
  296. for (j = 0; j < numrank; j++)
  297. if (priv->dimm_csmap[i][j] == rank)
  298. return i * 2 + chan;
  299. }
  300. return -1;
  301. }
  302. static const char *i5100_err_msg(unsigned err)
  303. {
  304. static const char *merrs[] = {
  305. "unknown", /* 0 */
  306. "uncorrectable data ECC on replay", /* 1 */
  307. "unknown", /* 2 */
  308. "unknown", /* 3 */
  309. "aliased uncorrectable demand data ECC", /* 4 */
  310. "aliased uncorrectable spare-copy data ECC", /* 5 */
  311. "aliased uncorrectable patrol data ECC", /* 6 */
  312. "unknown", /* 7 */
  313. "unknown", /* 8 */
  314. "unknown", /* 9 */
  315. "non-aliased uncorrectable demand data ECC", /* 10 */
  316. "non-aliased uncorrectable spare-copy data ECC", /* 11 */
  317. "non-aliased uncorrectable patrol data ECC", /* 12 */
  318. "unknown", /* 13 */
  319. "correctable demand data ECC", /* 14 */
  320. "correctable spare-copy data ECC", /* 15 */
  321. "correctable patrol data ECC", /* 16 */
  322. "unknown", /* 17 */
  323. "SPD protocol error", /* 18 */
  324. "unknown", /* 19 */
  325. "spare copy initiated", /* 20 */
  326. "spare copy completed", /* 21 */
  327. };
  328. unsigned i;
  329. for (i = 0; i < ARRAY_SIZE(merrs); i++)
  330. if (1 << i & err)
  331. return merrs[i];
  332. return "none";
  333. }
  334. /* convert csrow index into a rank (per channel -- 0..5) */
  335. static int i5100_csrow_to_rank(const struct mem_ctl_info *mci, int csrow)
  336. {
  337. const struct i5100_priv *priv = mci->pvt_info;
  338. return csrow % priv->ranksperchan;
  339. }
  340. /* convert csrow index into a channel (0..1) */
  341. static int i5100_csrow_to_chan(const struct mem_ctl_info *mci, int csrow)
  342. {
  343. const struct i5100_priv *priv = mci->pvt_info;
  344. return csrow / priv->ranksperchan;
  345. }
  346. static unsigned i5100_rank_to_csrow(const struct mem_ctl_info *mci,
  347. int chan, int rank)
  348. {
  349. const struct i5100_priv *priv = mci->pvt_info;
  350. return chan * priv->ranksperchan + rank;
  351. }
  352. static void i5100_handle_ce(struct mem_ctl_info *mci,
  353. int chan,
  354. unsigned bank,
  355. unsigned rank,
  356. unsigned long syndrome,
  357. unsigned cas,
  358. unsigned ras,
  359. const char *msg)
  360. {
  361. const int csrow = i5100_rank_to_csrow(mci, chan, rank);
  362. printk(KERN_ERR
  363. "CE chan %d, bank %u, rank %u, syndrome 0x%lx, "
  364. "cas %u, ras %u, csrow %u, label \"%s\": %s\n",
  365. chan, bank, rank, syndrome, cas, ras,
  366. csrow, mci->csrows[csrow].channels[0].label, msg);
  367. mci->ce_count++;
  368. mci->csrows[csrow].ce_count++;
  369. mci->csrows[csrow].channels[0].ce_count++;
  370. }
  371. static void i5100_handle_ue(struct mem_ctl_info *mci,
  372. int chan,
  373. unsigned bank,
  374. unsigned rank,
  375. unsigned long syndrome,
  376. unsigned cas,
  377. unsigned ras,
  378. const char *msg)
  379. {
  380. const int csrow = i5100_rank_to_csrow(mci, chan, rank);
  381. printk(KERN_ERR
  382. "UE chan %d, bank %u, rank %u, syndrome 0x%lx, "
  383. "cas %u, ras %u, csrow %u, label \"%s\": %s\n",
  384. chan, bank, rank, syndrome, cas, ras,
  385. csrow, mci->csrows[csrow].channels[0].label, msg);
  386. mci->ue_count++;
  387. mci->csrows[csrow].ue_count++;
  388. }
  389. static void i5100_read_log(struct mem_ctl_info *mci, int chan,
  390. u32 ferr, u32 nerr)
  391. {
  392. struct i5100_priv *priv = mci->pvt_info;
  393. struct pci_dev *pdev = (chan) ? priv->ch1mm : priv->ch0mm;
  394. u32 dw;
  395. u32 dw2;
  396. unsigned syndrome = 0;
  397. unsigned ecc_loc = 0;
  398. unsigned merr;
  399. unsigned bank;
  400. unsigned rank;
  401. unsigned cas;
  402. unsigned ras;
  403. pci_read_config_dword(pdev, I5100_VALIDLOG, &dw);
  404. if (i5100_validlog_redmemvalid(dw)) {
  405. pci_read_config_dword(pdev, I5100_REDMEMA, &dw2);
  406. syndrome = dw2;
  407. pci_read_config_dword(pdev, I5100_REDMEMB, &dw2);
  408. ecc_loc = i5100_redmemb_ecc_locator(dw2);
  409. }
  410. if (i5100_validlog_recmemvalid(dw)) {
  411. const char *msg;
  412. pci_read_config_dword(pdev, I5100_RECMEMA, &dw2);
  413. merr = i5100_recmema_merr(dw2);
  414. bank = i5100_recmema_bank(dw2);
  415. rank = i5100_recmema_rank(dw2);
  416. pci_read_config_dword(pdev, I5100_RECMEMB, &dw2);
  417. cas = i5100_recmemb_cas(dw2);
  418. ras = i5100_recmemb_ras(dw2);
  419. /* FIXME: not really sure if this is what merr is...
  420. */
  421. if (!merr)
  422. msg = i5100_err_msg(ferr);
  423. else
  424. msg = i5100_err_msg(nerr);
  425. i5100_handle_ce(mci, chan, bank, rank, syndrome, cas, ras, msg);
  426. }
  427. if (i5100_validlog_nrecmemvalid(dw)) {
  428. const char *msg;
  429. pci_read_config_dword(pdev, I5100_NRECMEMA, &dw2);
  430. merr = i5100_nrecmema_merr(dw2);
  431. bank = i5100_nrecmema_bank(dw2);
  432. rank = i5100_nrecmema_rank(dw2);
  433. pci_read_config_dword(pdev, I5100_NRECMEMB, &dw2);
  434. cas = i5100_nrecmemb_cas(dw2);
  435. ras = i5100_nrecmemb_ras(dw2);
  436. /* FIXME: not really sure if this is what merr is...
  437. */
  438. if (!merr)
  439. msg = i5100_err_msg(ferr);
  440. else
  441. msg = i5100_err_msg(nerr);
  442. i5100_handle_ue(mci, chan, bank, rank, syndrome, cas, ras, msg);
  443. }
  444. pci_write_config_dword(pdev, I5100_VALIDLOG, dw);
  445. }
  446. static void i5100_check_error(struct mem_ctl_info *mci)
  447. {
  448. struct i5100_priv *priv = mci->pvt_info;
  449. u32 dw, dw2;
  450. pci_read_config_dword(priv->mc, I5100_FERR_NF_MEM, &dw);
  451. if (i5100_ferr_nf_mem_any(dw)) {
  452. pci_read_config_dword(priv->mc, I5100_NERR_NF_MEM, &dw2);
  453. i5100_read_log(mci, i5100_ferr_nf_mem_chan_indx(dw),
  454. i5100_ferr_nf_mem_any(dw),
  455. i5100_nerr_nf_mem_any(dw2));
  456. pci_write_config_dword(priv->mc, I5100_NERR_NF_MEM, dw2);
  457. }
  458. pci_write_config_dword(priv->mc, I5100_FERR_NF_MEM, dw);
  459. }
  460. /* The i5100 chipset will scrub the entire memory once, then
  461. * set a done bit. Continuous scrubbing is achieved by enqueing
  462. * delayed work to a workqueue, checking every few minutes if
  463. * the scrubbing has completed and if so reinitiating it.
  464. */
  465. static void i5100_refresh_scrubbing(struct work_struct *work)
  466. {
  467. struct delayed_work *i5100_scrubbing = container_of(work,
  468. struct delayed_work,
  469. work);
  470. struct i5100_priv *priv = container_of(i5100_scrubbing,
  471. struct i5100_priv,
  472. i5100_scrubbing);
  473. u32 dw;
  474. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  475. if (priv->scrub_enable) {
  476. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  477. if (i5100_mc_scrbdone(dw)) {
  478. dw |= I5100_MC_SCRBEN_MASK;
  479. pci_write_config_dword(priv->mc, I5100_MC, dw);
  480. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  481. }
  482. schedule_delayed_work(&(priv->i5100_scrubbing),
  483. I5100_SCRUB_REFRESH_RATE);
  484. }
  485. }
  486. /*
  487. * The bandwidth is based on experimentation, feel free to refine it.
  488. */
  489. static int i5100_set_scrub_rate(struct mem_ctl_info *mci, u32 bandwidth)
  490. {
  491. struct i5100_priv *priv = mci->pvt_info;
  492. u32 dw;
  493. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  494. if (bandwidth) {
  495. priv->scrub_enable = 1;
  496. dw |= I5100_MC_SCRBEN_MASK;
  497. schedule_delayed_work(&(priv->i5100_scrubbing),
  498. I5100_SCRUB_REFRESH_RATE);
  499. } else {
  500. priv->scrub_enable = 0;
  501. dw &= ~I5100_MC_SCRBEN_MASK;
  502. cancel_delayed_work(&(priv->i5100_scrubbing));
  503. }
  504. pci_write_config_dword(priv->mc, I5100_MC, dw);
  505. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  506. bandwidth = 5900000 * i5100_mc_scrben(dw);
  507. return bandwidth;
  508. }
  509. static int i5100_get_scrub_rate(struct mem_ctl_info *mci)
  510. {
  511. struct i5100_priv *priv = mci->pvt_info;
  512. u32 dw;
  513. pci_read_config_dword(priv->mc, I5100_MC, &dw);
  514. return 5900000 * i5100_mc_scrben(dw);
  515. }
  516. static struct pci_dev *pci_get_device_func(unsigned vendor,
  517. unsigned device,
  518. unsigned func)
  519. {
  520. struct pci_dev *ret = NULL;
  521. while (1) {
  522. ret = pci_get_device(vendor, device, ret);
  523. if (!ret)
  524. break;
  525. if (PCI_FUNC(ret->devfn) == func)
  526. break;
  527. }
  528. return ret;
  529. }
  530. static unsigned long __devinit i5100_npages(struct mem_ctl_info *mci,
  531. int csrow)
  532. {
  533. struct i5100_priv *priv = mci->pvt_info;
  534. const unsigned chan_rank = i5100_csrow_to_rank(mci, csrow);
  535. const unsigned chan = i5100_csrow_to_chan(mci, csrow);
  536. unsigned addr_lines;
  537. /* dimm present? */
  538. if (!priv->mtr[chan][chan_rank].present)
  539. return 0ULL;
  540. addr_lines =
  541. I5100_DIMM_ADDR_LINES +
  542. priv->mtr[chan][chan_rank].numcol +
  543. priv->mtr[chan][chan_rank].numrow +
  544. priv->mtr[chan][chan_rank].numbank;
  545. return (unsigned long)
  546. ((unsigned long long) (1ULL << addr_lines) / PAGE_SIZE);
  547. }
  548. static void __devinit i5100_init_mtr(struct mem_ctl_info *mci)
  549. {
  550. struct i5100_priv *priv = mci->pvt_info;
  551. struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
  552. int i;
  553. for (i = 0; i < I5100_CHANNELS; i++) {
  554. int j;
  555. struct pci_dev *pdev = mms[i];
  556. for (j = 0; j < I5100_MAX_RANKS_PER_CHAN; j++) {
  557. const unsigned addr =
  558. (j < 4) ? I5100_MTR_0 + j * 2 :
  559. I5100_MTR_4 + (j - 4) * 2;
  560. u16 w;
  561. pci_read_config_word(pdev, addr, &w);
  562. priv->mtr[i][j].present = i5100_mtr_present(w);
  563. priv->mtr[i][j].ethrottle = i5100_mtr_ethrottle(w);
  564. priv->mtr[i][j].width = 4 + 4 * i5100_mtr_width(w);
  565. priv->mtr[i][j].numbank = 2 + i5100_mtr_numbank(w);
  566. priv->mtr[i][j].numrow = 13 + i5100_mtr_numrow(w);
  567. priv->mtr[i][j].numcol = 10 + i5100_mtr_numcol(w);
  568. }
  569. }
  570. }
  571. /*
  572. * FIXME: make this into a real i2c adapter (so that dimm-decode
  573. * will work)?
  574. */
  575. static int i5100_read_spd_byte(const struct mem_ctl_info *mci,
  576. u8 ch, u8 slot, u8 addr, u8 *byte)
  577. {
  578. struct i5100_priv *priv = mci->pvt_info;
  579. u16 w;
  580. unsigned long et;
  581. pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
  582. if (i5100_spddata_busy(w))
  583. return -1;
  584. pci_write_config_dword(priv->mc, I5100_SPDCMD,
  585. i5100_spdcmd_create(0xa, 1, ch * 4 + slot, addr,
  586. 0, 0));
  587. /* wait up to 100ms */
  588. et = jiffies + HZ / 10;
  589. udelay(100);
  590. while (1) {
  591. pci_read_config_word(priv->mc, I5100_SPDDATA, &w);
  592. if (!i5100_spddata_busy(w))
  593. break;
  594. udelay(100);
  595. }
  596. if (!i5100_spddata_rdo(w) || i5100_spddata_sbe(w))
  597. return -1;
  598. *byte = i5100_spddata_data(w);
  599. return 0;
  600. }
  601. /*
  602. * fill dimm chip select map
  603. *
  604. * FIXME:
  605. * o not the only way to may chip selects to dimm slots
  606. * o investigate if there is some way to obtain this map from the bios
  607. */
  608. static void __devinit i5100_init_dimm_csmap(struct mem_ctl_info *mci)
  609. {
  610. struct i5100_priv *priv = mci->pvt_info;
  611. int i;
  612. for (i = 0; i < I5100_MAX_DIMM_SLOTS_PER_CHAN; i++) {
  613. int j;
  614. for (j = 0; j < I5100_MAX_RANKS_PER_DIMM; j++)
  615. priv->dimm_csmap[i][j] = -1; /* default NC */
  616. }
  617. /* only 2 chip selects per slot... */
  618. if (priv->ranksperchan == 4) {
  619. priv->dimm_csmap[0][0] = 0;
  620. priv->dimm_csmap[0][1] = 3;
  621. priv->dimm_csmap[1][0] = 1;
  622. priv->dimm_csmap[1][1] = 2;
  623. priv->dimm_csmap[2][0] = 2;
  624. priv->dimm_csmap[3][0] = 3;
  625. } else {
  626. priv->dimm_csmap[0][0] = 0;
  627. priv->dimm_csmap[0][1] = 1;
  628. priv->dimm_csmap[1][0] = 2;
  629. priv->dimm_csmap[1][1] = 3;
  630. priv->dimm_csmap[2][0] = 4;
  631. priv->dimm_csmap[2][1] = 5;
  632. }
  633. }
  634. static void __devinit i5100_init_dimm_layout(struct pci_dev *pdev,
  635. struct mem_ctl_info *mci)
  636. {
  637. struct i5100_priv *priv = mci->pvt_info;
  638. int i;
  639. for (i = 0; i < I5100_CHANNELS; i++) {
  640. int j;
  641. for (j = 0; j < I5100_MAX_DIMM_SLOTS_PER_CHAN; j++) {
  642. u8 rank;
  643. if (i5100_read_spd_byte(mci, i, j, 5, &rank) < 0)
  644. priv->dimm_numrank[i][j] = 0;
  645. else
  646. priv->dimm_numrank[i][j] = (rank & 3) + 1;
  647. }
  648. }
  649. i5100_init_dimm_csmap(mci);
  650. }
  651. static void __devinit i5100_init_interleaving(struct pci_dev *pdev,
  652. struct mem_ctl_info *mci)
  653. {
  654. u16 w;
  655. u32 dw;
  656. struct i5100_priv *priv = mci->pvt_info;
  657. struct pci_dev *mms[2] = { priv->ch0mm, priv->ch1mm };
  658. int i;
  659. pci_read_config_word(pdev, I5100_TOLM, &w);
  660. priv->tolm = (u64) i5100_tolm_tolm(w) * 256 * 1024 * 1024;
  661. pci_read_config_word(pdev, I5100_MIR0, &w);
  662. priv->mir[0].limit = (u64) i5100_mir_limit(w) << 28;
  663. priv->mir[0].way[1] = i5100_mir_way1(w);
  664. priv->mir[0].way[0] = i5100_mir_way0(w);
  665. pci_read_config_word(pdev, I5100_MIR1, &w);
  666. priv->mir[1].limit = (u64) i5100_mir_limit(w) << 28;
  667. priv->mir[1].way[1] = i5100_mir_way1(w);
  668. priv->mir[1].way[0] = i5100_mir_way0(w);
  669. pci_read_config_word(pdev, I5100_AMIR_0, &w);
  670. priv->amir[0] = w;
  671. pci_read_config_word(pdev, I5100_AMIR_1, &w);
  672. priv->amir[1] = w;
  673. for (i = 0; i < I5100_CHANNELS; i++) {
  674. int j;
  675. for (j = 0; j < 5; j++) {
  676. int k;
  677. pci_read_config_dword(mms[i], I5100_DMIR + j * 4, &dw);
  678. priv->dmir[i][j].limit =
  679. (u64) i5100_dmir_limit(dw) << 28;
  680. for (k = 0; k < I5100_MAX_RANKS_PER_DIMM; k++)
  681. priv->dmir[i][j].rank[k] =
  682. i5100_dmir_rank(dw, k);
  683. }
  684. }
  685. i5100_init_mtr(mci);
  686. }
  687. static void __devinit i5100_init_csrows(struct mem_ctl_info *mci)
  688. {
  689. int i;
  690. unsigned long total_pages = 0UL;
  691. struct i5100_priv *priv = mci->pvt_info;
  692. for (i = 0; i < mci->nr_csrows; i++) {
  693. const unsigned long npages = i5100_npages(mci, i);
  694. const unsigned chan = i5100_csrow_to_chan(mci, i);
  695. const unsigned rank = i5100_csrow_to_rank(mci, i);
  696. if (!npages)
  697. continue;
  698. /*
  699. * FIXME: these two are totally bogus -- I don't see how to
  700. * map them correctly to this structure...
  701. */
  702. mci->csrows[i].first_page = total_pages;
  703. mci->csrows[i].last_page = total_pages + npages - 1;
  704. mci->csrows[i].page_mask = 0UL;
  705. mci->csrows[i].nr_pages = npages;
  706. mci->csrows[i].grain = 32;
  707. mci->csrows[i].csrow_idx = i;
  708. mci->csrows[i].dtype =
  709. (priv->mtr[chan][rank].width == 4) ? DEV_X4 : DEV_X8;
  710. mci->csrows[i].ue_count = 0;
  711. mci->csrows[i].ce_count = 0;
  712. mci->csrows[i].mtype = MEM_RDDR2;
  713. mci->csrows[i].edac_mode = EDAC_SECDED;
  714. mci->csrows[i].mci = mci;
  715. mci->csrows[i].nr_channels = 1;
  716. mci->csrows[i].channels[0].chan_idx = 0;
  717. mci->csrows[i].channels[0].ce_count = 0;
  718. mci->csrows[i].channels[0].csrow = mci->csrows + i;
  719. snprintf(mci->csrows[i].channels[0].label,
  720. sizeof(mci->csrows[i].channels[0].label),
  721. "DIMM%u", i5100_rank_to_slot(mci, chan, rank));
  722. total_pages += npages;
  723. }
  724. }
  725. static int __devinit i5100_init_one(struct pci_dev *pdev,
  726. const struct pci_device_id *id)
  727. {
  728. int rc;
  729. struct mem_ctl_info *mci;
  730. struct i5100_priv *priv;
  731. struct pci_dev *ch0mm, *ch1mm;
  732. int ret = 0;
  733. u32 dw;
  734. int ranksperch;
  735. if (PCI_FUNC(pdev->devfn) != 1)
  736. return -ENODEV;
  737. rc = pci_enable_device(pdev);
  738. if (rc < 0) {
  739. ret = rc;
  740. goto bail;
  741. }
  742. /* ECC enabled? */
  743. pci_read_config_dword(pdev, I5100_MC, &dw);
  744. if (!i5100_mc_errdeten(dw)) {
  745. printk(KERN_INFO "i5100_edac: ECC not enabled.\n");
  746. ret = -ENODEV;
  747. goto bail_pdev;
  748. }
  749. /* figure out how many ranks, from strapped state of 48GB_Mode input */
  750. pci_read_config_dword(pdev, I5100_MS, &dw);
  751. ranksperch = !!(dw & (1 << 8)) * 2 + 4;
  752. /* enable error reporting... */
  753. pci_read_config_dword(pdev, I5100_EMASK_MEM, &dw);
  754. dw &= ~I5100_FERR_NF_MEM_ANY_MASK;
  755. pci_write_config_dword(pdev, I5100_EMASK_MEM, dw);
  756. /* device 21, func 0, Channel 0 Memory Map, Error Flag/Mask, etc... */
  757. ch0mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
  758. PCI_DEVICE_ID_INTEL_5100_21, 0);
  759. if (!ch0mm) {
  760. ret = -ENODEV;
  761. goto bail_pdev;
  762. }
  763. rc = pci_enable_device(ch0mm);
  764. if (rc < 0) {
  765. ret = rc;
  766. goto bail_ch0;
  767. }
  768. /* device 22, func 0, Channel 1 Memory Map, Error Flag/Mask, etc... */
  769. ch1mm = pci_get_device_func(PCI_VENDOR_ID_INTEL,
  770. PCI_DEVICE_ID_INTEL_5100_22, 0);
  771. if (!ch1mm) {
  772. ret = -ENODEV;
  773. goto bail_disable_ch0;
  774. }
  775. rc = pci_enable_device(ch1mm);
  776. if (rc < 0) {
  777. ret = rc;
  778. goto bail_ch1;
  779. }
  780. mci = edac_mc_alloc(sizeof(*priv), ranksperch * 2, 1, 0);
  781. if (!mci) {
  782. ret = -ENOMEM;
  783. goto bail_disable_ch1;
  784. }
  785. mci->dev = &pdev->dev;
  786. priv = mci->pvt_info;
  787. priv->ranksperchan = ranksperch;
  788. priv->mc = pdev;
  789. priv->ch0mm = ch0mm;
  790. priv->ch1mm = ch1mm;
  791. INIT_DELAYED_WORK(&(priv->i5100_scrubbing), i5100_refresh_scrubbing);
  792. /* If scrubbing was already enabled by the bios, start maintaining it */
  793. pci_read_config_dword(pdev, I5100_MC, &dw);
  794. if (i5100_mc_scrben(dw)) {
  795. priv->scrub_enable = 1;
  796. schedule_delayed_work(&(priv->i5100_scrubbing),
  797. I5100_SCRUB_REFRESH_RATE);
  798. }
  799. i5100_init_dimm_layout(pdev, mci);
  800. i5100_init_interleaving(pdev, mci);
  801. mci->mtype_cap = MEM_FLAG_FB_DDR2;
  802. mci->edac_ctl_cap = EDAC_FLAG_SECDED;
  803. mci->edac_cap = EDAC_FLAG_SECDED;
  804. mci->mod_name = "i5100_edac.c";
  805. mci->mod_ver = "not versioned";
  806. mci->ctl_name = "i5100";
  807. mci->dev_name = pci_name(pdev);
  808. mci->ctl_page_to_phys = NULL;
  809. mci->edac_check = i5100_check_error;
  810. mci->set_sdram_scrub_rate = i5100_set_scrub_rate;
  811. mci->get_sdram_scrub_rate = i5100_get_scrub_rate;
  812. i5100_init_csrows(mci);
  813. /* this strange construction seems to be in every driver, dunno why */
  814. switch (edac_op_state) {
  815. case EDAC_OPSTATE_POLL:
  816. case EDAC_OPSTATE_NMI:
  817. break;
  818. default:
  819. edac_op_state = EDAC_OPSTATE_POLL;
  820. break;
  821. }
  822. if (edac_mc_add_mc(mci)) {
  823. ret = -ENODEV;
  824. goto bail_scrub;
  825. }
  826. return ret;
  827. bail_scrub:
  828. priv->scrub_enable = 0;
  829. cancel_delayed_work_sync(&(priv->i5100_scrubbing));
  830. edac_mc_free(mci);
  831. bail_disable_ch1:
  832. pci_disable_device(ch1mm);
  833. bail_ch1:
  834. pci_dev_put(ch1mm);
  835. bail_disable_ch0:
  836. pci_disable_device(ch0mm);
  837. bail_ch0:
  838. pci_dev_put(ch0mm);
  839. bail_pdev:
  840. pci_disable_device(pdev);
  841. bail:
  842. return ret;
  843. }
  844. static void __devexit i5100_remove_one(struct pci_dev *pdev)
  845. {
  846. struct mem_ctl_info *mci;
  847. struct i5100_priv *priv;
  848. mci = edac_mc_del_mc(&pdev->dev);
  849. if (!mci)
  850. return;
  851. priv = mci->pvt_info;
  852. priv->scrub_enable = 0;
  853. cancel_delayed_work_sync(&(priv->i5100_scrubbing));
  854. pci_disable_device(pdev);
  855. pci_disable_device(priv->ch0mm);
  856. pci_disable_device(priv->ch1mm);
  857. pci_dev_put(priv->ch0mm);
  858. pci_dev_put(priv->ch1mm);
  859. edac_mc_free(mci);
  860. }
  861. static DEFINE_PCI_DEVICE_TABLE(i5100_pci_tbl) = {
  862. /* Device 16, Function 0, Channel 0 Memory Map, Error Flag/Mask, ... */
  863. { PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_5100_16) },
  864. { 0, }
  865. };
  866. MODULE_DEVICE_TABLE(pci, i5100_pci_tbl);
  867. static struct pci_driver i5100_driver = {
  868. .name = KBUILD_BASENAME,
  869. .probe = i5100_init_one,
  870. .remove = __devexit_p(i5100_remove_one),
  871. .id_table = i5100_pci_tbl,
  872. };
  873. static int __init i5100_init(void)
  874. {
  875. int pci_rc;
  876. pci_rc = pci_register_driver(&i5100_driver);
  877. return (pci_rc < 0) ? pci_rc : 0;
  878. }
  879. static void __exit i5100_exit(void)
  880. {
  881. pci_unregister_driver(&i5100_driver);
  882. }
  883. module_init(i5100_init);
  884. module_exit(i5100_exit);
  885. MODULE_LICENSE("GPL");
  886. MODULE_AUTHOR
  887. ("Arthur Jones <ajones@riverbed.com>");
  888. MODULE_DESCRIPTION("MC Driver for Intel I5100 memory controllers");