i10nm_base.c 32 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Driver for Intel(R) 10nm server memory controller.
  4. * Copyright (c) 2019, Intel Corporation.
  5. *
  6. */
  7. #include <linux/kernel.h>
  8. #include <linux/io.h>
  9. #include <asm/cpu_device_id.h>
  10. #include <asm/intel-family.h>
  11. #include <asm/mce.h>
  12. #include "edac_module.h"
  13. #include "skx_common.h"
  14. #define I10NM_REVISION "v0.0.6"
  15. #define EDAC_MOD_STR "i10nm_edac"
  16. /* Debug macros */
  17. #define i10nm_printk(level, fmt, arg...) \
  18. edac_printk(level, "i10nm", fmt, ##arg)
  19. #define I10NM_GET_SCK_BAR(d, reg) \
  20. pci_read_config_dword((d)->uracu, 0xd0, &(reg))
  21. #define I10NM_GET_IMC_BAR(d, i, reg) \
  22. pci_read_config_dword((d)->uracu, \
  23. (res_cfg->type == GNR ? 0xd4 : 0xd8) + (i) * 4, &(reg))
  24. #define I10NM_GET_SAD(d, offset, i, reg)\
  25. pci_read_config_dword((d)->sad_all, (offset) + (i) * \
  26. (res_cfg->type == GNR ? 12 : 8), &(reg))
  27. #define I10NM_GET_HBM_IMC_BAR(d, reg) \
  28. pci_read_config_dword((d)->uracu, 0xd4, &(reg))
  29. #define I10NM_GET_CAPID3_CFG(d, reg) \
  30. pci_read_config_dword((d)->pcu_cr3, \
  31. res_cfg->type == GNR ? 0x290 : 0x90, &(reg))
  32. #define I10NM_GET_CAPID5_CFG(d, reg) \
  33. pci_read_config_dword((d)->pcu_cr3, \
  34. res_cfg->type == GNR ? 0x298 : 0x98, &(reg))
  35. #define I10NM_GET_DIMMMTR(m, i, j) \
  36. readl((m)->mbase + ((m)->hbm_mc ? 0x80c : \
  37. (res_cfg->type == GNR ? 0xc0c : 0x2080c)) + \
  38. (i) * (m)->chan_mmio_sz + (j) * 4)
  39. #define I10NM_GET_MCDDRTCFG(m, i) \
  40. readl((m)->mbase + ((m)->hbm_mc ? 0x970 : 0x20970) + \
  41. (i) * (m)->chan_mmio_sz)
  42. #define I10NM_GET_MCMTR(m, i) \
  43. readl((m)->mbase + ((m)->hbm_mc ? 0xef8 : \
  44. (res_cfg->type == GNR ? 0xaf8 : 0x20ef8)) + \
  45. (i) * (m)->chan_mmio_sz)
  46. #define I10NM_GET_REG32(m, i, offset) \
  47. readl((m)->mbase + (i) * (m)->chan_mmio_sz + (offset))
  48. #define I10NM_GET_REG64(m, i, offset) \
  49. readq((m)->mbase + (i) * (m)->chan_mmio_sz + (offset))
  50. #define I10NM_SET_REG32(m, i, offset, v) \
  51. writel(v, (m)->mbase + (i) * (m)->chan_mmio_sz + (offset))
  52. #define I10NM_GET_SCK_MMIO_BASE(reg) (GET_BITFIELD(reg, 0, 28) << 23)
  53. #define I10NM_GET_IMC_MMIO_OFFSET(reg) (GET_BITFIELD(reg, 0, 10) << 12)
  54. #define I10NM_GET_IMC_MMIO_SIZE(reg) ((GET_BITFIELD(reg, 13, 23) - \
  55. GET_BITFIELD(reg, 0, 10) + 1) << 12)
  56. #define I10NM_GET_HBM_IMC_MMIO_OFFSET(reg) \
  57. ((GET_BITFIELD(reg, 0, 10) << 12) + 0x140000)
  58. #define I10NM_GNR_IMC_MMIO_OFFSET 0x24c000
  59. #define I10NM_GNR_D_IMC_MMIO_OFFSET 0x206000
  60. #define I10NM_GNR_IMC_MMIO_SIZE 0x4000
  61. #define I10NM_HBM_IMC_MMIO_SIZE 0x9000
  62. #define I10NM_DDR_IMC_CH_CNT(reg) GET_BITFIELD(reg, 21, 24)
  63. #define I10NM_IS_HBM_PRESENT(reg) GET_BITFIELD(reg, 27, 30)
  64. #define I10NM_IS_HBM_IMC(reg) GET_BITFIELD(reg, 29, 29)
  65. #define I10NM_MAX_SAD 16
  66. #define I10NM_SAD_ENABLE(reg) GET_BITFIELD(reg, 0, 0)
  67. #define I10NM_SAD_NM_CACHEABLE(reg) GET_BITFIELD(reg, 5, 5)
  68. static struct list_head *i10nm_edac_list;
  69. static struct res_config *res_cfg;
  70. static int retry_rd_err_log;
  71. static int decoding_via_mca;
  72. static bool mem_cfg_2lm;
  73. static struct reg_rrl icx_reg_rrl_ddr = {
  74. .set_num = 2,
  75. .reg_num = 6,
  76. .modes = {LRE_SCRUB, LRE_DEMAND},
  77. .offsets = {
  78. {0x22c60, 0x22c54, 0x22c5c, 0x22c58, 0x22c28, 0x20ed8},
  79. {0x22e54, 0x22e60, 0x22e64, 0x22e58, 0x22e5c, 0x20ee0},
  80. },
  81. .widths = {4, 4, 4, 4, 4, 8},
  82. .v_mask = BIT(0),
  83. .uc_mask = BIT(1),
  84. .over_mask = BIT(2),
  85. .en_patspr_mask = BIT(13),
  86. .noover_mask = BIT(14),
  87. .en_mask = BIT(15),
  88. .cecnt_num = 4,
  89. .cecnt_offsets = {0x22c18, 0x22c1c, 0x22c20, 0x22c24},
  90. .cecnt_widths = {4, 4, 4, 4},
  91. };
  92. static struct reg_rrl spr_reg_rrl_ddr = {
  93. .set_num = 3,
  94. .reg_num = 6,
  95. .modes = {LRE_SCRUB, LRE_DEMAND, FRE_DEMAND},
  96. .offsets = {
  97. {0x22c60, 0x22c54, 0x22f08, 0x22c58, 0x22c28, 0x20ed8},
  98. {0x22e54, 0x22e60, 0x22f10, 0x22e58, 0x22e5c, 0x20ee0},
  99. {0x22c70, 0x22d80, 0x22f18, 0x22d58, 0x22c64, 0x20f10},
  100. },
  101. .widths = {4, 4, 8, 4, 4, 8},
  102. .v_mask = BIT(0),
  103. .uc_mask = BIT(1),
  104. .over_mask = BIT(2),
  105. .en_patspr_mask = BIT(13),
  106. .noover_mask = BIT(14),
  107. .en_mask = BIT(15),
  108. .cecnt_num = 4,
  109. .cecnt_offsets = {0x22c18, 0x22c1c, 0x22c20, 0x22c24},
  110. .cecnt_widths = {4, 4, 4, 4},
  111. };
  112. static struct reg_rrl spr_reg_rrl_hbm_pch0 = {
  113. .set_num = 2,
  114. .reg_num = 6,
  115. .modes = {LRE_SCRUB, LRE_DEMAND},
  116. .offsets = {
  117. {0x2860, 0x2854, 0x2b08, 0x2858, 0x2828, 0x0ed8},
  118. {0x2a54, 0x2a60, 0x2b10, 0x2a58, 0x2a5c, 0x0ee0},
  119. },
  120. .widths = {4, 4, 8, 4, 4, 8},
  121. .v_mask = BIT(0),
  122. .uc_mask = BIT(1),
  123. .over_mask = BIT(2),
  124. .en_patspr_mask = BIT(13),
  125. .noover_mask = BIT(14),
  126. .en_mask = BIT(15),
  127. .cecnt_num = 4,
  128. .cecnt_offsets = {0x2818, 0x281c, 0x2820, 0x2824},
  129. .cecnt_widths = {4, 4, 4, 4},
  130. };
  131. static struct reg_rrl spr_reg_rrl_hbm_pch1 = {
  132. .set_num = 2,
  133. .reg_num = 6,
  134. .modes = {LRE_SCRUB, LRE_DEMAND},
  135. .offsets = {
  136. {0x2c60, 0x2c54, 0x2f08, 0x2c58, 0x2c28, 0x0fa8},
  137. {0x2e54, 0x2e60, 0x2f10, 0x2e58, 0x2e5c, 0x0fb0},
  138. },
  139. .widths = {4, 4, 8, 4, 4, 8},
  140. .v_mask = BIT(0),
  141. .uc_mask = BIT(1),
  142. .over_mask = BIT(2),
  143. .en_patspr_mask = BIT(13),
  144. .noover_mask = BIT(14),
  145. .en_mask = BIT(15),
  146. .cecnt_num = 4,
  147. .cecnt_offsets = {0x2c18, 0x2c1c, 0x2c20, 0x2c24},
  148. .cecnt_widths = {4, 4, 4, 4},
  149. };
  150. static struct reg_rrl gnr_reg_rrl_ddr = {
  151. .set_num = 4,
  152. .reg_num = 6,
  153. .modes = {FRE_SCRUB, FRE_DEMAND, LRE_SCRUB, LRE_DEMAND},
  154. .offsets = {
  155. {0x2f10, 0x2f20, 0x2f30, 0x2f50, 0x2f60, 0xba0},
  156. {0x2f14, 0x2f24, 0x2f38, 0x2f54, 0x2f64, 0xba8},
  157. {0x2f18, 0x2f28, 0x2f40, 0x2f58, 0x2f68, 0xbb0},
  158. {0x2f1c, 0x2f2c, 0x2f48, 0x2f5c, 0x2f6c, 0xbb8},
  159. },
  160. .widths = {4, 4, 8, 4, 4, 8},
  161. .v_mask = BIT(0),
  162. .uc_mask = BIT(1),
  163. .over_mask = BIT(2),
  164. .en_patspr_mask = BIT(14),
  165. .noover_mask = BIT(15),
  166. .en_mask = BIT(12),
  167. .cecnt_num = 8,
  168. .cecnt_offsets = {0x2c10, 0x2c14, 0x2c18, 0x2c1c, 0x2c20, 0x2c24, 0x2c28, 0x2c2c},
  169. .cecnt_widths = {4, 4, 4, 4, 4, 4, 4, 4},
  170. };
  171. static u64 read_imc_reg(struct skx_imc *imc, int chan, u32 offset, u8 width)
  172. {
  173. switch (width) {
  174. case 4:
  175. return I10NM_GET_REG32(imc, chan, offset);
  176. case 8:
  177. return I10NM_GET_REG64(imc, chan, offset);
  178. default:
  179. i10nm_printk(KERN_ERR, "Invalid readd RRL 0x%x width %d\n", offset, width);
  180. return 0;
  181. }
  182. }
  183. static void write_imc_reg(struct skx_imc *imc, int chan, u32 offset, u8 width, u64 val)
  184. {
  185. switch (width) {
  186. case 4:
  187. return I10NM_SET_REG32(imc, chan, offset, (u32)val);
  188. default:
  189. i10nm_printk(KERN_ERR, "Invalid write RRL 0x%x width %d\n", offset, width);
  190. }
  191. }
  192. static void enable_rrl(struct skx_imc *imc, int chan, struct reg_rrl *rrl,
  193. int rrl_set, bool enable, u32 *rrl_ctl)
  194. {
  195. enum rrl_mode mode = rrl->modes[rrl_set];
  196. u32 offset = rrl->offsets[rrl_set][0], v;
  197. u8 width = rrl->widths[0];
  198. bool first, scrub;
  199. /* First or last read error. */
  200. first = (mode == FRE_SCRUB || mode == FRE_DEMAND);
  201. /* Patrol scrub or on-demand read error. */
  202. scrub = (mode == FRE_SCRUB || mode == LRE_SCRUB);
  203. v = read_imc_reg(imc, chan, offset, width);
  204. if (enable) {
  205. /* Save default configurations. */
  206. *rrl_ctl = v;
  207. v &= ~rrl->uc_mask;
  208. if (first)
  209. v |= rrl->noover_mask;
  210. else
  211. v &= ~rrl->noover_mask;
  212. if (scrub)
  213. v |= rrl->en_patspr_mask;
  214. else
  215. v &= ~rrl->en_patspr_mask;
  216. v |= rrl->en_mask;
  217. } else {
  218. /* Restore default configurations. */
  219. if (*rrl_ctl & rrl->uc_mask)
  220. v |= rrl->uc_mask;
  221. if (first) {
  222. if (!(*rrl_ctl & rrl->noover_mask))
  223. v &= ~rrl->noover_mask;
  224. } else {
  225. if (*rrl_ctl & rrl->noover_mask)
  226. v |= rrl->noover_mask;
  227. }
  228. if (scrub) {
  229. if (!(*rrl_ctl & rrl->en_patspr_mask))
  230. v &= ~rrl->en_patspr_mask;
  231. } else {
  232. if (*rrl_ctl & rrl->en_patspr_mask)
  233. v |= rrl->en_patspr_mask;
  234. }
  235. if (!(*rrl_ctl & rrl->en_mask))
  236. v &= ~rrl->en_mask;
  237. }
  238. write_imc_reg(imc, chan, offset, width, v);
  239. }
  240. static void enable_rrls(struct skx_imc *imc, int chan, struct reg_rrl *rrl,
  241. bool enable, u32 *rrl_ctl)
  242. {
  243. for (int i = 0; i < rrl->set_num; i++)
  244. enable_rrl(imc, chan, rrl, i, enable, rrl_ctl + i);
  245. }
  246. static void enable_rrls_ddr(struct skx_imc *imc, bool enable)
  247. {
  248. struct reg_rrl *rrl_ddr = res_cfg->reg_rrl_ddr;
  249. int i, chan_num = res_cfg->ddr_chan_num;
  250. struct skx_channel *chan = imc->chan;
  251. if (!imc->mbase)
  252. return;
  253. for (i = 0; i < chan_num; i++)
  254. enable_rrls(imc, i, rrl_ddr, enable, chan[i].rrl_ctl[0]);
  255. }
  256. static void enable_rrls_hbm(struct skx_imc *imc, bool enable)
  257. {
  258. struct reg_rrl **rrl_hbm = res_cfg->reg_rrl_hbm;
  259. int i, chan_num = res_cfg->hbm_chan_num;
  260. struct skx_channel *chan = imc->chan;
  261. if (!imc->mbase || !imc->hbm_mc || !rrl_hbm[0] || !rrl_hbm[1])
  262. return;
  263. for (i = 0; i < chan_num; i++) {
  264. enable_rrls(imc, i, rrl_hbm[0], enable, chan[i].rrl_ctl[0]);
  265. enable_rrls(imc, i, rrl_hbm[1], enable, chan[i].rrl_ctl[1]);
  266. }
  267. }
  268. static void enable_retry_rd_err_log(bool enable)
  269. {
  270. struct skx_dev *d;
  271. int i, imc_num;
  272. edac_dbg(2, "\n");
  273. list_for_each_entry(d, i10nm_edac_list, list) {
  274. imc_num = res_cfg->ddr_imc_num;
  275. for (i = 0; i < imc_num; i++)
  276. enable_rrls_ddr(&d->imc[i], enable);
  277. imc_num += res_cfg->hbm_imc_num;
  278. for (; i < imc_num; i++)
  279. enable_rrls_hbm(&d->imc[i], enable);
  280. }
  281. }
  282. static void show_retry_rd_err_log(struct decoded_addr *res, char *msg,
  283. int len, bool scrub_err)
  284. {
  285. int i, j, n, ch = res->channel, pch = res->cs & 1;
  286. struct skx_imc *imc = &res->dev->imc[res->imc];
  287. u64 log, corr, status_mask;
  288. struct reg_rrl *rrl;
  289. bool scrub;
  290. u32 offset;
  291. u8 width;
  292. if (!imc->mbase)
  293. return;
  294. rrl = imc->hbm_mc ? res_cfg->reg_rrl_hbm[pch] : res_cfg->reg_rrl_ddr;
  295. if (!rrl)
  296. return;
  297. status_mask = rrl->over_mask | rrl->uc_mask | rrl->v_mask;
  298. n = scnprintf(msg, len, " retry_rd_err_log[");
  299. for (i = 0; i < rrl->set_num; i++) {
  300. scrub = (rrl->modes[i] == FRE_SCRUB || rrl->modes[i] == LRE_SCRUB);
  301. if (scrub_err != scrub)
  302. continue;
  303. for (j = 0; j < rrl->reg_num && len - n > 0; j++) {
  304. offset = rrl->offsets[i][j];
  305. width = rrl->widths[j];
  306. log = read_imc_reg(imc, ch, offset, width);
  307. if (width == 4)
  308. n += scnprintf(msg + n, len - n, "%.8llx ", log);
  309. else
  310. n += scnprintf(msg + n, len - n, "%.16llx ", log);
  311. /* Clear RRL status if RRL in Linux control mode. */
  312. if (retry_rd_err_log == 2 && !j && (log & status_mask))
  313. write_imc_reg(imc, ch, offset, width, log & ~status_mask);
  314. }
  315. }
  316. /* Move back one space. */
  317. n--;
  318. n += scnprintf(msg + n, len - n, "]");
  319. if (len - n > 0) {
  320. n += scnprintf(msg + n, len - n, " correrrcnt[");
  321. for (i = 0; i < rrl->cecnt_num && len - n > 0; i++) {
  322. offset = rrl->cecnt_offsets[i];
  323. width = rrl->cecnt_widths[i];
  324. corr = read_imc_reg(imc, ch, offset, width);
  325. /* CPUs {ICX,SPR} encode two counters per 4-byte CORRERRCNT register. */
  326. if (res_cfg->type <= SPR) {
  327. n += scnprintf(msg + n, len - n, "%.4llx %.4llx ",
  328. corr & 0xffff, corr >> 16);
  329. } else {
  330. /* CPUs {GNR} encode one counter per CORRERRCNT register. */
  331. if (width == 4)
  332. n += scnprintf(msg + n, len - n, "%.8llx ", corr);
  333. else
  334. n += scnprintf(msg + n, len - n, "%.16llx ", corr);
  335. }
  336. }
  337. /* Move back one space. */
  338. n--;
  339. n += scnprintf(msg + n, len - n, "]");
  340. }
  341. }
  342. static struct pci_dev *pci_get_dev_wrapper(int dom, unsigned int bus,
  343. unsigned int dev, unsigned int fun)
  344. {
  345. struct pci_dev *pdev;
  346. pdev = pci_get_domain_bus_and_slot(dom, bus, PCI_DEVFN(dev, fun));
  347. if (!pdev) {
  348. edac_dbg(2, "No device %02x:%02x.%x\n",
  349. bus, dev, fun);
  350. return NULL;
  351. }
  352. if (unlikely(pci_enable_device(pdev) < 0)) {
  353. edac_dbg(2, "Failed to enable device %02x:%02x.%x\n",
  354. bus, dev, fun);
  355. pci_dev_put(pdev);
  356. return NULL;
  357. }
  358. return pdev;
  359. }
  360. /**
  361. * i10nm_get_imc_num() - Get the number of present DDR memory controllers.
  362. *
  363. * @cfg : The pointer to the structure of EDAC resource configurations.
  364. *
  365. * For Granite Rapids CPUs, the number of present DDR memory controllers read
  366. * at runtime overwrites the value statically configured in @cfg->ddr_imc_num.
  367. * For other CPUs, the number of present DDR memory controllers is statically
  368. * configured in @cfg->ddr_imc_num.
  369. *
  370. * RETURNS : 0 on success, < 0 on failure.
  371. */
  372. static int i10nm_get_imc_num(struct res_config *cfg)
  373. {
  374. int n, imc_num, chan_num = 0;
  375. struct skx_dev *d;
  376. u32 reg;
  377. list_for_each_entry(d, i10nm_edac_list, list) {
  378. d->pcu_cr3 = pci_get_dev_wrapper(d->seg, d->bus[res_cfg->pcu_cr3_bdf.bus],
  379. res_cfg->pcu_cr3_bdf.dev,
  380. res_cfg->pcu_cr3_bdf.fun);
  381. if (!d->pcu_cr3)
  382. continue;
  383. if (I10NM_GET_CAPID5_CFG(d, reg))
  384. continue;
  385. n = I10NM_DDR_IMC_CH_CNT(reg);
  386. if (!chan_num) {
  387. chan_num = n;
  388. edac_dbg(2, "Get DDR CH number: %d\n", chan_num);
  389. } else if (chan_num != n) {
  390. i10nm_printk(KERN_NOTICE, "Get DDR CH numbers: %d, %d\n", chan_num, n);
  391. }
  392. }
  393. switch (cfg->type) {
  394. case GNR:
  395. /*
  396. * One channel per DDR memory controller for Granite Rapids CPUs.
  397. */
  398. imc_num = chan_num;
  399. if (!imc_num) {
  400. i10nm_printk(KERN_ERR, "Invalid DDR MC number\n");
  401. return -ENODEV;
  402. }
  403. if (cfg->ddr_imc_num != imc_num) {
  404. /*
  405. * Update the configuration data to reflect the number of
  406. * present DDR memory controllers.
  407. */
  408. cfg->ddr_imc_num = imc_num;
  409. edac_dbg(2, "Set DDR MC number: %d", imc_num);
  410. /* Release and reallocate skx_dev list with the updated number. */
  411. skx_remove();
  412. if (skx_get_all_bus_mappings(cfg, &i10nm_edac_list) <= 0)
  413. return -ENODEV;
  414. }
  415. return 0;
  416. default:
  417. /*
  418. * For other CPUs, the number of present DDR memory controllers
  419. * is statically pre-configured in cfg->ddr_imc_num.
  420. */
  421. return 0;
  422. }
  423. }
  424. static bool i10nm_check_2lm(struct res_config *cfg)
  425. {
  426. struct skx_dev *d;
  427. u32 reg;
  428. int i;
  429. list_for_each_entry(d, i10nm_edac_list, list) {
  430. d->sad_all = pci_get_dev_wrapper(d->seg, d->bus[res_cfg->sad_all_bdf.bus],
  431. res_cfg->sad_all_bdf.dev,
  432. res_cfg->sad_all_bdf.fun);
  433. if (!d->sad_all)
  434. continue;
  435. for (i = 0; i < I10NM_MAX_SAD; i++) {
  436. I10NM_GET_SAD(d, cfg->sad_all_offset, i, reg);
  437. if (I10NM_SAD_ENABLE(reg) && I10NM_SAD_NM_CACHEABLE(reg)) {
  438. edac_dbg(2, "2-level memory configuration.\n");
  439. return true;
  440. }
  441. }
  442. }
  443. return false;
  444. }
  445. /*
  446. * Check whether the error comes from DDRT by ICX/Tremont/SPR model specific error code.
  447. * Refer to SDM vol3B 17.11.3/17.13.2 Intel IMC MC error codes for IA32_MCi_STATUS.
  448. */
  449. static bool i10nm_mscod_is_ddrt(u32 mscod)
  450. {
  451. switch (res_cfg->type) {
  452. case I10NM:
  453. switch (mscod) {
  454. case 0x0106: case 0x0107:
  455. case 0x0800: case 0x0804:
  456. case 0x0806 ... 0x0808:
  457. case 0x080a ... 0x080e:
  458. case 0x0810: case 0x0811:
  459. case 0x0816: case 0x081e:
  460. case 0x081f:
  461. return true;
  462. }
  463. break;
  464. case SPR:
  465. switch (mscod) {
  466. case 0x0800: case 0x0804:
  467. case 0x0806 ... 0x0808:
  468. case 0x080a ... 0x080e:
  469. case 0x0810: case 0x0811:
  470. case 0x0816: case 0x081e:
  471. case 0x081f:
  472. return true;
  473. }
  474. break;
  475. default:
  476. return false;
  477. }
  478. return false;
  479. }
  480. static bool i10nm_mc_decode_available(struct mce *mce)
  481. {
  482. #define ICX_IMCx_CHy 0x06666000
  483. u8 bank;
  484. if (!decoding_via_mca || mem_cfg_2lm)
  485. return false;
  486. if ((mce->status & (MCI_STATUS_MISCV | MCI_STATUS_ADDRV))
  487. != (MCI_STATUS_MISCV | MCI_STATUS_ADDRV))
  488. return false;
  489. bank = mce->bank;
  490. switch (res_cfg->type) {
  491. case I10NM:
  492. /* Check whether the bank is one of {13,14,17,18,21,22,25,26} */
  493. if (!(ICX_IMCx_CHy & (1 << bank)))
  494. return false;
  495. break;
  496. case SPR:
  497. if (bank < 13 || bank > 20)
  498. return false;
  499. break;
  500. default:
  501. return false;
  502. }
  503. /* DDRT errors can't be decoded from MCA bank registers */
  504. if (MCI_MISC_ECC_MODE(mce->misc) == MCI_MISC_ECC_DDRT)
  505. return false;
  506. if (i10nm_mscod_is_ddrt(MCI_STATUS_MSCOD(mce->status)))
  507. return false;
  508. return true;
  509. }
  510. static bool i10nm_mc_decode(struct decoded_addr *res)
  511. {
  512. struct mce *m = res->mce;
  513. struct skx_dev *d;
  514. u8 bank;
  515. if (!i10nm_mc_decode_available(m))
  516. return false;
  517. list_for_each_entry(d, i10nm_edac_list, list) {
  518. if (d->imc[0].src_id == m->socketid) {
  519. res->socket = m->socketid;
  520. res->dev = d;
  521. break;
  522. }
  523. }
  524. switch (res_cfg->type) {
  525. case I10NM:
  526. bank = m->bank - 13;
  527. res->imc = bank / 4;
  528. res->channel = bank % 2;
  529. res->column = GET_BITFIELD(m->misc, 9, 18) << 2;
  530. res->row = GET_BITFIELD(m->misc, 19, 39);
  531. res->bank_group = GET_BITFIELD(m->misc, 40, 41);
  532. res->bank_address = GET_BITFIELD(m->misc, 42, 43);
  533. res->bank_group |= GET_BITFIELD(m->misc, 44, 44) << 2;
  534. res->rank = GET_BITFIELD(m->misc, 56, 58);
  535. res->dimm = res->rank >> 2;
  536. res->rank = res->rank % 4;
  537. break;
  538. case SPR:
  539. bank = m->bank - 13;
  540. res->imc = bank / 2;
  541. res->channel = bank % 2;
  542. res->column = GET_BITFIELD(m->misc, 9, 18) << 2;
  543. res->row = GET_BITFIELD(m->misc, 19, 36);
  544. res->bank_group = GET_BITFIELD(m->misc, 37, 38);
  545. res->bank_address = GET_BITFIELD(m->misc, 39, 40);
  546. res->bank_group |= GET_BITFIELD(m->misc, 41, 41) << 2;
  547. res->rank = GET_BITFIELD(m->misc, 57, 57);
  548. res->dimm = GET_BITFIELD(m->misc, 58, 58);
  549. break;
  550. default:
  551. return false;
  552. }
  553. if (!res->dev) {
  554. skx_printk(KERN_ERR, "No device for src_id %d imc %d\n",
  555. m->socketid, res->imc);
  556. return false;
  557. }
  558. return true;
  559. }
  560. /**
  561. * get_gnr_mdev() - Get the PCI device of the @logical_idx-th DDR memory controller.
  562. *
  563. * @d : The pointer to the structure of CPU socket EDAC device.
  564. * @logical_idx : The logical index of the present memory controller (0 ~ max present MC# - 1).
  565. * @physical_idx : To store the corresponding physical index of @logical_idx.
  566. *
  567. * RETURNS : The PCI device of the @logical_idx-th DDR memory controller, NULL on failure.
  568. */
  569. static struct pci_dev *get_gnr_mdev(struct skx_dev *d, int logical_idx, int *physical_idx)
  570. {
  571. #define GNR_MAX_IMC_PCI_CNT 28
  572. struct pci_dev *mdev;
  573. int i, logical = 0;
  574. /*
  575. * Detect present memory controllers from { PCI device: 8-5, function 7-1 }
  576. */
  577. for (i = 0; i < GNR_MAX_IMC_PCI_CNT; i++) {
  578. mdev = pci_get_dev_wrapper(d->seg,
  579. d->bus[res_cfg->ddr_mdev_bdf.bus],
  580. res_cfg->ddr_mdev_bdf.dev + i / 7,
  581. res_cfg->ddr_mdev_bdf.fun + i % 7);
  582. if (mdev) {
  583. if (logical == logical_idx) {
  584. *physical_idx = i;
  585. return mdev;
  586. }
  587. pci_dev_put(mdev);
  588. logical++;
  589. }
  590. }
  591. return NULL;
  592. }
  593. static u32 get_gnr_imc_mmio_offset(void)
  594. {
  595. if (boot_cpu_data.x86_vfm == INTEL_GRANITERAPIDS_D)
  596. return I10NM_GNR_D_IMC_MMIO_OFFSET;
  597. return I10NM_GNR_IMC_MMIO_OFFSET;
  598. }
  599. /**
  600. * get_ddr_munit() - Get the resource of the i-th DDR memory controller.
  601. *
  602. * @d : The pointer to the structure of CPU socket EDAC device.
  603. * @i : The index of the CPU socket relative DDR memory controller.
  604. * @offset : To store the MMIO offset of the i-th DDR memory controller.
  605. * @size : To store the MMIO size of the i-th DDR memory controller.
  606. *
  607. * RETURNS : The PCI device of the i-th DDR memory controller, NULL on failure.
  608. */
  609. static struct pci_dev *get_ddr_munit(struct skx_dev *d, int i, u32 *offset, unsigned long *size)
  610. {
  611. struct pci_dev *mdev;
  612. int physical_idx;
  613. u32 reg;
  614. switch (res_cfg->type) {
  615. case GNR:
  616. if (I10NM_GET_IMC_BAR(d, 0, reg)) {
  617. i10nm_printk(KERN_ERR, "Failed to get mc0 bar\n");
  618. return NULL;
  619. }
  620. mdev = get_gnr_mdev(d, i, &physical_idx);
  621. if (!mdev)
  622. return NULL;
  623. *offset = I10NM_GET_IMC_MMIO_OFFSET(reg) +
  624. get_gnr_imc_mmio_offset() +
  625. physical_idx * I10NM_GNR_IMC_MMIO_SIZE;
  626. *size = I10NM_GNR_IMC_MMIO_SIZE;
  627. break;
  628. default:
  629. if (I10NM_GET_IMC_BAR(d, i, reg)) {
  630. i10nm_printk(KERN_ERR, "Failed to get mc%d bar\n", i);
  631. return NULL;
  632. }
  633. mdev = pci_get_dev_wrapper(d->seg,
  634. d->bus[res_cfg->ddr_mdev_bdf.bus],
  635. res_cfg->ddr_mdev_bdf.dev + i,
  636. res_cfg->ddr_mdev_bdf.fun);
  637. if (!mdev)
  638. return NULL;
  639. *offset = I10NM_GET_IMC_MMIO_OFFSET(reg);
  640. *size = I10NM_GET_IMC_MMIO_SIZE(reg);
  641. }
  642. return mdev;
  643. }
  644. /**
  645. * i10nm_imc_absent() - Check whether the memory controller @imc is absent
  646. *
  647. * @imc : The pointer to the structure of memory controller EDAC device.
  648. *
  649. * RETURNS : true if the memory controller EDAC device is absent, false otherwise.
  650. */
  651. static bool i10nm_imc_absent(struct skx_imc *imc)
  652. {
  653. u32 mcmtr;
  654. int i;
  655. switch (res_cfg->type) {
  656. case SPR:
  657. for (i = 0; i < res_cfg->ddr_chan_num; i++) {
  658. mcmtr = I10NM_GET_MCMTR(imc, i);
  659. edac_dbg(1, "ch%d mcmtr reg %x\n", i, mcmtr);
  660. if (mcmtr != ~0)
  661. return false;
  662. }
  663. /*
  664. * Some workstations' absent memory controllers still
  665. * appear as PCIe devices, misleading the EDAC driver.
  666. * By observing that the MMIO registers of these absent
  667. * memory controllers consistently hold the value of ~0.
  668. *
  669. * We identify a memory controller as absent by checking
  670. * if its MMIO register "mcmtr" == ~0 in all its channels.
  671. */
  672. return true;
  673. default:
  674. return false;
  675. }
  676. }
  677. static int i10nm_get_ddr_munits(void)
  678. {
  679. struct pci_dev *mdev;
  680. void __iomem *mbase;
  681. unsigned long size;
  682. struct skx_dev *d;
  683. int i, lmc, j = 0;
  684. u32 reg, off;
  685. u64 base;
  686. list_for_each_entry(d, i10nm_edac_list, list) {
  687. d->util_all = pci_get_dev_wrapper(d->seg, d->bus[res_cfg->util_all_bdf.bus],
  688. res_cfg->util_all_bdf.dev,
  689. res_cfg->util_all_bdf.fun);
  690. if (!d->util_all)
  691. return -ENODEV;
  692. d->uracu = pci_get_dev_wrapper(d->seg, d->bus[res_cfg->uracu_bdf.bus],
  693. res_cfg->uracu_bdf.dev,
  694. res_cfg->uracu_bdf.fun);
  695. if (!d->uracu)
  696. return -ENODEV;
  697. if (I10NM_GET_SCK_BAR(d, reg)) {
  698. i10nm_printk(KERN_ERR, "Failed to socket bar\n");
  699. return -ENODEV;
  700. }
  701. base = I10NM_GET_SCK_MMIO_BASE(reg);
  702. edac_dbg(2, "socket%d mmio base 0x%llx (reg 0x%x)\n",
  703. j++, base, reg);
  704. for (lmc = 0, i = 0; i < res_cfg->ddr_imc_num; i++) {
  705. mdev = get_ddr_munit(d, i, &off, &size);
  706. if (i == 0 && !mdev) {
  707. i10nm_printk(KERN_ERR, "No IMC found\n");
  708. return -ENODEV;
  709. }
  710. if (!mdev)
  711. continue;
  712. edac_dbg(2, "mc%d mmio base 0x%llx size 0x%lx (reg 0x%x)\n",
  713. i, base + off, size, reg);
  714. mbase = ioremap(base + off, size);
  715. if (!mbase) {
  716. i10nm_printk(KERN_ERR, "Failed to ioremap 0x%llx\n",
  717. base + off);
  718. return -ENODEV;
  719. }
  720. d->imc[lmc].mbase = mbase;
  721. if (i10nm_imc_absent(&d->imc[lmc])) {
  722. pci_dev_put(mdev);
  723. iounmap(mbase);
  724. d->imc[lmc].mbase = NULL;
  725. edac_dbg(2, "Skip absent mc%d\n", i);
  726. continue;
  727. } else {
  728. d->imc[lmc].mdev = mdev;
  729. if (res_cfg->type == SPR)
  730. skx_set_mc_mapping(d, i, lmc);
  731. lmc++;
  732. }
  733. }
  734. }
  735. return 0;
  736. }
  737. static bool i10nm_check_hbm_imc(struct skx_dev *d)
  738. {
  739. u32 reg;
  740. if (I10NM_GET_CAPID3_CFG(d, reg)) {
  741. i10nm_printk(KERN_ERR, "Failed to get capid3_cfg\n");
  742. return false;
  743. }
  744. return I10NM_IS_HBM_PRESENT(reg) != 0;
  745. }
  746. static int i10nm_get_hbm_munits(void)
  747. {
  748. struct pci_dev *mdev;
  749. void __iomem *mbase;
  750. u32 reg, off, mcmtr;
  751. struct skx_dev *d;
  752. int i, lmc;
  753. u64 base;
  754. list_for_each_entry(d, i10nm_edac_list, list) {
  755. if (!d->pcu_cr3)
  756. return -ENODEV;
  757. if (!i10nm_check_hbm_imc(d)) {
  758. i10nm_printk(KERN_DEBUG, "No hbm memory\n");
  759. return -ENODEV;
  760. }
  761. if (I10NM_GET_SCK_BAR(d, reg)) {
  762. i10nm_printk(KERN_ERR, "Failed to get socket bar\n");
  763. return -ENODEV;
  764. }
  765. base = I10NM_GET_SCK_MMIO_BASE(reg);
  766. if (I10NM_GET_HBM_IMC_BAR(d, reg)) {
  767. i10nm_printk(KERN_ERR, "Failed to get hbm mc bar\n");
  768. return -ENODEV;
  769. }
  770. base += I10NM_GET_HBM_IMC_MMIO_OFFSET(reg);
  771. lmc = res_cfg->ddr_imc_num;
  772. for (i = 0; i < res_cfg->hbm_imc_num; i++) {
  773. mdev = pci_get_dev_wrapper(d->seg, d->bus[res_cfg->hbm_mdev_bdf.bus],
  774. res_cfg->hbm_mdev_bdf.dev + i / 4,
  775. res_cfg->hbm_mdev_bdf.fun + i % 4);
  776. if (i == 0 && !mdev) {
  777. i10nm_printk(KERN_ERR, "No hbm mc found\n");
  778. return -ENODEV;
  779. }
  780. if (!mdev)
  781. continue;
  782. d->imc[lmc].mdev = mdev;
  783. off = i * I10NM_HBM_IMC_MMIO_SIZE;
  784. edac_dbg(2, "hbm mc%d mmio base 0x%llx size 0x%x\n",
  785. lmc, base + off, I10NM_HBM_IMC_MMIO_SIZE);
  786. mbase = ioremap(base + off, I10NM_HBM_IMC_MMIO_SIZE);
  787. if (!mbase) {
  788. pci_dev_put(d->imc[lmc].mdev);
  789. d->imc[lmc].mdev = NULL;
  790. i10nm_printk(KERN_ERR, "Failed to ioremap for hbm mc 0x%llx\n",
  791. base + off);
  792. return -ENOMEM;
  793. }
  794. d->imc[lmc].mbase = mbase;
  795. d->imc[lmc].hbm_mc = true;
  796. mcmtr = I10NM_GET_MCMTR(&d->imc[lmc], 0);
  797. if (!I10NM_IS_HBM_IMC(mcmtr)) {
  798. iounmap(d->imc[lmc].mbase);
  799. d->imc[lmc].mbase = NULL;
  800. d->imc[lmc].hbm_mc = false;
  801. pci_dev_put(d->imc[lmc].mdev);
  802. d->imc[lmc].mdev = NULL;
  803. i10nm_printk(KERN_ERR, "This isn't an hbm mc!\n");
  804. return -ENODEV;
  805. }
  806. lmc++;
  807. }
  808. }
  809. return 0;
  810. }
  811. static struct res_config i10nm_cfg0 = {
  812. .type = I10NM,
  813. .decs_did = 0x3452,
  814. .busno_cfg_offset = 0xcc,
  815. .ddr_imc_num = 4,
  816. .ddr_chan_num = 2,
  817. .ddr_dimm_num = 2,
  818. .ddr_chan_mmio_sz = 0x4000,
  819. .sad_all_bdf = {1, 29, 0},
  820. .pcu_cr3_bdf = {1, 30, 3},
  821. .util_all_bdf = {1, 29, 1},
  822. .uracu_bdf = {0, 0, 1},
  823. .ddr_mdev_bdf = {0, 12, 0},
  824. .hbm_mdev_bdf = {0, 12, 1},
  825. .sad_all_offset = 0x108,
  826. .reg_rrl_ddr = &icx_reg_rrl_ddr,
  827. };
  828. static struct res_config i10nm_cfg1 = {
  829. .type = I10NM,
  830. .decs_did = 0x3452,
  831. .busno_cfg_offset = 0xd0,
  832. .ddr_imc_num = 4,
  833. .ddr_chan_num = 2,
  834. .ddr_dimm_num = 2,
  835. .ddr_chan_mmio_sz = 0x4000,
  836. .sad_all_bdf = {1, 29, 0},
  837. .pcu_cr3_bdf = {1, 30, 3},
  838. .util_all_bdf = {1, 29, 1},
  839. .uracu_bdf = {0, 0, 1},
  840. .ddr_mdev_bdf = {0, 12, 0},
  841. .hbm_mdev_bdf = {0, 12, 1},
  842. .sad_all_offset = 0x108,
  843. .reg_rrl_ddr = &icx_reg_rrl_ddr,
  844. };
  845. static struct res_config spr_cfg = {
  846. .type = SPR,
  847. .decs_did = 0x3252,
  848. .busno_cfg_offset = 0xd0,
  849. .ddr_imc_num = 4,
  850. .ddr_chan_num = 2,
  851. .ddr_dimm_num = 2,
  852. .hbm_imc_num = 16,
  853. .hbm_chan_num = 2,
  854. .hbm_dimm_num = 1,
  855. .ddr_chan_mmio_sz = 0x8000,
  856. .hbm_chan_mmio_sz = 0x4000,
  857. .support_ddr5 = true,
  858. .sad_all_bdf = {1, 10, 0},
  859. .pcu_cr3_bdf = {1, 30, 3},
  860. .util_all_bdf = {1, 29, 1},
  861. .uracu_bdf = {0, 0, 1},
  862. .ddr_mdev_bdf = {0, 12, 0},
  863. .hbm_mdev_bdf = {0, 12, 1},
  864. .sad_all_offset = 0x300,
  865. .reg_rrl_ddr = &spr_reg_rrl_ddr,
  866. .reg_rrl_hbm[0] = &spr_reg_rrl_hbm_pch0,
  867. .reg_rrl_hbm[1] = &spr_reg_rrl_hbm_pch1,
  868. };
  869. static struct res_config gnr_cfg = {
  870. .type = GNR,
  871. .decs_did = 0x3252,
  872. .busno_cfg_offset = 0xd0,
  873. .ddr_imc_num = 12,
  874. .ddr_chan_num = 1,
  875. .ddr_dimm_num = 2,
  876. .ddr_chan_mmio_sz = 0x4000,
  877. .support_ddr5 = true,
  878. .sad_all_bdf = {0, 13, 0},
  879. .pcu_cr3_bdf = {0, 5, 0},
  880. .util_all_bdf = {0, 13, 1},
  881. .uracu_bdf = {0, 0, 1},
  882. .ddr_mdev_bdf = {0, 5, 1},
  883. .sad_all_offset = 0x300,
  884. .reg_rrl_ddr = &gnr_reg_rrl_ddr,
  885. };
  886. static const struct x86_cpu_id i10nm_cpuids[] = {
  887. X86_MATCH_VFM_STEPS(INTEL_ATOM_TREMONT_D, X86_STEP_MIN, 0x3, &i10nm_cfg0),
  888. X86_MATCH_VFM_STEPS(INTEL_ATOM_TREMONT_D, 0x4, X86_STEP_MAX, &i10nm_cfg1),
  889. X86_MATCH_VFM_STEPS(INTEL_ICELAKE_X, X86_STEP_MIN, 0x3, &i10nm_cfg0),
  890. X86_MATCH_VFM_STEPS(INTEL_ICELAKE_X, 0x4, X86_STEP_MAX, &i10nm_cfg1),
  891. X86_MATCH_VFM( INTEL_ICELAKE_D, &i10nm_cfg1),
  892. X86_MATCH_VFM(INTEL_SAPPHIRERAPIDS_X, &spr_cfg),
  893. X86_MATCH_VFM(INTEL_EMERALDRAPIDS_X, &spr_cfg),
  894. X86_MATCH_VFM(INTEL_GRANITERAPIDS_X, &gnr_cfg),
  895. X86_MATCH_VFM(INTEL_GRANITERAPIDS_D, &gnr_cfg),
  896. X86_MATCH_VFM(INTEL_ATOM_CRESTMONT_X, &gnr_cfg),
  897. X86_MATCH_VFM(INTEL_ATOM_CRESTMONT, &gnr_cfg),
  898. X86_MATCH_VFM(INTEL_ATOM_DARKMONT_X, &gnr_cfg),
  899. {}
  900. };
  901. MODULE_DEVICE_TABLE(x86cpu, i10nm_cpuids);
  902. static bool i10nm_check_ecc(struct skx_imc *imc, int chan)
  903. {
  904. u32 mcmtr;
  905. mcmtr = I10NM_GET_MCMTR(imc, chan);
  906. edac_dbg(1, "ch%d mcmtr reg %x\n", chan, mcmtr);
  907. return !!GET_BITFIELD(mcmtr, 2, 2);
  908. }
  909. static bool i10nm_channel_disabled(struct skx_imc *imc, int chan)
  910. {
  911. u32 mcmtr = I10NM_GET_MCMTR(imc, chan);
  912. edac_dbg(1, "mc%d ch%d mcmtr reg %x\n", imc->mc, chan, mcmtr);
  913. return (mcmtr == ~0 || GET_BITFIELD(mcmtr, 18, 18));
  914. }
  915. static int i10nm_get_dimm_config(struct mem_ctl_info *mci,
  916. struct res_config *cfg)
  917. {
  918. struct skx_pvt *pvt = mci->pvt_info;
  919. struct skx_imc *imc = pvt->imc;
  920. u32 mtr, mcddrtcfg = 0;
  921. struct dimm_info *dimm;
  922. int i, j, ndimms;
  923. for (i = 0; i < imc->num_channels; i++) {
  924. if (!imc->mbase)
  925. continue;
  926. if (i10nm_channel_disabled(imc, i)) {
  927. edac_dbg(1, "mc%d ch%d is disabled.\n", imc->mc, i);
  928. continue;
  929. }
  930. ndimms = 0;
  931. if (res_cfg->type != GNR)
  932. mcddrtcfg = I10NM_GET_MCDDRTCFG(imc, i);
  933. for (j = 0; j < imc->num_dimms; j++) {
  934. dimm = edac_get_dimm(mci, i, j, 0);
  935. mtr = I10NM_GET_DIMMMTR(imc, i, j);
  936. edac_dbg(1, "dimmmtr 0x%x mcddrtcfg 0x%x (mc%d ch%d dimm%d)\n",
  937. mtr, mcddrtcfg, imc->mc, i, j);
  938. if (IS_DIMM_PRESENT(mtr))
  939. ndimms += skx_get_dimm_info(mtr, 0, 0, dimm,
  940. imc, i, j, cfg);
  941. else if (IS_NVDIMM_PRESENT(mcddrtcfg, j))
  942. ndimms += skx_get_nvdimm_info(dimm, imc, i, j,
  943. EDAC_MOD_STR);
  944. }
  945. if (ndimms && !i10nm_check_ecc(imc, i)) {
  946. i10nm_printk(KERN_ERR, "ECC is disabled on imc %d channel %d\n",
  947. imc->mc, i);
  948. return -ENODEV;
  949. }
  950. }
  951. return 0;
  952. }
  953. static struct notifier_block i10nm_mce_dec = {
  954. .notifier_call = skx_mce_check_error,
  955. .priority = MCE_PRIO_EDAC,
  956. };
  957. static int __init i10nm_init(void)
  958. {
  959. u8 mc = 0, src_id = 0;
  960. const struct x86_cpu_id *id;
  961. struct res_config *cfg;
  962. const char *owner;
  963. struct skx_dev *d;
  964. int rc, i, off[3] = {0xd0, 0xc8, 0xcc};
  965. u64 tolm, tohm;
  966. int imc_num;
  967. edac_dbg(2, "\n");
  968. if (ghes_get_devices())
  969. return -EBUSY;
  970. owner = edac_get_owner();
  971. if (owner && strncmp(owner, EDAC_MOD_STR, sizeof(EDAC_MOD_STR)))
  972. return -EBUSY;
  973. if (cpu_feature_enabled(X86_FEATURE_HYPERVISOR))
  974. return -ENODEV;
  975. id = x86_match_cpu(i10nm_cpuids);
  976. if (!id)
  977. return -ENODEV;
  978. cfg = (struct res_config *)id->driver_data;
  979. skx_set_res_cfg(cfg);
  980. res_cfg = cfg;
  981. rc = skx_get_hi_lo(0x09a2, off, &tolm, &tohm);
  982. if (rc)
  983. return rc;
  984. rc = skx_get_all_bus_mappings(cfg, &i10nm_edac_list);
  985. if (rc < 0)
  986. goto fail;
  987. if (rc == 0) {
  988. i10nm_printk(KERN_ERR, "No memory controllers found\n");
  989. return -ENODEV;
  990. }
  991. rc = i10nm_get_imc_num(cfg);
  992. if (rc < 0)
  993. goto fail;
  994. mem_cfg_2lm = i10nm_check_2lm(cfg);
  995. skx_set_mem_cfg(mem_cfg_2lm);
  996. rc = i10nm_get_ddr_munits();
  997. if (i10nm_get_hbm_munits() && rc)
  998. goto fail;
  999. imc_num = res_cfg->ddr_imc_num + res_cfg->hbm_imc_num;
  1000. list_for_each_entry(d, i10nm_edac_list, list) {
  1001. rc = skx_get_src_id(d, 0xf8, &src_id);
  1002. if (rc < 0)
  1003. goto fail;
  1004. edac_dbg(2, "src_id = %d\n", src_id);
  1005. for (i = 0; i < imc_num; i++) {
  1006. if (!d->imc[i].mdev)
  1007. continue;
  1008. d->imc[i].mc = mc++;
  1009. d->imc[i].lmc = i;
  1010. d->imc[i].src_id = src_id;
  1011. if (d->imc[i].hbm_mc) {
  1012. d->imc[i].chan_mmio_sz = cfg->hbm_chan_mmio_sz;
  1013. d->imc[i].num_channels = cfg->hbm_chan_num;
  1014. d->imc[i].num_dimms = cfg->hbm_dimm_num;
  1015. } else {
  1016. d->imc[i].chan_mmio_sz = cfg->ddr_chan_mmio_sz;
  1017. d->imc[i].num_channels = cfg->ddr_chan_num;
  1018. d->imc[i].num_dimms = cfg->ddr_dimm_num;
  1019. }
  1020. rc = skx_register_mci(&d->imc[i], &d->imc[i].mdev->dev,
  1021. pci_name(d->imc[i].mdev),
  1022. "Intel_10nm Socket", EDAC_MOD_STR,
  1023. i10nm_get_dimm_config, cfg);
  1024. if (rc < 0)
  1025. goto fail;
  1026. }
  1027. }
  1028. rc = skx_adxl_get();
  1029. if (rc)
  1030. goto fail;
  1031. opstate_init();
  1032. mce_register_decode_chain(&i10nm_mce_dec);
  1033. skx_setup_debug("i10nm_test");
  1034. if (retry_rd_err_log && res_cfg->reg_rrl_ddr) {
  1035. skx_set_decode(i10nm_mc_decode, show_retry_rd_err_log);
  1036. if (retry_rd_err_log == 2)
  1037. enable_retry_rd_err_log(true);
  1038. } else {
  1039. skx_set_decode(i10nm_mc_decode, NULL);
  1040. }
  1041. i10nm_printk(KERN_INFO, "%s\n", I10NM_REVISION);
  1042. return 0;
  1043. fail:
  1044. skx_remove();
  1045. return rc;
  1046. }
  1047. static void __exit i10nm_exit(void)
  1048. {
  1049. edac_dbg(2, "\n");
  1050. if (retry_rd_err_log && res_cfg->reg_rrl_ddr) {
  1051. skx_set_decode(NULL, NULL);
  1052. if (retry_rd_err_log == 2)
  1053. enable_retry_rd_err_log(false);
  1054. }
  1055. skx_teardown_debug();
  1056. mce_unregister_decode_chain(&i10nm_mce_dec);
  1057. skx_adxl_put();
  1058. skx_remove();
  1059. }
  1060. module_init(i10nm_init);
  1061. module_exit(i10nm_exit);
  1062. static int set_decoding_via_mca(const char *buf, const struct kernel_param *kp)
  1063. {
  1064. unsigned long val;
  1065. int ret;
  1066. ret = kstrtoul(buf, 0, &val);
  1067. if (ret || val > 1)
  1068. return -EINVAL;
  1069. if (val && mem_cfg_2lm) {
  1070. i10nm_printk(KERN_NOTICE, "Decoding errors via MCA banks for 2LM isn't supported yet\n");
  1071. return -EIO;
  1072. }
  1073. ret = param_set_int(buf, kp);
  1074. return ret;
  1075. }
  1076. static const struct kernel_param_ops decoding_via_mca_param_ops = {
  1077. .set = set_decoding_via_mca,
  1078. .get = param_get_int,
  1079. };
  1080. module_param_cb(decoding_via_mca, &decoding_via_mca_param_ops, &decoding_via_mca, 0644);
  1081. MODULE_PARM_DESC(decoding_via_mca, "decoding_via_mca: 0=off(default), 1=enable");
  1082. module_param(retry_rd_err_log, int, 0444);
  1083. MODULE_PARM_DESC(retry_rd_err_log, "retry_rd_err_log: 0=off(default), 1=bios(Linux doesn't reset any control bits, but just reports values.), 2=linux(Linux tries to take control and resets mode bits, clear valid/UC bits after reading.)");
  1084. MODULE_LICENSE("GPL v2");
  1085. MODULE_DESCRIPTION("MC Driver for Intel 10nm server processors");