qcom_edac.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Copyright (c) 2018, The Linux Foundation. All rights reserved.
  4. */
  5. #include <linux/edac.h>
  6. #include <linux/interrupt.h>
  7. #include <linux/kernel.h>
  8. #include <linux/of.h>
  9. #include <linux/platform_device.h>
  10. #include <linux/regmap.h>
  11. #include <linux/soc/qcom/llcc-qcom.h>
  12. #include "edac_mc.h"
  13. #include "edac_device.h"
  14. #define EDAC_LLCC "qcom_llcc"
  15. #define LLCC_ERP_PANIC_ON_UE 1
  16. #define TRP_SYN_REG_CNT 6
  17. #define DRP_SYN_REG_CNT 8
  18. #define LLCC_LB_CNT_MASK GENMASK(31, 28)
  19. #define LLCC_LB_CNT_SHIFT 28
  20. /* Mask and shift macros */
  21. #define ECC_DB_ERR_COUNT_MASK GENMASK(4, 0)
  22. #define ECC_DB_ERR_WAYS_MASK GENMASK(31, 16)
  23. #define ECC_DB_ERR_WAYS_SHIFT BIT(4)
  24. #define ECC_SB_ERR_COUNT_MASK GENMASK(23, 16)
  25. #define ECC_SB_ERR_COUNT_SHIFT BIT(4)
  26. #define ECC_SB_ERR_WAYS_MASK GENMASK(15, 0)
  27. #define SB_ECC_ERROR BIT(0)
  28. #define DB_ECC_ERROR BIT(1)
  29. #define DRP_TRP_INT_CLEAR GENMASK(1, 0)
  30. #define DRP_TRP_CNT_CLEAR GENMASK(1, 0)
  31. #define SB_ERROR_THRESHOLD 0x1
  32. #define SB_ERROR_THRESHOLD_SHIFT 24
  33. #define SB_DB_TRP_INTERRUPT_ENABLE 0x3
  34. #define TRP0_INTERRUPT_ENABLE 0x1
  35. #define DRP0_INTERRUPT_ENABLE BIT(6)
  36. #define SB_DB_DRP_INTERRUPT_ENABLE 0x3
  37. #define ECC_POLL_MSEC 5000
  38. enum {
  39. LLCC_DRAM_CE = 0,
  40. LLCC_DRAM_UE,
  41. LLCC_TRAM_CE,
  42. LLCC_TRAM_UE,
  43. };
  44. static const struct llcc_edac_reg_data edac_reg_data[] = {
  45. [LLCC_DRAM_CE] = {
  46. .name = "DRAM Single-bit",
  47. .reg_cnt = DRP_SYN_REG_CNT,
  48. .count_mask = ECC_SB_ERR_COUNT_MASK,
  49. .ways_mask = ECC_SB_ERR_WAYS_MASK,
  50. .count_shift = ECC_SB_ERR_COUNT_SHIFT,
  51. },
  52. [LLCC_DRAM_UE] = {
  53. .name = "DRAM Double-bit",
  54. .reg_cnt = DRP_SYN_REG_CNT,
  55. .count_mask = ECC_DB_ERR_COUNT_MASK,
  56. .ways_mask = ECC_DB_ERR_WAYS_MASK,
  57. .ways_shift = ECC_DB_ERR_WAYS_SHIFT,
  58. },
  59. [LLCC_TRAM_CE] = {
  60. .name = "TRAM Single-bit",
  61. .reg_cnt = TRP_SYN_REG_CNT,
  62. .count_mask = ECC_SB_ERR_COUNT_MASK,
  63. .ways_mask = ECC_SB_ERR_WAYS_MASK,
  64. .count_shift = ECC_SB_ERR_COUNT_SHIFT,
  65. },
  66. [LLCC_TRAM_UE] = {
  67. .name = "TRAM Double-bit",
  68. .reg_cnt = TRP_SYN_REG_CNT,
  69. .count_mask = ECC_DB_ERR_COUNT_MASK,
  70. .ways_mask = ECC_DB_ERR_WAYS_MASK,
  71. .ways_shift = ECC_DB_ERR_WAYS_SHIFT,
  72. },
  73. };
  74. static int qcom_llcc_core_setup(struct llcc_drv_data *drv, struct regmap *llcc_bcast_regmap)
  75. {
  76. u32 sb_err_threshold;
  77. int ret;
  78. /*
  79. * Configure interrupt enable registers such that Tag, Data RAM related
  80. * interrupts are propagated to interrupt controller for servicing
  81. */
  82. ret = regmap_update_bits(llcc_bcast_regmap, drv->edac_reg_offset->cmn_interrupt_0_enable,
  83. TRP0_INTERRUPT_ENABLE,
  84. TRP0_INTERRUPT_ENABLE);
  85. if (ret)
  86. return ret;
  87. ret = regmap_update_bits(llcc_bcast_regmap, drv->edac_reg_offset->trp_interrupt_0_enable,
  88. SB_DB_TRP_INTERRUPT_ENABLE,
  89. SB_DB_TRP_INTERRUPT_ENABLE);
  90. if (ret)
  91. return ret;
  92. sb_err_threshold = (SB_ERROR_THRESHOLD << SB_ERROR_THRESHOLD_SHIFT);
  93. ret = regmap_write(llcc_bcast_regmap, drv->edac_reg_offset->drp_ecc_error_cfg,
  94. sb_err_threshold);
  95. if (ret)
  96. return ret;
  97. ret = regmap_update_bits(llcc_bcast_regmap, drv->edac_reg_offset->cmn_interrupt_0_enable,
  98. DRP0_INTERRUPT_ENABLE,
  99. DRP0_INTERRUPT_ENABLE);
  100. if (ret)
  101. return ret;
  102. ret = regmap_write(llcc_bcast_regmap, drv->edac_reg_offset->drp_interrupt_enable,
  103. SB_DB_DRP_INTERRUPT_ENABLE);
  104. return ret;
  105. }
  106. /* Clear the error interrupt and counter registers */
  107. static int
  108. qcom_llcc_clear_error_status(int err_type, struct llcc_drv_data *drv)
  109. {
  110. int ret;
  111. switch (err_type) {
  112. case LLCC_DRAM_CE:
  113. case LLCC_DRAM_UE:
  114. ret = regmap_write(drv->bcast_regmap,
  115. drv->edac_reg_offset->drp_interrupt_clear,
  116. DRP_TRP_INT_CLEAR);
  117. if (ret)
  118. return ret;
  119. ret = regmap_write(drv->bcast_regmap,
  120. drv->edac_reg_offset->drp_ecc_error_cntr_clear,
  121. DRP_TRP_CNT_CLEAR);
  122. if (ret)
  123. return ret;
  124. break;
  125. case LLCC_TRAM_CE:
  126. case LLCC_TRAM_UE:
  127. ret = regmap_write(drv->bcast_regmap,
  128. drv->edac_reg_offset->trp_interrupt_0_clear,
  129. DRP_TRP_INT_CLEAR);
  130. if (ret)
  131. return ret;
  132. ret = regmap_write(drv->bcast_regmap,
  133. drv->edac_reg_offset->trp_ecc_error_cntr_clear,
  134. DRP_TRP_CNT_CLEAR);
  135. if (ret)
  136. return ret;
  137. break;
  138. default:
  139. ret = -EINVAL;
  140. edac_printk(KERN_CRIT, EDAC_LLCC, "Unexpected error type: %d\n",
  141. err_type);
  142. }
  143. return ret;
  144. }
  145. struct qcom_llcc_syn_regs {
  146. u32 synd_reg;
  147. u32 count_status_reg;
  148. u32 ways_status_reg;
  149. };
  150. static void get_reg_offsets(struct llcc_drv_data *drv, int err_type,
  151. struct qcom_llcc_syn_regs *syn_regs)
  152. {
  153. const struct llcc_edac_reg_offset *edac_reg_offset = drv->edac_reg_offset;
  154. switch (err_type) {
  155. case LLCC_DRAM_CE:
  156. syn_regs->synd_reg = edac_reg_offset->drp_ecc_sb_err_syn0;
  157. syn_regs->count_status_reg = edac_reg_offset->drp_ecc_error_status1;
  158. syn_regs->ways_status_reg = edac_reg_offset->drp_ecc_error_status0;
  159. break;
  160. case LLCC_DRAM_UE:
  161. syn_regs->synd_reg = edac_reg_offset->drp_ecc_db_err_syn0;
  162. syn_regs->count_status_reg = edac_reg_offset->drp_ecc_error_status1;
  163. syn_regs->ways_status_reg = edac_reg_offset->drp_ecc_error_status0;
  164. break;
  165. case LLCC_TRAM_CE:
  166. syn_regs->synd_reg = edac_reg_offset->trp_ecc_sb_err_syn0;
  167. syn_regs->count_status_reg = edac_reg_offset->trp_ecc_error_status1;
  168. syn_regs->ways_status_reg = edac_reg_offset->trp_ecc_error_status0;
  169. break;
  170. case LLCC_TRAM_UE:
  171. syn_regs->synd_reg = edac_reg_offset->trp_ecc_db_err_syn0;
  172. syn_regs->count_status_reg = edac_reg_offset->trp_ecc_error_status1;
  173. syn_regs->ways_status_reg = edac_reg_offset->trp_ecc_error_status0;
  174. break;
  175. }
  176. }
  177. /* Dump Syndrome registers data for Tag RAM, Data RAM bit errors*/
  178. static int
  179. dump_syn_reg_values(struct llcc_drv_data *drv, u32 bank, int err_type)
  180. {
  181. struct llcc_edac_reg_data reg_data = edac_reg_data[err_type];
  182. struct qcom_llcc_syn_regs regs = { };
  183. int err_cnt, err_ways, ret, i;
  184. u32 synd_reg, synd_val;
  185. get_reg_offsets(drv, err_type, &regs);
  186. for (i = 0; i < reg_data.reg_cnt; i++) {
  187. synd_reg = regs.synd_reg + (i * 4);
  188. ret = regmap_read(drv->regmaps[bank], synd_reg,
  189. &synd_val);
  190. if (ret)
  191. goto clear;
  192. edac_printk(KERN_CRIT, EDAC_LLCC, "%s: ECC_SYN%d: 0x%8x\n",
  193. reg_data.name, i, synd_val);
  194. }
  195. ret = regmap_read(drv->regmaps[bank], regs.count_status_reg,
  196. &err_cnt);
  197. if (ret)
  198. goto clear;
  199. err_cnt &= reg_data.count_mask;
  200. err_cnt >>= reg_data.count_shift;
  201. edac_printk(KERN_CRIT, EDAC_LLCC, "%s: Error count: 0x%4x\n",
  202. reg_data.name, err_cnt);
  203. ret = regmap_read(drv->regmaps[bank], regs.ways_status_reg,
  204. &err_ways);
  205. if (ret)
  206. goto clear;
  207. err_ways &= reg_data.ways_mask;
  208. err_ways >>= reg_data.ways_shift;
  209. edac_printk(KERN_CRIT, EDAC_LLCC, "%s: Error ways: 0x%4x\n",
  210. reg_data.name, err_ways);
  211. clear:
  212. return qcom_llcc_clear_error_status(err_type, drv);
  213. }
  214. static int
  215. dump_syn_reg(struct edac_device_ctl_info *edev_ctl, int err_type, u32 bank)
  216. {
  217. struct llcc_drv_data *drv = edev_ctl->dev->platform_data;
  218. int ret;
  219. ret = dump_syn_reg_values(drv, bank, err_type);
  220. if (ret)
  221. return ret;
  222. switch (err_type) {
  223. case LLCC_DRAM_CE:
  224. edac_device_handle_ce(edev_ctl, 0, bank,
  225. "LLCC Data RAM correctable Error");
  226. break;
  227. case LLCC_DRAM_UE:
  228. edac_device_handle_ue(edev_ctl, 0, bank,
  229. "LLCC Data RAM uncorrectable Error");
  230. break;
  231. case LLCC_TRAM_CE:
  232. edac_device_handle_ce(edev_ctl, 0, bank,
  233. "LLCC Tag RAM correctable Error");
  234. break;
  235. case LLCC_TRAM_UE:
  236. edac_device_handle_ue(edev_ctl, 0, bank,
  237. "LLCC Tag RAM uncorrectable Error");
  238. break;
  239. default:
  240. ret = -EINVAL;
  241. edac_printk(KERN_CRIT, EDAC_LLCC, "Unexpected error type: %d\n",
  242. err_type);
  243. }
  244. return ret;
  245. }
  246. static irqreturn_t llcc_ecc_irq_handler(int irq, void *edev_ctl)
  247. {
  248. struct edac_device_ctl_info *edac_dev_ctl = edev_ctl;
  249. struct llcc_drv_data *drv = edac_dev_ctl->dev->platform_data;
  250. irqreturn_t irq_rc = IRQ_NONE;
  251. u32 drp_error, trp_error, i;
  252. int ret;
  253. /* Iterate over the banks and look for Tag RAM or Data RAM errors */
  254. for (i = 0; i < drv->num_banks; i++) {
  255. ret = regmap_read(drv->regmaps[i], drv->edac_reg_offset->drp_interrupt_status,
  256. &drp_error);
  257. if (!ret && (drp_error & SB_ECC_ERROR)) {
  258. edac_printk(KERN_CRIT, EDAC_LLCC,
  259. "Single Bit Error detected in Data RAM\n");
  260. ret = dump_syn_reg(edev_ctl, LLCC_DRAM_CE, i);
  261. } else if (!ret && (drp_error & DB_ECC_ERROR)) {
  262. edac_printk(KERN_CRIT, EDAC_LLCC,
  263. "Double Bit Error detected in Data RAM\n");
  264. ret = dump_syn_reg(edev_ctl, LLCC_DRAM_UE, i);
  265. }
  266. if (!ret)
  267. irq_rc = IRQ_HANDLED;
  268. ret = regmap_read(drv->regmaps[i], drv->edac_reg_offset->trp_interrupt_0_status,
  269. &trp_error);
  270. if (!ret && (trp_error & SB_ECC_ERROR)) {
  271. edac_printk(KERN_CRIT, EDAC_LLCC,
  272. "Single Bit Error detected in Tag RAM\n");
  273. ret = dump_syn_reg(edev_ctl, LLCC_TRAM_CE, i);
  274. } else if (!ret && (trp_error & DB_ECC_ERROR)) {
  275. edac_printk(KERN_CRIT, EDAC_LLCC,
  276. "Double Bit Error detected in Tag RAM\n");
  277. ret = dump_syn_reg(edev_ctl, LLCC_TRAM_UE, i);
  278. }
  279. if (!ret)
  280. irq_rc = IRQ_HANDLED;
  281. }
  282. return irq_rc;
  283. }
  284. static void llcc_ecc_check(struct edac_device_ctl_info *edev_ctl)
  285. {
  286. llcc_ecc_irq_handler(0, edev_ctl);
  287. }
  288. static int qcom_llcc_edac_probe(struct platform_device *pdev)
  289. {
  290. struct llcc_drv_data *llcc_driv_data = pdev->dev.platform_data;
  291. struct edac_device_ctl_info *edev_ctl;
  292. struct device *dev = &pdev->dev;
  293. int ecc_irq;
  294. int rc;
  295. if (!llcc_driv_data->ecc_irq_configured) {
  296. rc = qcom_llcc_core_setup(llcc_driv_data, llcc_driv_data->bcast_regmap);
  297. if (rc)
  298. return rc;
  299. }
  300. /* Allocate edac control info */
  301. edev_ctl = edac_device_alloc_ctl_info(0, "qcom-llcc", 1, "bank",
  302. llcc_driv_data->num_banks, 1,
  303. edac_device_alloc_index());
  304. if (!edev_ctl)
  305. return -ENOMEM;
  306. edev_ctl->dev = dev;
  307. edev_ctl->mod_name = dev_name(dev);
  308. edev_ctl->dev_name = dev_name(dev);
  309. edev_ctl->ctl_name = "llcc";
  310. edev_ctl->panic_on_ue = LLCC_ERP_PANIC_ON_UE;
  311. /* Check if LLCC driver has passed ECC IRQ */
  312. ecc_irq = llcc_driv_data->ecc_irq;
  313. if (ecc_irq > 0) {
  314. /* Use interrupt mode if IRQ is available */
  315. rc = devm_request_irq(dev, ecc_irq, llcc_ecc_irq_handler,
  316. IRQF_TRIGGER_HIGH, "llcc_ecc", edev_ctl);
  317. if (!rc) {
  318. edac_op_state = EDAC_OPSTATE_INT;
  319. goto irq_done;
  320. }
  321. }
  322. /* Fall back to polling mode otherwise */
  323. edev_ctl->poll_msec = ECC_POLL_MSEC;
  324. edev_ctl->edac_check = llcc_ecc_check;
  325. edac_op_state = EDAC_OPSTATE_POLL;
  326. irq_done:
  327. rc = edac_device_add_device(edev_ctl);
  328. if (rc) {
  329. edac_device_free_ctl_info(edev_ctl);
  330. return rc;
  331. }
  332. platform_set_drvdata(pdev, edev_ctl);
  333. return rc;
  334. }
  335. static void qcom_llcc_edac_remove(struct platform_device *pdev)
  336. {
  337. struct edac_device_ctl_info *edev_ctl = dev_get_drvdata(&pdev->dev);
  338. edac_device_del_device(edev_ctl->dev);
  339. edac_device_free_ctl_info(edev_ctl);
  340. }
  341. static const struct platform_device_id qcom_llcc_edac_id_table[] = {
  342. { .name = "qcom_llcc_edac" },
  343. {}
  344. };
  345. MODULE_DEVICE_TABLE(platform, qcom_llcc_edac_id_table);
  346. static struct platform_driver qcom_llcc_edac_driver = {
  347. .probe = qcom_llcc_edac_probe,
  348. .remove = qcom_llcc_edac_remove,
  349. .driver = {
  350. .name = "qcom_llcc_edac",
  351. },
  352. .id_table = qcom_llcc_edac_id_table,
  353. };
  354. module_platform_driver(qcom_llcc_edac_driver);
  355. MODULE_DESCRIPTION("QCOM EDAC driver");
  356. MODULE_LICENSE("GPL v2");