altera_edac.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513
  1. /*
  2. * Copyright Altera Corporation (C) 2014-2015. All rights reserved.
  3. * Copyright 2011-2012 Calxeda, Inc.
  4. *
  5. * This program is free software; you can redistribute it and/or modify it
  6. * under the terms and conditions of the GNU General Public License,
  7. * version 2, as published by the Free Software Foundation.
  8. *
  9. * This program is distributed in the hope it will be useful, but WITHOUT
  10. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  12. * more details.
  13. *
  14. * You should have received a copy of the GNU General Public License along with
  15. * this program. If not, see <http://www.gnu.org/licenses/>.
  16. *
  17. * Adapted from the highbank_mc_edac driver.
  18. */
  19. #include <linux/ctype.h>
  20. #include <linux/edac.h>
  21. #include <linux/interrupt.h>
  22. #include <linux/kernel.h>
  23. #include <linux/mfd/syscon.h>
  24. #include <linux/of_platform.h>
  25. #include <linux/platform_device.h>
  26. #include <linux/regmap.h>
  27. #include <linux/types.h>
  28. #include <linux/uaccess.h>
  29. #include "altera_edac.h"
  30. #include "edac_core.h"
  31. #include "edac_module.h"
  32. #define EDAC_MOD_STR "altera_edac"
  33. #define EDAC_VERSION "1"
  34. static const struct altr_sdram_prv_data c5_data = {
  35. .ecc_ctrl_offset = CV_CTLCFG_OFST,
  36. .ecc_ctl_en_mask = CV_CTLCFG_ECC_AUTO_EN,
  37. .ecc_stat_offset = CV_DRAMSTS_OFST,
  38. .ecc_stat_ce_mask = CV_DRAMSTS_SBEERR,
  39. .ecc_stat_ue_mask = CV_DRAMSTS_DBEERR,
  40. .ecc_saddr_offset = CV_ERRADDR_OFST,
  41. .ecc_daddr_offset = CV_ERRADDR_OFST,
  42. .ecc_cecnt_offset = CV_SBECOUNT_OFST,
  43. .ecc_uecnt_offset = CV_DBECOUNT_OFST,
  44. .ecc_irq_en_offset = CV_DRAMINTR_OFST,
  45. .ecc_irq_en_mask = CV_DRAMINTR_INTREN,
  46. .ecc_irq_clr_offset = CV_DRAMINTR_OFST,
  47. .ecc_irq_clr_mask = (CV_DRAMINTR_INTRCLR | CV_DRAMINTR_INTREN),
  48. .ecc_cnt_rst_offset = CV_DRAMINTR_OFST,
  49. .ecc_cnt_rst_mask = CV_DRAMINTR_INTRCLR,
  50. #ifdef CONFIG_EDAC_DEBUG
  51. .ce_ue_trgr_offset = CV_CTLCFG_OFST,
  52. .ce_set_mask = CV_CTLCFG_GEN_SB_ERR,
  53. .ue_set_mask = CV_CTLCFG_GEN_DB_ERR,
  54. #endif
  55. };
  56. static const struct altr_sdram_prv_data a10_data = {
  57. .ecc_ctrl_offset = A10_ECCCTRL1_OFST,
  58. .ecc_ctl_en_mask = A10_ECCCTRL1_ECC_EN,
  59. .ecc_stat_offset = A10_INTSTAT_OFST,
  60. .ecc_stat_ce_mask = A10_INTSTAT_SBEERR,
  61. .ecc_stat_ue_mask = A10_INTSTAT_DBEERR,
  62. .ecc_saddr_offset = A10_SERRADDR_OFST,
  63. .ecc_daddr_offset = A10_DERRADDR_OFST,
  64. .ecc_irq_en_offset = A10_ERRINTEN_OFST,
  65. .ecc_irq_en_mask = A10_ECC_IRQ_EN_MASK,
  66. .ecc_irq_clr_offset = A10_INTSTAT_OFST,
  67. .ecc_irq_clr_mask = (A10_INTSTAT_SBEERR | A10_INTSTAT_DBEERR),
  68. .ecc_cnt_rst_offset = A10_ECCCTRL1_OFST,
  69. .ecc_cnt_rst_mask = A10_ECC_CNT_RESET_MASK,
  70. #ifdef CONFIG_EDAC_DEBUG
  71. .ce_ue_trgr_offset = A10_DIAGINTTEST_OFST,
  72. .ce_set_mask = A10_DIAGINT_TSERRA_MASK,
  73. .ue_set_mask = A10_DIAGINT_TDERRA_MASK,
  74. #endif
  75. };
  76. static irqreturn_t altr_sdram_mc_err_handler(int irq, void *dev_id)
  77. {
  78. struct mem_ctl_info *mci = dev_id;
  79. struct altr_sdram_mc_data *drvdata = mci->pvt_info;
  80. const struct altr_sdram_prv_data *priv = drvdata->data;
  81. u32 status, err_count = 1, err_addr;
  82. regmap_read(drvdata->mc_vbase, priv->ecc_stat_offset, &status);
  83. if (status & priv->ecc_stat_ue_mask) {
  84. regmap_read(drvdata->mc_vbase, priv->ecc_daddr_offset,
  85. &err_addr);
  86. if (priv->ecc_uecnt_offset)
  87. regmap_read(drvdata->mc_vbase, priv->ecc_uecnt_offset,
  88. &err_count);
  89. panic("\nEDAC: [%d Uncorrectable errors @ 0x%08X]\n",
  90. err_count, err_addr);
  91. }
  92. if (status & priv->ecc_stat_ce_mask) {
  93. regmap_read(drvdata->mc_vbase, priv->ecc_saddr_offset,
  94. &err_addr);
  95. if (priv->ecc_uecnt_offset)
  96. regmap_read(drvdata->mc_vbase, priv->ecc_cecnt_offset,
  97. &err_count);
  98. edac_mc_handle_error(HW_EVENT_ERR_CORRECTED, mci, err_count,
  99. err_addr >> PAGE_SHIFT,
  100. err_addr & ~PAGE_MASK, 0,
  101. 0, 0, -1, mci->ctl_name, "");
  102. /* Clear IRQ to resume */
  103. regmap_write(drvdata->mc_vbase, priv->ecc_irq_clr_offset,
  104. priv->ecc_irq_clr_mask);
  105. return IRQ_HANDLED;
  106. }
  107. return IRQ_NONE;
  108. }
  109. #ifdef CONFIG_EDAC_DEBUG
  110. static ssize_t altr_sdr_mc_err_inject_write(struct file *file,
  111. const char __user *data,
  112. size_t count, loff_t *ppos)
  113. {
  114. struct mem_ctl_info *mci = file->private_data;
  115. struct altr_sdram_mc_data *drvdata = mci->pvt_info;
  116. const struct altr_sdram_prv_data *priv = drvdata->data;
  117. u32 *ptemp;
  118. dma_addr_t dma_handle;
  119. u32 reg, read_reg;
  120. ptemp = dma_alloc_coherent(mci->pdev, 16, &dma_handle, GFP_KERNEL);
  121. if (!ptemp) {
  122. dma_free_coherent(mci->pdev, 16, ptemp, dma_handle);
  123. edac_printk(KERN_ERR, EDAC_MC,
  124. "Inject: Buffer Allocation error\n");
  125. return -ENOMEM;
  126. }
  127. regmap_read(drvdata->mc_vbase, priv->ce_ue_trgr_offset,
  128. &read_reg);
  129. read_reg &= ~(priv->ce_set_mask | priv->ue_set_mask);
  130. /* Error are injected by writing a word while the SBE or DBE
  131. * bit in the CTLCFG register is set. Reading the word will
  132. * trigger the SBE or DBE error and the corresponding IRQ.
  133. */
  134. if (count == 3) {
  135. edac_printk(KERN_ALERT, EDAC_MC,
  136. "Inject Double bit error\n");
  137. regmap_write(drvdata->mc_vbase, priv->ce_ue_trgr_offset,
  138. (read_reg | priv->ue_set_mask));
  139. } else {
  140. edac_printk(KERN_ALERT, EDAC_MC,
  141. "Inject Single bit error\n");
  142. regmap_write(drvdata->mc_vbase, priv->ce_ue_trgr_offset,
  143. (read_reg | priv->ce_set_mask));
  144. }
  145. ptemp[0] = 0x5A5A5A5A;
  146. ptemp[1] = 0xA5A5A5A5;
  147. /* Clear the error injection bits */
  148. regmap_write(drvdata->mc_vbase, priv->ce_ue_trgr_offset, read_reg);
  149. /* Ensure it has been written out */
  150. wmb();
  151. /*
  152. * To trigger the error, we need to read the data back
  153. * (the data was written with errors above).
  154. * The ACCESS_ONCE macros and printk are used to prevent the
  155. * the compiler optimizing these reads out.
  156. */
  157. reg = ACCESS_ONCE(ptemp[0]);
  158. read_reg = ACCESS_ONCE(ptemp[1]);
  159. /* Force Read */
  160. rmb();
  161. edac_printk(KERN_ALERT, EDAC_MC, "Read Data [0x%X, 0x%X]\n",
  162. reg, read_reg);
  163. dma_free_coherent(mci->pdev, 16, ptemp, dma_handle);
  164. return count;
  165. }
  166. static const struct file_operations altr_sdr_mc_debug_inject_fops = {
  167. .open = simple_open,
  168. .write = altr_sdr_mc_err_inject_write,
  169. .llseek = generic_file_llseek,
  170. };
  171. static void altr_sdr_mc_create_debugfs_nodes(struct mem_ctl_info *mci)
  172. {
  173. if (mci->debugfs)
  174. debugfs_create_file("inject_ctrl", S_IWUSR, mci->debugfs, mci,
  175. &altr_sdr_mc_debug_inject_fops);
  176. }
  177. #else
  178. static void altr_sdr_mc_create_debugfs_nodes(struct mem_ctl_info *mci)
  179. {}
  180. #endif
  181. /* Get total memory size from Open Firmware DTB */
  182. static unsigned long get_total_mem(void)
  183. {
  184. struct device_node *np = NULL;
  185. const unsigned int *reg, *reg_end;
  186. int len, sw, aw;
  187. unsigned long start, size, total_mem = 0;
  188. for_each_node_by_type(np, "memory") {
  189. aw = of_n_addr_cells(np);
  190. sw = of_n_size_cells(np);
  191. reg = (const unsigned int *)of_get_property(np, "reg", &len);
  192. reg_end = reg + (len / sizeof(u32));
  193. total_mem = 0;
  194. do {
  195. start = of_read_number(reg, aw);
  196. reg += aw;
  197. size = of_read_number(reg, sw);
  198. reg += sw;
  199. total_mem += size;
  200. } while (reg < reg_end);
  201. }
  202. edac_dbg(0, "total_mem 0x%lx\n", total_mem);
  203. return total_mem;
  204. }
  205. static const struct of_device_id altr_sdram_ctrl_of_match[] = {
  206. { .compatible = "altr,sdram-edac", .data = (void *)&c5_data},
  207. { .compatible = "altr,sdram-edac-a10", .data = (void *)&a10_data},
  208. {},
  209. };
  210. MODULE_DEVICE_TABLE(of, altr_sdram_ctrl_of_match);
  211. static int a10_init(struct regmap *mc_vbase)
  212. {
  213. if (regmap_update_bits(mc_vbase, A10_INTMODE_OFST,
  214. A10_INTMODE_SB_INT, A10_INTMODE_SB_INT)) {
  215. edac_printk(KERN_ERR, EDAC_MC,
  216. "Error setting SB IRQ mode\n");
  217. return -ENODEV;
  218. }
  219. if (regmap_write(mc_vbase, A10_SERRCNTREG_OFST, 1)) {
  220. edac_printk(KERN_ERR, EDAC_MC,
  221. "Error setting trigger count\n");
  222. return -ENODEV;
  223. }
  224. return 0;
  225. }
  226. static int a10_unmask_irq(struct platform_device *pdev, u32 mask)
  227. {
  228. void __iomem *sm_base;
  229. int ret = 0;
  230. if (!request_mem_region(A10_SYMAN_INTMASK_CLR, sizeof(u32),
  231. dev_name(&pdev->dev))) {
  232. edac_printk(KERN_ERR, EDAC_MC,
  233. "Unable to request mem region\n");
  234. return -EBUSY;
  235. }
  236. sm_base = ioremap(A10_SYMAN_INTMASK_CLR, sizeof(u32));
  237. if (!sm_base) {
  238. edac_printk(KERN_ERR, EDAC_MC,
  239. "Unable to ioremap device\n");
  240. ret = -ENOMEM;
  241. goto release;
  242. }
  243. iowrite32(mask, sm_base);
  244. iounmap(sm_base);
  245. release:
  246. release_mem_region(A10_SYMAN_INTMASK_CLR, sizeof(u32));
  247. return ret;
  248. }
  249. static int altr_sdram_probe(struct platform_device *pdev)
  250. {
  251. const struct of_device_id *id;
  252. struct edac_mc_layer layers[2];
  253. struct mem_ctl_info *mci;
  254. struct altr_sdram_mc_data *drvdata;
  255. const struct altr_sdram_prv_data *priv;
  256. struct regmap *mc_vbase;
  257. struct dimm_info *dimm;
  258. u32 read_reg;
  259. int irq, irq2, res = 0;
  260. unsigned long mem_size, irqflags = 0;
  261. id = of_match_device(altr_sdram_ctrl_of_match, &pdev->dev);
  262. if (!id)
  263. return -ENODEV;
  264. /* Grab the register range from the sdr controller in device tree */
  265. mc_vbase = syscon_regmap_lookup_by_phandle(pdev->dev.of_node,
  266. "altr,sdr-syscon");
  267. if (IS_ERR(mc_vbase)) {
  268. edac_printk(KERN_ERR, EDAC_MC,
  269. "regmap for altr,sdr-syscon lookup failed.\n");
  270. return -ENODEV;
  271. }
  272. /* Check specific dependencies for the module */
  273. priv = of_match_node(altr_sdram_ctrl_of_match,
  274. pdev->dev.of_node)->data;
  275. /* Validate the SDRAM controller has ECC enabled */
  276. if (regmap_read(mc_vbase, priv->ecc_ctrl_offset, &read_reg) ||
  277. ((read_reg & priv->ecc_ctl_en_mask) != priv->ecc_ctl_en_mask)) {
  278. edac_printk(KERN_ERR, EDAC_MC,
  279. "No ECC/ECC disabled [0x%08X]\n", read_reg);
  280. return -ENODEV;
  281. }
  282. /* Grab memory size from device tree. */
  283. mem_size = get_total_mem();
  284. if (!mem_size) {
  285. edac_printk(KERN_ERR, EDAC_MC, "Unable to calculate memory size\n");
  286. return -ENODEV;
  287. }
  288. /* Ensure the SDRAM Interrupt is disabled */
  289. if (regmap_update_bits(mc_vbase, priv->ecc_irq_en_offset,
  290. priv->ecc_irq_en_mask, 0)) {
  291. edac_printk(KERN_ERR, EDAC_MC,
  292. "Error disabling SDRAM ECC IRQ\n");
  293. return -ENODEV;
  294. }
  295. /* Toggle to clear the SDRAM Error count */
  296. if (regmap_update_bits(mc_vbase, priv->ecc_cnt_rst_offset,
  297. priv->ecc_cnt_rst_mask,
  298. priv->ecc_cnt_rst_mask)) {
  299. edac_printk(KERN_ERR, EDAC_MC,
  300. "Error clearing SDRAM ECC count\n");
  301. return -ENODEV;
  302. }
  303. if (regmap_update_bits(mc_vbase, priv->ecc_cnt_rst_offset,
  304. priv->ecc_cnt_rst_mask, 0)) {
  305. edac_printk(KERN_ERR, EDAC_MC,
  306. "Error clearing SDRAM ECC count\n");
  307. return -ENODEV;
  308. }
  309. irq = platform_get_irq(pdev, 0);
  310. if (irq < 0) {
  311. edac_printk(KERN_ERR, EDAC_MC,
  312. "No irq %d in DT\n", irq);
  313. return -ENODEV;
  314. }
  315. /* Arria10 has a 2nd IRQ */
  316. irq2 = platform_get_irq(pdev, 1);
  317. layers[0].type = EDAC_MC_LAYER_CHIP_SELECT;
  318. layers[0].size = 1;
  319. layers[0].is_virt_csrow = true;
  320. layers[1].type = EDAC_MC_LAYER_CHANNEL;
  321. layers[1].size = 1;
  322. layers[1].is_virt_csrow = false;
  323. mci = edac_mc_alloc(0, ARRAY_SIZE(layers), layers,
  324. sizeof(struct altr_sdram_mc_data));
  325. if (!mci)
  326. return -ENOMEM;
  327. mci->pdev = &pdev->dev;
  328. drvdata = mci->pvt_info;
  329. drvdata->mc_vbase = mc_vbase;
  330. drvdata->data = priv;
  331. platform_set_drvdata(pdev, mci);
  332. if (!devres_open_group(&pdev->dev, NULL, GFP_KERNEL)) {
  333. edac_printk(KERN_ERR, EDAC_MC,
  334. "Unable to get managed device resource\n");
  335. res = -ENOMEM;
  336. goto free;
  337. }
  338. mci->mtype_cap = MEM_FLAG_DDR3;
  339. mci->edac_ctl_cap = EDAC_FLAG_NONE | EDAC_FLAG_SECDED;
  340. mci->edac_cap = EDAC_FLAG_SECDED;
  341. mci->mod_name = EDAC_MOD_STR;
  342. mci->mod_ver = EDAC_VERSION;
  343. mci->ctl_name = dev_name(&pdev->dev);
  344. mci->scrub_mode = SCRUB_SW_SRC;
  345. mci->dev_name = dev_name(&pdev->dev);
  346. dimm = *mci->dimms;
  347. dimm->nr_pages = ((mem_size - 1) >> PAGE_SHIFT) + 1;
  348. dimm->grain = 8;
  349. dimm->dtype = DEV_X8;
  350. dimm->mtype = MEM_DDR3;
  351. dimm->edac_mode = EDAC_SECDED;
  352. res = edac_mc_add_mc(mci);
  353. if (res < 0)
  354. goto err;
  355. /* Only the Arria10 has separate IRQs */
  356. if (irq2 > 0) {
  357. /* Arria10 specific initialization */
  358. res = a10_init(mc_vbase);
  359. if (res < 0)
  360. goto err2;
  361. res = devm_request_irq(&pdev->dev, irq2,
  362. altr_sdram_mc_err_handler,
  363. IRQF_SHARED, dev_name(&pdev->dev), mci);
  364. if (res < 0) {
  365. edac_mc_printk(mci, KERN_ERR,
  366. "Unable to request irq %d\n", irq2);
  367. res = -ENODEV;
  368. goto err2;
  369. }
  370. res = a10_unmask_irq(pdev, A10_DDR0_IRQ_MASK);
  371. if (res < 0)
  372. goto err2;
  373. irqflags = IRQF_SHARED;
  374. }
  375. res = devm_request_irq(&pdev->dev, irq, altr_sdram_mc_err_handler,
  376. irqflags, dev_name(&pdev->dev), mci);
  377. if (res < 0) {
  378. edac_mc_printk(mci, KERN_ERR,
  379. "Unable to request irq %d\n", irq);
  380. res = -ENODEV;
  381. goto err2;
  382. }
  383. /* Infrastructure ready - enable the IRQ */
  384. if (regmap_update_bits(drvdata->mc_vbase, priv->ecc_irq_en_offset,
  385. priv->ecc_irq_en_mask, priv->ecc_irq_en_mask)) {
  386. edac_mc_printk(mci, KERN_ERR,
  387. "Error enabling SDRAM ECC IRQ\n");
  388. res = -ENODEV;
  389. goto err2;
  390. }
  391. altr_sdr_mc_create_debugfs_nodes(mci);
  392. devres_close_group(&pdev->dev, NULL);
  393. return 0;
  394. err2:
  395. edac_mc_del_mc(&pdev->dev);
  396. err:
  397. devres_release_group(&pdev->dev, NULL);
  398. free:
  399. edac_mc_free(mci);
  400. edac_printk(KERN_ERR, EDAC_MC,
  401. "EDAC Probe Failed; Error %d\n", res);
  402. return res;
  403. }
  404. static int altr_sdram_remove(struct platform_device *pdev)
  405. {
  406. struct mem_ctl_info *mci = platform_get_drvdata(pdev);
  407. edac_mc_del_mc(&pdev->dev);
  408. edac_mc_free(mci);
  409. platform_set_drvdata(pdev, NULL);
  410. return 0;
  411. }
  412. /*
  413. * If you want to suspend, need to disable EDAC by removing it
  414. * from the device tree or defconfig.
  415. */
  416. #ifdef CONFIG_PM
  417. static int altr_sdram_prepare(struct device *dev)
  418. {
  419. pr_err("Suspend not allowed when EDAC is enabled.\n");
  420. return -EPERM;
  421. }
  422. static const struct dev_pm_ops altr_sdram_pm_ops = {
  423. .prepare = altr_sdram_prepare,
  424. };
  425. #endif
  426. static struct platform_driver altr_sdram_edac_driver = {
  427. .probe = altr_sdram_probe,
  428. .remove = altr_sdram_remove,
  429. .driver = {
  430. .name = "altr_sdram_edac",
  431. #ifdef CONFIG_PM
  432. .pm = &altr_sdram_pm_ops,
  433. #endif
  434. .of_match_table = altr_sdram_ctrl_of_match,
  435. },
  436. };
  437. module_platform_driver(altr_sdram_edac_driver);
  438. MODULE_LICENSE("GPL v2");
  439. MODULE_AUTHOR("Thor Thayer");
  440. MODULE_DESCRIPTION("EDAC Driver for Altera SDRAM Controller");