mmdc.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581
  1. /*
  2. * Copyright 2011,2016 Freescale Semiconductor, Inc.
  3. * Copyright 2011 Linaro Ltd.
  4. *
  5. * The code contained herein is licensed under the GNU General Public
  6. * License. You may obtain a copy of the GNU General Public License
  7. * Version 2 or later at the following locations:
  8. *
  9. * http://www.opensource.org/licenses/gpl-license.html
  10. * http://www.gnu.org/copyleft/gpl.html
  11. */
  12. #include <linux/hrtimer.h>
  13. #include <linux/init.h>
  14. #include <linux/interrupt.h>
  15. #include <linux/io.h>
  16. #include <linux/module.h>
  17. #include <linux/of.h>
  18. #include <linux/of_address.h>
  19. #include <linux/of_device.h>
  20. #include <linux/perf_event.h>
  21. #include <linux/slab.h>
  22. #include "common.h"
  23. #define MMDC_MAPSR 0x404
  24. #define BP_MMDC_MAPSR_PSD 0
  25. #define BP_MMDC_MAPSR_PSS 4
  26. #define MMDC_MDMISC 0x18
  27. #define BM_MMDC_MDMISC_DDR_TYPE 0x18
  28. #define BP_MMDC_MDMISC_DDR_TYPE 0x3
  29. #define TOTAL_CYCLES 0x0
  30. #define BUSY_CYCLES 0x1
  31. #define READ_ACCESSES 0x2
  32. #define WRITE_ACCESSES 0x3
  33. #define READ_BYTES 0x4
  34. #define WRITE_BYTES 0x5
  35. /* Enables, resets, freezes, overflow profiling*/
  36. #define DBG_DIS 0x0
  37. #define DBG_EN 0x1
  38. #define DBG_RST 0x2
  39. #define PRF_FRZ 0x4
  40. #define CYC_OVF 0x8
  41. #define PROFILE_SEL 0x10
  42. #define MMDC_MADPCR0 0x410
  43. #define MMDC_MADPSR0 0x418
  44. #define MMDC_MADPSR1 0x41C
  45. #define MMDC_MADPSR2 0x420
  46. #define MMDC_MADPSR3 0x424
  47. #define MMDC_MADPSR4 0x428
  48. #define MMDC_MADPSR5 0x42C
  49. #define MMDC_NUM_COUNTERS 6
  50. #define MMDC_FLAG_PROFILE_SEL 0x1
  51. #define to_mmdc_pmu(p) container_of(p, struct mmdc_pmu, pmu)
  52. static enum cpuhp_state cpuhp_mmdc_state;
  53. static int ddr_type;
  54. struct fsl_mmdc_devtype_data {
  55. unsigned int flags;
  56. };
  57. static const struct fsl_mmdc_devtype_data imx6q_data = {
  58. };
  59. static const struct fsl_mmdc_devtype_data imx6qp_data = {
  60. .flags = MMDC_FLAG_PROFILE_SEL,
  61. };
  62. static const struct of_device_id imx_mmdc_dt_ids[] = {
  63. { .compatible = "fsl,imx6q-mmdc", .data = (void *)&imx6q_data},
  64. { .compatible = "fsl,imx6qp-mmdc", .data = (void *)&imx6qp_data},
  65. { /* sentinel */ }
  66. };
  67. #ifdef CONFIG_PERF_EVENTS
  68. static DEFINE_IDA(mmdc_ida);
  69. PMU_EVENT_ATTR_STRING(total-cycles, mmdc_pmu_total_cycles, "event=0x00")
  70. PMU_EVENT_ATTR_STRING(busy-cycles, mmdc_pmu_busy_cycles, "event=0x01")
  71. PMU_EVENT_ATTR_STRING(read-accesses, mmdc_pmu_read_accesses, "event=0x02")
  72. PMU_EVENT_ATTR_STRING(write-accesses, mmdc_pmu_write_accesses, "config=0x03")
  73. PMU_EVENT_ATTR_STRING(read-bytes, mmdc_pmu_read_bytes, "event=0x04")
  74. PMU_EVENT_ATTR_STRING(read-bytes.unit, mmdc_pmu_read_bytes_unit, "MB");
  75. PMU_EVENT_ATTR_STRING(read-bytes.scale, mmdc_pmu_read_bytes_scale, "0.000001");
  76. PMU_EVENT_ATTR_STRING(write-bytes, mmdc_pmu_write_bytes, "event=0x05")
  77. PMU_EVENT_ATTR_STRING(write-bytes.unit, mmdc_pmu_write_bytes_unit, "MB");
  78. PMU_EVENT_ATTR_STRING(write-bytes.scale, mmdc_pmu_write_bytes_scale, "0.000001");
  79. struct mmdc_pmu {
  80. struct pmu pmu;
  81. void __iomem *mmdc_base;
  82. cpumask_t cpu;
  83. struct hrtimer hrtimer;
  84. unsigned int active_events;
  85. struct device *dev;
  86. struct perf_event *mmdc_events[MMDC_NUM_COUNTERS];
  87. struct hlist_node node;
  88. struct fsl_mmdc_devtype_data *devtype_data;
  89. };
  90. /*
  91. * Polling period is set to one second, overflow of total-cycles (the fastest
  92. * increasing counter) takes ten seconds so one second is safe
  93. */
  94. static unsigned int mmdc_pmu_poll_period_us = 1000000;
  95. module_param_named(pmu_pmu_poll_period_us, mmdc_pmu_poll_period_us, uint,
  96. S_IRUGO | S_IWUSR);
  97. static ktime_t mmdc_pmu_timer_period(void)
  98. {
  99. return ns_to_ktime((u64)mmdc_pmu_poll_period_us * 1000);
  100. }
  101. static ssize_t mmdc_pmu_cpumask_show(struct device *dev,
  102. struct device_attribute *attr, char *buf)
  103. {
  104. struct mmdc_pmu *pmu_mmdc = dev_get_drvdata(dev);
  105. return cpumap_print_to_pagebuf(true, buf, &pmu_mmdc->cpu);
  106. }
  107. static struct device_attribute mmdc_pmu_cpumask_attr =
  108. __ATTR(cpumask, S_IRUGO, mmdc_pmu_cpumask_show, NULL);
  109. static struct attribute *mmdc_pmu_cpumask_attrs[] = {
  110. &mmdc_pmu_cpumask_attr.attr,
  111. NULL,
  112. };
  113. static struct attribute_group mmdc_pmu_cpumask_attr_group = {
  114. .attrs = mmdc_pmu_cpumask_attrs,
  115. };
  116. static struct attribute *mmdc_pmu_events_attrs[] = {
  117. &mmdc_pmu_total_cycles.attr.attr,
  118. &mmdc_pmu_busy_cycles.attr.attr,
  119. &mmdc_pmu_read_accesses.attr.attr,
  120. &mmdc_pmu_write_accesses.attr.attr,
  121. &mmdc_pmu_read_bytes.attr.attr,
  122. &mmdc_pmu_read_bytes_unit.attr.attr,
  123. &mmdc_pmu_read_bytes_scale.attr.attr,
  124. &mmdc_pmu_write_bytes.attr.attr,
  125. &mmdc_pmu_write_bytes_unit.attr.attr,
  126. &mmdc_pmu_write_bytes_scale.attr.attr,
  127. NULL,
  128. };
  129. static struct attribute_group mmdc_pmu_events_attr_group = {
  130. .name = "events",
  131. .attrs = mmdc_pmu_events_attrs,
  132. };
  133. PMU_FORMAT_ATTR(event, "config:0-63");
  134. static struct attribute *mmdc_pmu_format_attrs[] = {
  135. &format_attr_event.attr,
  136. NULL,
  137. };
  138. static struct attribute_group mmdc_pmu_format_attr_group = {
  139. .name = "format",
  140. .attrs = mmdc_pmu_format_attrs,
  141. };
  142. static const struct attribute_group *attr_groups[] = {
  143. &mmdc_pmu_events_attr_group,
  144. &mmdc_pmu_format_attr_group,
  145. &mmdc_pmu_cpumask_attr_group,
  146. NULL,
  147. };
  148. static u32 mmdc_pmu_read_counter(struct mmdc_pmu *pmu_mmdc, int cfg)
  149. {
  150. void __iomem *mmdc_base, *reg;
  151. mmdc_base = pmu_mmdc->mmdc_base;
  152. switch (cfg) {
  153. case TOTAL_CYCLES:
  154. reg = mmdc_base + MMDC_MADPSR0;
  155. break;
  156. case BUSY_CYCLES:
  157. reg = mmdc_base + MMDC_MADPSR1;
  158. break;
  159. case READ_ACCESSES:
  160. reg = mmdc_base + MMDC_MADPSR2;
  161. break;
  162. case WRITE_ACCESSES:
  163. reg = mmdc_base + MMDC_MADPSR3;
  164. break;
  165. case READ_BYTES:
  166. reg = mmdc_base + MMDC_MADPSR4;
  167. break;
  168. case WRITE_BYTES:
  169. reg = mmdc_base + MMDC_MADPSR5;
  170. break;
  171. default:
  172. return WARN_ONCE(1,
  173. "invalid configuration %d for mmdc counter", cfg);
  174. }
  175. return readl(reg);
  176. }
  177. static int mmdc_pmu_offline_cpu(unsigned int cpu, struct hlist_node *node)
  178. {
  179. struct mmdc_pmu *pmu_mmdc = hlist_entry_safe(node, struct mmdc_pmu, node);
  180. int target;
  181. if (!cpumask_test_and_clear_cpu(cpu, &pmu_mmdc->cpu))
  182. return 0;
  183. target = cpumask_any_but(cpu_online_mask, cpu);
  184. if (target >= nr_cpu_ids)
  185. return 0;
  186. perf_pmu_migrate_context(&pmu_mmdc->pmu, cpu, target);
  187. cpumask_set_cpu(target, &pmu_mmdc->cpu);
  188. return 0;
  189. }
  190. static bool mmdc_pmu_group_event_is_valid(struct perf_event *event,
  191. struct pmu *pmu,
  192. unsigned long *used_counters)
  193. {
  194. int cfg = event->attr.config;
  195. if (is_software_event(event))
  196. return true;
  197. if (event->pmu != pmu)
  198. return false;
  199. return !test_and_set_bit(cfg, used_counters);
  200. }
  201. /*
  202. * Each event has a single fixed-purpose counter, so we can only have a
  203. * single active event for each at any point in time. Here we just check
  204. * for duplicates, and rely on mmdc_pmu_event_init to verify that the HW
  205. * event numbers are valid.
  206. */
  207. static bool mmdc_pmu_group_is_valid(struct perf_event *event)
  208. {
  209. struct pmu *pmu = event->pmu;
  210. struct perf_event *leader = event->group_leader;
  211. struct perf_event *sibling;
  212. unsigned long counter_mask = 0;
  213. set_bit(leader->attr.config, &counter_mask);
  214. if (event != leader) {
  215. if (!mmdc_pmu_group_event_is_valid(event, pmu, &counter_mask))
  216. return false;
  217. }
  218. list_for_each_entry(sibling, &leader->sibling_list, group_entry) {
  219. if (!mmdc_pmu_group_event_is_valid(sibling, pmu, &counter_mask))
  220. return false;
  221. }
  222. return true;
  223. }
  224. static int mmdc_pmu_event_init(struct perf_event *event)
  225. {
  226. struct mmdc_pmu *pmu_mmdc = to_mmdc_pmu(event->pmu);
  227. int cfg = event->attr.config;
  228. if (event->attr.type != event->pmu->type)
  229. return -ENOENT;
  230. if (is_sampling_event(event) || event->attach_state & PERF_ATTACH_TASK)
  231. return -EOPNOTSUPP;
  232. if (event->cpu < 0) {
  233. dev_warn(pmu_mmdc->dev, "Can't provide per-task data!\n");
  234. return -EOPNOTSUPP;
  235. }
  236. if (event->attr.exclude_user ||
  237. event->attr.exclude_kernel ||
  238. event->attr.exclude_hv ||
  239. event->attr.exclude_idle ||
  240. event->attr.exclude_host ||
  241. event->attr.exclude_guest ||
  242. event->attr.sample_period)
  243. return -EINVAL;
  244. if (cfg < 0 || cfg >= MMDC_NUM_COUNTERS)
  245. return -EINVAL;
  246. if (!mmdc_pmu_group_is_valid(event))
  247. return -EINVAL;
  248. event->cpu = cpumask_first(&pmu_mmdc->cpu);
  249. return 0;
  250. }
  251. static void mmdc_pmu_event_update(struct perf_event *event)
  252. {
  253. struct mmdc_pmu *pmu_mmdc = to_mmdc_pmu(event->pmu);
  254. struct hw_perf_event *hwc = &event->hw;
  255. u64 delta, prev_raw_count, new_raw_count;
  256. do {
  257. prev_raw_count = local64_read(&hwc->prev_count);
  258. new_raw_count = mmdc_pmu_read_counter(pmu_mmdc,
  259. event->attr.config);
  260. } while (local64_cmpxchg(&hwc->prev_count, prev_raw_count,
  261. new_raw_count) != prev_raw_count);
  262. delta = (new_raw_count - prev_raw_count) & 0xFFFFFFFF;
  263. local64_add(delta, &event->count);
  264. }
  265. static void mmdc_pmu_event_start(struct perf_event *event, int flags)
  266. {
  267. struct mmdc_pmu *pmu_mmdc = to_mmdc_pmu(event->pmu);
  268. struct hw_perf_event *hwc = &event->hw;
  269. void __iomem *mmdc_base, *reg;
  270. u32 val;
  271. mmdc_base = pmu_mmdc->mmdc_base;
  272. reg = mmdc_base + MMDC_MADPCR0;
  273. /*
  274. * hrtimer is required because mmdc does not provide an interrupt so
  275. * polling is necessary
  276. */
  277. hrtimer_start(&pmu_mmdc->hrtimer, mmdc_pmu_timer_period(),
  278. HRTIMER_MODE_REL_PINNED);
  279. local64_set(&hwc->prev_count, 0);
  280. writel(DBG_RST, reg);
  281. val = DBG_EN;
  282. if (pmu_mmdc->devtype_data->flags & MMDC_FLAG_PROFILE_SEL)
  283. val |= PROFILE_SEL;
  284. writel(val, reg);
  285. }
  286. static int mmdc_pmu_event_add(struct perf_event *event, int flags)
  287. {
  288. struct mmdc_pmu *pmu_mmdc = to_mmdc_pmu(event->pmu);
  289. struct hw_perf_event *hwc = &event->hw;
  290. int cfg = event->attr.config;
  291. if (flags & PERF_EF_START)
  292. mmdc_pmu_event_start(event, flags);
  293. if (pmu_mmdc->mmdc_events[cfg] != NULL)
  294. return -EAGAIN;
  295. pmu_mmdc->mmdc_events[cfg] = event;
  296. pmu_mmdc->active_events++;
  297. local64_set(&hwc->prev_count, mmdc_pmu_read_counter(pmu_mmdc, cfg));
  298. return 0;
  299. }
  300. static void mmdc_pmu_event_stop(struct perf_event *event, int flags)
  301. {
  302. struct mmdc_pmu *pmu_mmdc = to_mmdc_pmu(event->pmu);
  303. void __iomem *mmdc_base, *reg;
  304. mmdc_base = pmu_mmdc->mmdc_base;
  305. reg = mmdc_base + MMDC_MADPCR0;
  306. writel(PRF_FRZ, reg);
  307. mmdc_pmu_event_update(event);
  308. }
  309. static void mmdc_pmu_event_del(struct perf_event *event, int flags)
  310. {
  311. struct mmdc_pmu *pmu_mmdc = to_mmdc_pmu(event->pmu);
  312. int cfg = event->attr.config;
  313. pmu_mmdc->mmdc_events[cfg] = NULL;
  314. pmu_mmdc->active_events--;
  315. if (pmu_mmdc->active_events == 0)
  316. hrtimer_cancel(&pmu_mmdc->hrtimer);
  317. mmdc_pmu_event_stop(event, PERF_EF_UPDATE);
  318. }
  319. static void mmdc_pmu_overflow_handler(struct mmdc_pmu *pmu_mmdc)
  320. {
  321. int i;
  322. for (i = 0; i < MMDC_NUM_COUNTERS; i++) {
  323. struct perf_event *event = pmu_mmdc->mmdc_events[i];
  324. if (event)
  325. mmdc_pmu_event_update(event);
  326. }
  327. }
  328. static enum hrtimer_restart mmdc_pmu_timer_handler(struct hrtimer *hrtimer)
  329. {
  330. struct mmdc_pmu *pmu_mmdc = container_of(hrtimer, struct mmdc_pmu,
  331. hrtimer);
  332. mmdc_pmu_overflow_handler(pmu_mmdc);
  333. hrtimer_forward_now(hrtimer, mmdc_pmu_timer_period());
  334. return HRTIMER_RESTART;
  335. }
  336. static int mmdc_pmu_init(struct mmdc_pmu *pmu_mmdc,
  337. void __iomem *mmdc_base, struct device *dev)
  338. {
  339. int mmdc_num;
  340. *pmu_mmdc = (struct mmdc_pmu) {
  341. .pmu = (struct pmu) {
  342. .task_ctx_nr = perf_invalid_context,
  343. .attr_groups = attr_groups,
  344. .event_init = mmdc_pmu_event_init,
  345. .add = mmdc_pmu_event_add,
  346. .del = mmdc_pmu_event_del,
  347. .start = mmdc_pmu_event_start,
  348. .stop = mmdc_pmu_event_stop,
  349. .read = mmdc_pmu_event_update,
  350. },
  351. .mmdc_base = mmdc_base,
  352. .dev = dev,
  353. .active_events = 0,
  354. };
  355. mmdc_num = ida_simple_get(&mmdc_ida, 0, 0, GFP_KERNEL);
  356. return mmdc_num;
  357. }
  358. static int imx_mmdc_remove(struct platform_device *pdev)
  359. {
  360. struct mmdc_pmu *pmu_mmdc = platform_get_drvdata(pdev);
  361. cpuhp_state_remove_instance_nocalls(cpuhp_mmdc_state, &pmu_mmdc->node);
  362. perf_pmu_unregister(&pmu_mmdc->pmu);
  363. kfree(pmu_mmdc);
  364. return 0;
  365. }
  366. static int imx_mmdc_perf_init(struct platform_device *pdev, void __iomem *mmdc_base)
  367. {
  368. struct mmdc_pmu *pmu_mmdc;
  369. char *name;
  370. int mmdc_num;
  371. int ret;
  372. const struct of_device_id *of_id =
  373. of_match_device(imx_mmdc_dt_ids, &pdev->dev);
  374. pmu_mmdc = kzalloc(sizeof(*pmu_mmdc), GFP_KERNEL);
  375. if (!pmu_mmdc) {
  376. pr_err("failed to allocate PMU device!\n");
  377. return -ENOMEM;
  378. }
  379. /* The first instance registers the hotplug state */
  380. if (!cpuhp_mmdc_state) {
  381. ret = cpuhp_setup_state_multi(CPUHP_AP_ONLINE_DYN,
  382. "perf/arm/mmdc:online", NULL,
  383. mmdc_pmu_offline_cpu);
  384. if (ret < 0) {
  385. pr_err("cpuhp_setup_state_multi failed\n");
  386. goto pmu_free;
  387. }
  388. cpuhp_mmdc_state = ret;
  389. }
  390. mmdc_num = mmdc_pmu_init(pmu_mmdc, mmdc_base, &pdev->dev);
  391. if (mmdc_num == 0)
  392. name = "mmdc";
  393. else
  394. name = devm_kasprintf(&pdev->dev,
  395. GFP_KERNEL, "mmdc%d", mmdc_num);
  396. pmu_mmdc->devtype_data = (struct fsl_mmdc_devtype_data *)of_id->data;
  397. hrtimer_init(&pmu_mmdc->hrtimer, CLOCK_MONOTONIC,
  398. HRTIMER_MODE_REL);
  399. pmu_mmdc->hrtimer.function = mmdc_pmu_timer_handler;
  400. cpumask_set_cpu(raw_smp_processor_id(), &pmu_mmdc->cpu);
  401. /* Register the pmu instance for cpu hotplug */
  402. cpuhp_state_add_instance_nocalls(cpuhp_mmdc_state, &pmu_mmdc->node);
  403. ret = perf_pmu_register(&(pmu_mmdc->pmu), name, -1);
  404. if (ret)
  405. goto pmu_register_err;
  406. platform_set_drvdata(pdev, pmu_mmdc);
  407. return 0;
  408. pmu_register_err:
  409. pr_warn("MMDC Perf PMU failed (%d), disabled\n", ret);
  410. cpuhp_state_remove_instance_nocalls(cpuhp_mmdc_state, &pmu_mmdc->node);
  411. hrtimer_cancel(&pmu_mmdc->hrtimer);
  412. pmu_free:
  413. kfree(pmu_mmdc);
  414. return ret;
  415. }
  416. #else
  417. #define imx_mmdc_remove NULL
  418. #define imx_mmdc_perf_init(pdev, mmdc_base) 0
  419. #endif
  420. static int imx_mmdc_probe(struct platform_device *pdev)
  421. {
  422. struct device_node *np = pdev->dev.of_node;
  423. void __iomem *mmdc_base, *reg;
  424. u32 val;
  425. int timeout = 0x400;
  426. mmdc_base = of_iomap(np, 0);
  427. WARN_ON(!mmdc_base);
  428. reg = mmdc_base + MMDC_MDMISC;
  429. /* Get ddr type */
  430. val = readl_relaxed(reg);
  431. ddr_type = (val & BM_MMDC_MDMISC_DDR_TYPE) >>
  432. BP_MMDC_MDMISC_DDR_TYPE;
  433. reg = mmdc_base + MMDC_MAPSR;
  434. /* Enable automatic power saving */
  435. val = readl_relaxed(reg);
  436. val &= ~(1 << BP_MMDC_MAPSR_PSD);
  437. writel_relaxed(val, reg);
  438. /* Ensure it's successfully enabled */
  439. while (!(readl_relaxed(reg) & 1 << BP_MMDC_MAPSR_PSS) && --timeout)
  440. cpu_relax();
  441. if (unlikely(!timeout)) {
  442. pr_warn("%s: failed to enable automatic power saving\n",
  443. __func__);
  444. return -EBUSY;
  445. }
  446. return imx_mmdc_perf_init(pdev, mmdc_base);
  447. }
  448. int imx_mmdc_get_ddr_type(void)
  449. {
  450. return ddr_type;
  451. }
  452. static struct platform_driver imx_mmdc_driver = {
  453. .driver = {
  454. .name = "imx-mmdc",
  455. .of_match_table = imx_mmdc_dt_ids,
  456. },
  457. .probe = imx_mmdc_probe,
  458. .remove = imx_mmdc_remove,
  459. };
  460. static int __init imx_mmdc_init(void)
  461. {
  462. return platform_driver_register(&imx_mmdc_driver);
  463. }
  464. postcore_initcall(imx_mmdc_init);