fsl_imx9_ddr_perf.c 25 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887
  1. // SPDX-License-Identifier: GPL-2.0
  2. // Copyright 2023 NXP
  3. #include <linux/bitfield.h>
  4. #include <linux/init.h>
  5. #include <linux/interrupt.h>
  6. #include <linux/io.h>
  7. #include <linux/module.h>
  8. #include <linux/of.h>
  9. #include <linux/platform_device.h>
  10. #include <linux/perf_event.h>
  11. /* Performance monitor configuration */
  12. #define PMCFG1 0x00
  13. #define MX93_PMCFG1_RD_TRANS_FILT_EN BIT(31)
  14. #define MX93_PMCFG1_WR_TRANS_FILT_EN BIT(30)
  15. #define MX93_PMCFG1_RD_BT_FILT_EN BIT(29)
  16. #define MX93_PMCFG1_ID_MASK GENMASK(17, 0)
  17. #define MX95_PMCFG1_WR_BEAT_FILT_EN BIT(31)
  18. #define MX95_PMCFG1_RD_BEAT_FILT_EN BIT(30)
  19. #define PMCFG2 0x04
  20. #define MX93_PMCFG2_ID GENMASK(17, 0)
  21. #define PMCFG3 0x08
  22. #define PMCFG4 0x0C
  23. #define PMCFG5 0x10
  24. #define PMCFG6 0x14
  25. #define MX95_PMCFG_ID_MASK GENMASK(9, 0)
  26. #define MX95_PMCFG_ID GENMASK(25, 16)
  27. /* Global control register affects all counters and takes priority over local control registers */
  28. #define PMGC0 0x40
  29. /* Global control register bits */
  30. #define PMGC0_FAC BIT(31)
  31. #define PMGC0_PMIE BIT(30)
  32. #define PMGC0_FCECE BIT(29)
  33. /*
  34. * 64bit counter0 exclusively dedicated to counting cycles
  35. * 32bit counters monitor counter-specific events in addition to counting reference events
  36. */
  37. #define PMLCA(n) (0x40 + 0x10 + (0x10 * n))
  38. #define PMLCB(n) (0x40 + 0x14 + (0x10 * n))
  39. #define PMC(n) (0x40 + 0x18 + (0x10 * n))
  40. /* Local control register bits */
  41. #define PMLCA_FC BIT(31)
  42. #define PMLCA_CE BIT(26)
  43. #define PMLCA_EVENT GENMASK(22, 16)
  44. #define NUM_COUNTERS 11
  45. #define CYCLES_COUNTER 0
  46. #define CYCLES_EVENT_ID 0
  47. #define CONFIG_EVENT_MASK GENMASK(7, 0)
  48. #define CONFIG_COUNTER_MASK GENMASK(23, 16)
  49. #define to_ddr_pmu(p) container_of(p, struct ddr_pmu, pmu)
  50. #define DDR_PERF_DEV_NAME "imx9_ddr"
  51. #define DDR_CPUHP_CB_NAME DDR_PERF_DEV_NAME "_perf_pmu"
  52. static DEFINE_IDA(ddr_ida);
  53. /*
  54. * V1 support 1 read transaction, 1 write transaction and 1 read beats
  55. * event which corresponding respecitively to counter 2, 3 and 4.
  56. */
  57. #define DDR_PERF_AXI_FILTER_V1 0x1
  58. /*
  59. * V2 support 1 read beats and 3 write beats events which corresponding
  60. * respecitively to counter 2-5.
  61. */
  62. #define DDR_PERF_AXI_FILTER_V2 0x2
  63. struct imx_ddr_devtype_data {
  64. const char *identifier; /* system PMU identifier for userspace */
  65. unsigned int filter_ver; /* AXI filter version */
  66. };
  67. struct ddr_pmu {
  68. struct pmu pmu;
  69. void __iomem *base;
  70. unsigned int cpu;
  71. struct hlist_node node;
  72. struct device *dev;
  73. struct perf_event *events[NUM_COUNTERS];
  74. int active_events;
  75. enum cpuhp_state cpuhp_state;
  76. const struct imx_ddr_devtype_data *devtype_data;
  77. int irq;
  78. int id;
  79. };
  80. static const struct imx_ddr_devtype_data imx91_devtype_data = {
  81. .identifier = "imx91",
  82. .filter_ver = DDR_PERF_AXI_FILTER_V1
  83. };
  84. static const struct imx_ddr_devtype_data imx93_devtype_data = {
  85. .identifier = "imx93",
  86. .filter_ver = DDR_PERF_AXI_FILTER_V1
  87. };
  88. static const struct imx_ddr_devtype_data imx94_devtype_data = {
  89. .identifier = "imx94",
  90. .filter_ver = DDR_PERF_AXI_FILTER_V2
  91. };
  92. static const struct imx_ddr_devtype_data imx95_devtype_data = {
  93. .identifier = "imx95",
  94. .filter_ver = DDR_PERF_AXI_FILTER_V2
  95. };
  96. static inline bool axi_filter_v1(struct ddr_pmu *pmu)
  97. {
  98. return pmu->devtype_data->filter_ver == DDR_PERF_AXI_FILTER_V1;
  99. }
  100. static inline bool axi_filter_v2(struct ddr_pmu *pmu)
  101. {
  102. return pmu->devtype_data->filter_ver == DDR_PERF_AXI_FILTER_V2;
  103. }
  104. static const struct of_device_id imx_ddr_pmu_dt_ids[] = {
  105. { .compatible = "fsl,imx91-ddr-pmu", .data = &imx91_devtype_data },
  106. { .compatible = "fsl,imx93-ddr-pmu", .data = &imx93_devtype_data },
  107. { .compatible = "fsl,imx94-ddr-pmu", .data = &imx94_devtype_data },
  108. { .compatible = "fsl,imx95-ddr-pmu", .data = &imx95_devtype_data },
  109. { /* sentinel */ }
  110. };
  111. MODULE_DEVICE_TABLE(of, imx_ddr_pmu_dt_ids);
  112. static ssize_t ddr_perf_identifier_show(struct device *dev,
  113. struct device_attribute *attr,
  114. char *page)
  115. {
  116. struct ddr_pmu *pmu = dev_get_drvdata(dev);
  117. return sysfs_emit(page, "%s\n", pmu->devtype_data->identifier);
  118. }
  119. static struct device_attribute ddr_perf_identifier_attr =
  120. __ATTR(identifier, 0444, ddr_perf_identifier_show, NULL);
  121. static struct attribute *ddr_perf_identifier_attrs[] = {
  122. &ddr_perf_identifier_attr.attr,
  123. NULL,
  124. };
  125. static struct attribute_group ddr_perf_identifier_attr_group = {
  126. .attrs = ddr_perf_identifier_attrs,
  127. };
  128. static ssize_t ddr_perf_cpumask_show(struct device *dev,
  129. struct device_attribute *attr, char *buf)
  130. {
  131. struct ddr_pmu *pmu = dev_get_drvdata(dev);
  132. return cpumap_print_to_pagebuf(true, buf, cpumask_of(pmu->cpu));
  133. }
  134. static struct device_attribute ddr_perf_cpumask_attr =
  135. __ATTR(cpumask, 0444, ddr_perf_cpumask_show, NULL);
  136. static struct attribute *ddr_perf_cpumask_attrs[] = {
  137. &ddr_perf_cpumask_attr.attr,
  138. NULL,
  139. };
  140. static const struct attribute_group ddr_perf_cpumask_attr_group = {
  141. .attrs = ddr_perf_cpumask_attrs,
  142. };
  143. struct imx9_pmu_events_attr {
  144. struct device_attribute attr;
  145. u64 id;
  146. const struct imx_ddr_devtype_data *devtype_data;
  147. };
  148. static ssize_t ddr_pmu_event_show(struct device *dev,
  149. struct device_attribute *attr, char *page)
  150. {
  151. struct imx9_pmu_events_attr *pmu_attr;
  152. pmu_attr = container_of(attr, struct imx9_pmu_events_attr, attr);
  153. return sysfs_emit(page, "event=0x%02llx\n", pmu_attr->id);
  154. }
  155. #define COUNTER_OFFSET_IN_EVENT 8
  156. #define ID(counter, id) ((counter << COUNTER_OFFSET_IN_EVENT) | id)
  157. #define DDR_PMU_EVENT_ATTR_COMM(_name, _id, _data) \
  158. (&((struct imx9_pmu_events_attr[]) { \
  159. { .attr = __ATTR(_name, 0444, ddr_pmu_event_show, NULL),\
  160. .id = _id, \
  161. .devtype_data = _data, } \
  162. })[0].attr.attr)
  163. #define IMX9_DDR_PMU_EVENT_ATTR(_name, _id) \
  164. DDR_PMU_EVENT_ATTR_COMM(_name, _id, NULL)
  165. #define IMX93_DDR_PMU_EVENT_ATTR(_name, _id) \
  166. DDR_PMU_EVENT_ATTR_COMM(_name, _id, &imx93_devtype_data)
  167. #define IMX95_DDR_PMU_EVENT_ATTR(_name, _id) \
  168. DDR_PMU_EVENT_ATTR_COMM(_name, _id, &imx95_devtype_data)
  169. static struct attribute *ddr_perf_events_attrs[] = {
  170. /* counter0 cycles event */
  171. IMX9_DDR_PMU_EVENT_ATTR(cycles, 0),
  172. /* reference events for all normal counters, need assert DEBUG19[21] bit */
  173. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ddrc1_rmw_for_ecc, 12),
  174. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_rreorder, 13),
  175. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_wreorder, 14),
  176. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_0, 15),
  177. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_1, 16),
  178. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_2, 17),
  179. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_3, 18),
  180. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_4, 19),
  181. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_5, 22),
  182. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_6, 23),
  183. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_7, 24),
  184. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_8, 25),
  185. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_9, 26),
  186. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_10, 27),
  187. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_11, 28),
  188. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_12, 31),
  189. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_13, 59),
  190. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_15, 61),
  191. IMX9_DDR_PMU_EVENT_ATTR(ddrc_pm_29, 63),
  192. /* counter1 specific events */
  193. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_0, ID(1, 64)),
  194. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_1, ID(1, 65)),
  195. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_2, ID(1, 66)),
  196. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_3, ID(1, 67)),
  197. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_4, ID(1, 68)),
  198. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_5, ID(1, 69)),
  199. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_6, ID(1, 70)),
  200. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_riq_7, ID(1, 71)),
  201. /* counter2 specific events */
  202. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_0, ID(2, 64)),
  203. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_1, ID(2, 65)),
  204. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_2, ID(2, 66)),
  205. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_3, ID(2, 67)),
  206. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_4, ID(2, 68)),
  207. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_5, ID(2, 69)),
  208. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_6, ID(2, 70)),
  209. IMX9_DDR_PMU_EVENT_ATTR(ddrc_ld_wiq_7, ID(2, 71)),
  210. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_empty, ID(2, 72)),
  211. IMX93_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_trans_filt, ID(2, 73)), /* imx93 specific*/
  212. IMX95_DDR_PMU_EVENT_ATTR(eddrtq_pm_wr_beat_filt, ID(2, 73)), /* imx95 specific*/
  213. /* counter3 specific events */
  214. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_0, ID(3, 64)),
  215. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_1, ID(3, 65)),
  216. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_2, ID(3, 66)),
  217. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_3, ID(3, 67)),
  218. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_4, ID(3, 68)),
  219. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_5, ID(3, 69)),
  220. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_6, ID(3, 70)),
  221. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_collision_7, ID(3, 71)),
  222. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_full, ID(3, 72)),
  223. IMX93_DDR_PMU_EVENT_ATTR(eddrtq_pm_wr_trans_filt, ID(3, 73)), /* imx93 specific*/
  224. IMX95_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt2, ID(3, 73)), /* imx95 specific*/
  225. /* counter4 specific events */
  226. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_0, ID(4, 64)),
  227. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_1, ID(4, 65)),
  228. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_2, ID(4, 66)),
  229. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_3, ID(4, 67)),
  230. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_4, ID(4, 68)),
  231. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_5, ID(4, 69)),
  232. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_6, ID(4, 70)),
  233. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_row_open_7, ID(4, 71)),
  234. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_rdq2_rmw, ID(4, 72)),
  235. IMX93_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt, ID(4, 73)), /* imx93 specific*/
  236. IMX95_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt1, ID(4, 73)), /* imx95 specific*/
  237. /* counter5 specific events */
  238. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_0, ID(5, 64)),
  239. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_1, ID(5, 65)),
  240. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_2, ID(5, 66)),
  241. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_3, ID(5, 67)),
  242. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_4, ID(5, 68)),
  243. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_5, ID(5, 69)),
  244. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_6, ID(5, 70)),
  245. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_start_7, ID(5, 71)),
  246. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_rdq1, ID(5, 72)),
  247. IMX95_DDR_PMU_EVENT_ATTR(eddrtq_pm_rd_beat_filt0, ID(5, 73)), /* imx95 specific*/
  248. /* counter6 specific events */
  249. IMX9_DDR_PMU_EVENT_ATTR(ddrc_qx_valid_end_0, ID(6, 64)),
  250. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_rdq2, ID(6, 72)),
  251. /* counter7 specific events */
  252. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_1_2_full, ID(7, 64)),
  253. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_wrq0, ID(7, 65)),
  254. /* counter8 specific events */
  255. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_bias_switched, ID(8, 64)),
  256. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_1_4_full, ID(8, 65)),
  257. /* counter9 specific events */
  258. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_wrq1, ID(9, 65)),
  259. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_3_4_full, ID(9, 66)),
  260. /* counter10 specific events */
  261. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_misc_mrk, ID(10, 65)),
  262. IMX9_DDR_PMU_EVENT_ATTR(eddrtq_pmon_ld_rdq0, ID(10, 66)),
  263. NULL,
  264. };
  265. static umode_t
  266. ddr_perf_events_attrs_is_visible(struct kobject *kobj,
  267. struct attribute *attr, int unused)
  268. {
  269. struct pmu *pmu = dev_get_drvdata(kobj_to_dev(kobj));
  270. struct ddr_pmu *ddr_pmu = to_ddr_pmu(pmu);
  271. struct imx9_pmu_events_attr *eattr;
  272. eattr = container_of(attr, typeof(*eattr), attr.attr);
  273. if (!eattr->devtype_data)
  274. return attr->mode;
  275. if (eattr->devtype_data != ddr_pmu->devtype_data &&
  276. eattr->devtype_data->filter_ver != ddr_pmu->devtype_data->filter_ver)
  277. return 0;
  278. return attr->mode;
  279. }
  280. static const struct attribute_group ddr_perf_events_attr_group = {
  281. .name = "events",
  282. .attrs = ddr_perf_events_attrs,
  283. .is_visible = ddr_perf_events_attrs_is_visible,
  284. };
  285. PMU_FORMAT_ATTR(event, "config:0-7,16-23");
  286. PMU_FORMAT_ATTR(counter, "config:8-15");
  287. PMU_FORMAT_ATTR(axi_id, "config1:0-17");
  288. PMU_FORMAT_ATTR(axi_mask, "config2:0-17");
  289. static struct attribute *ddr_perf_format_attrs[] = {
  290. &format_attr_event.attr,
  291. &format_attr_counter.attr,
  292. &format_attr_axi_id.attr,
  293. &format_attr_axi_mask.attr,
  294. NULL,
  295. };
  296. static const struct attribute_group ddr_perf_format_attr_group = {
  297. .name = "format",
  298. .attrs = ddr_perf_format_attrs,
  299. };
  300. static const struct attribute_group *attr_groups[] = {
  301. &ddr_perf_identifier_attr_group,
  302. &ddr_perf_cpumask_attr_group,
  303. &ddr_perf_events_attr_group,
  304. &ddr_perf_format_attr_group,
  305. NULL,
  306. };
  307. static void ddr_perf_clear_counter(struct ddr_pmu *pmu, int counter)
  308. {
  309. if (counter == CYCLES_COUNTER) {
  310. writel(0, pmu->base + PMC(counter) + 0x4);
  311. writel(0, pmu->base + PMC(counter));
  312. } else {
  313. writel(0, pmu->base + PMC(counter));
  314. }
  315. }
  316. static u64 ddr_perf_read_counter(struct ddr_pmu *pmu, int counter)
  317. {
  318. u32 val_lower, val_upper;
  319. u64 val;
  320. if (counter != CYCLES_COUNTER) {
  321. val = readl_relaxed(pmu->base + PMC(counter));
  322. goto out;
  323. }
  324. /* special handling for reading 64bit cycle counter */
  325. do {
  326. val_upper = readl_relaxed(pmu->base + PMC(counter) + 0x4);
  327. val_lower = readl_relaxed(pmu->base + PMC(counter));
  328. } while (val_upper != readl_relaxed(pmu->base + PMC(counter) + 0x4));
  329. val = val_upper;
  330. val = (val << 32);
  331. val |= val_lower;
  332. out:
  333. return val;
  334. }
  335. static void ddr_perf_counter_global_config(struct ddr_pmu *pmu, bool enable)
  336. {
  337. u32 ctrl;
  338. ctrl = readl_relaxed(pmu->base + PMGC0);
  339. if (enable) {
  340. /*
  341. * The performance monitor must be reset before event counting
  342. * sequences. The performance monitor can be reset by first freezing
  343. * one or more counters and then clearing the freeze condition to
  344. * allow the counters to count according to the settings in the
  345. * performance monitor registers. Counters can be frozen individually
  346. * by setting PMLCAn[FC] bits, or simultaneously by setting PMGC0[FAC].
  347. * Simply clearing these freeze bits will then allow the performance
  348. * monitor to begin counting based on the register settings.
  349. */
  350. ctrl |= PMGC0_FAC;
  351. writel(ctrl, pmu->base + PMGC0);
  352. /*
  353. * Freeze all counters disabled, interrupt enabled, and freeze
  354. * counters on condition enabled.
  355. */
  356. ctrl &= ~PMGC0_FAC;
  357. ctrl |= PMGC0_PMIE | PMGC0_FCECE;
  358. writel(ctrl, pmu->base + PMGC0);
  359. } else {
  360. ctrl |= PMGC0_FAC;
  361. ctrl &= ~(PMGC0_PMIE | PMGC0_FCECE);
  362. writel(ctrl, pmu->base + PMGC0);
  363. }
  364. }
  365. static void ddr_perf_counter_local_config(struct ddr_pmu *pmu, int config,
  366. int counter, bool enable)
  367. {
  368. u32 ctrl_a;
  369. int event;
  370. ctrl_a = readl_relaxed(pmu->base + PMLCA(counter));
  371. event = FIELD_GET(CONFIG_EVENT_MASK, config);
  372. if (enable) {
  373. ctrl_a |= PMLCA_FC;
  374. writel(ctrl_a, pmu->base + PMLCA(counter));
  375. ddr_perf_clear_counter(pmu, counter);
  376. /* Freeze counter disabled, condition enabled, and program event.*/
  377. ctrl_a &= ~PMLCA_FC;
  378. ctrl_a |= PMLCA_CE;
  379. ctrl_a &= ~FIELD_PREP(PMLCA_EVENT, 0x7F);
  380. ctrl_a |= FIELD_PREP(PMLCA_EVENT, event);
  381. writel(ctrl_a, pmu->base + PMLCA(counter));
  382. } else {
  383. /* Freeze counter. */
  384. ctrl_a |= PMLCA_FC;
  385. writel(ctrl_a, pmu->base + PMLCA(counter));
  386. }
  387. }
  388. static void imx93_ddr_perf_monitor_config(struct ddr_pmu *pmu, int event,
  389. int counter, int axi_id, int axi_mask)
  390. {
  391. u32 pmcfg1, pmcfg2;
  392. static const u32 mask[] = {
  393. MX93_PMCFG1_RD_TRANS_FILT_EN,
  394. MX93_PMCFG1_WR_TRANS_FILT_EN,
  395. MX93_PMCFG1_RD_BT_FILT_EN
  396. };
  397. pmcfg1 = readl_relaxed(pmu->base + PMCFG1);
  398. if (counter >= 2 && counter <= 4)
  399. pmcfg1 = event == 73 ? pmcfg1 | mask[counter - 2] :
  400. pmcfg1 & ~mask[counter - 2];
  401. pmcfg1 &= ~FIELD_PREP(MX93_PMCFG1_ID_MASK, 0x3FFFF);
  402. pmcfg1 |= FIELD_PREP(MX93_PMCFG1_ID_MASK, axi_mask);
  403. writel_relaxed(pmcfg1, pmu->base + PMCFG1);
  404. pmcfg2 = readl_relaxed(pmu->base + PMCFG2);
  405. pmcfg2 &= ~FIELD_PREP(MX93_PMCFG2_ID, 0x3FFFF);
  406. pmcfg2 |= FIELD_PREP(MX93_PMCFG2_ID, axi_id);
  407. writel_relaxed(pmcfg2, pmu->base + PMCFG2);
  408. }
  409. static void imx95_ddr_perf_monitor_config(struct ddr_pmu *pmu, int event,
  410. int counter, int axi_id, int axi_mask)
  411. {
  412. u32 pmcfg1, pmcfg, offset = 0;
  413. pmcfg1 = readl_relaxed(pmu->base + PMCFG1);
  414. if (event == 73) {
  415. switch (counter) {
  416. case 2:
  417. pmcfg1 |= MX95_PMCFG1_WR_BEAT_FILT_EN;
  418. offset = PMCFG3;
  419. break;
  420. case 3:
  421. pmcfg1 |= MX95_PMCFG1_RD_BEAT_FILT_EN;
  422. offset = PMCFG4;
  423. break;
  424. case 4:
  425. pmcfg1 |= MX95_PMCFG1_RD_BEAT_FILT_EN;
  426. offset = PMCFG5;
  427. break;
  428. case 5:
  429. pmcfg1 |= MX95_PMCFG1_RD_BEAT_FILT_EN;
  430. offset = PMCFG6;
  431. break;
  432. }
  433. } else {
  434. switch (counter) {
  435. case 2:
  436. pmcfg1 &= ~MX95_PMCFG1_WR_BEAT_FILT_EN;
  437. break;
  438. case 3:
  439. case 4:
  440. case 5:
  441. pmcfg1 &= ~MX95_PMCFG1_RD_BEAT_FILT_EN;
  442. break;
  443. }
  444. }
  445. writel_relaxed(pmcfg1, pmu->base + PMCFG1);
  446. if (offset) {
  447. pmcfg = readl_relaxed(pmu->base + offset);
  448. pmcfg &= ~(FIELD_PREP(MX95_PMCFG_ID_MASK, 0x3FF) |
  449. FIELD_PREP(MX95_PMCFG_ID, 0x3FF));
  450. pmcfg |= (FIELD_PREP(MX95_PMCFG_ID_MASK, axi_mask) |
  451. FIELD_PREP(MX95_PMCFG_ID, axi_id));
  452. writel_relaxed(pmcfg, pmu->base + offset);
  453. }
  454. }
  455. static void ddr_perf_event_update(struct perf_event *event)
  456. {
  457. struct ddr_pmu *pmu = to_ddr_pmu(event->pmu);
  458. struct hw_perf_event *hwc = &event->hw;
  459. int counter = hwc->idx;
  460. u64 new_raw_count;
  461. new_raw_count = ddr_perf_read_counter(pmu, counter);
  462. local64_add(new_raw_count, &event->count);
  463. /* clear counter's value every time */
  464. ddr_perf_clear_counter(pmu, counter);
  465. }
  466. static int ddr_perf_event_init(struct perf_event *event)
  467. {
  468. struct ddr_pmu *pmu = to_ddr_pmu(event->pmu);
  469. struct hw_perf_event *hwc = &event->hw;
  470. struct perf_event *sibling;
  471. if (event->attr.type != event->pmu->type)
  472. return -ENOENT;
  473. if (is_sampling_event(event) || event->attach_state & PERF_ATTACH_TASK)
  474. return -EOPNOTSUPP;
  475. if (event->cpu < 0) {
  476. dev_warn(pmu->dev, "Can't provide per-task data!\n");
  477. return -EOPNOTSUPP;
  478. }
  479. /*
  480. * We must NOT create groups containing mixed PMUs, although software
  481. * events are acceptable (for example to create a CCN group
  482. * periodically read when a hrtimer aka cpu-clock leader triggers).
  483. */
  484. if (event->group_leader->pmu != event->pmu &&
  485. !is_software_event(event->group_leader))
  486. return -EINVAL;
  487. for_each_sibling_event(sibling, event->group_leader) {
  488. if (sibling->pmu != event->pmu &&
  489. !is_software_event(sibling))
  490. return -EINVAL;
  491. }
  492. event->cpu = pmu->cpu;
  493. hwc->idx = -1;
  494. return 0;
  495. }
  496. static void ddr_perf_event_start(struct perf_event *event, int flags)
  497. {
  498. struct ddr_pmu *pmu = to_ddr_pmu(event->pmu);
  499. struct hw_perf_event *hwc = &event->hw;
  500. int counter = hwc->idx;
  501. local64_set(&hwc->prev_count, 0);
  502. ddr_perf_counter_local_config(pmu, event->attr.config, counter, true);
  503. hwc->state = 0;
  504. }
  505. static int ddr_perf_alloc_counter(struct ddr_pmu *pmu, int event, int counter)
  506. {
  507. int i;
  508. if (event == CYCLES_EVENT_ID) {
  509. // Cycles counter is dedicated for cycle event.
  510. if (pmu->events[CYCLES_COUNTER] == NULL)
  511. return CYCLES_COUNTER;
  512. } else if (counter != 0) {
  513. // Counter specific event use specific counter.
  514. if (pmu->events[counter] == NULL)
  515. return counter;
  516. } else {
  517. // Auto allocate counter for referene event.
  518. for (i = 1; i < NUM_COUNTERS; i++)
  519. if (pmu->events[i] == NULL)
  520. return i;
  521. }
  522. return -ENOENT;
  523. }
  524. static int ddr_perf_event_add(struct perf_event *event, int flags)
  525. {
  526. struct ddr_pmu *pmu = to_ddr_pmu(event->pmu);
  527. struct hw_perf_event *hwc = &event->hw;
  528. int cfg = event->attr.config;
  529. int cfg1 = event->attr.config1;
  530. int cfg2 = event->attr.config2;
  531. int event_id, counter;
  532. event_id = FIELD_GET(CONFIG_EVENT_MASK, cfg);
  533. counter = FIELD_GET(CONFIG_COUNTER_MASK, cfg);
  534. counter = ddr_perf_alloc_counter(pmu, event_id, counter);
  535. if (counter < 0) {
  536. dev_dbg(pmu->dev, "There are not enough counters\n");
  537. return -EOPNOTSUPP;
  538. }
  539. pmu->events[counter] = event;
  540. pmu->active_events++;
  541. hwc->idx = counter;
  542. hwc->state |= PERF_HES_STOPPED;
  543. if (axi_filter_v1(pmu))
  544. /* read trans, write trans, read beat */
  545. imx93_ddr_perf_monitor_config(pmu, event_id, counter, cfg1, cfg2);
  546. if (axi_filter_v2(pmu))
  547. /* write beat, read beat2, read beat1, read beat */
  548. imx95_ddr_perf_monitor_config(pmu, event_id, counter, cfg1, cfg2);
  549. if (flags & PERF_EF_START)
  550. ddr_perf_event_start(event, flags);
  551. return 0;
  552. }
  553. static void ddr_perf_event_stop(struct perf_event *event, int flags)
  554. {
  555. struct ddr_pmu *pmu = to_ddr_pmu(event->pmu);
  556. struct hw_perf_event *hwc = &event->hw;
  557. int counter = hwc->idx;
  558. ddr_perf_counter_local_config(pmu, event->attr.config, counter, false);
  559. ddr_perf_event_update(event);
  560. hwc->state |= PERF_HES_STOPPED;
  561. }
  562. static void ddr_perf_event_del(struct perf_event *event, int flags)
  563. {
  564. struct ddr_pmu *pmu = to_ddr_pmu(event->pmu);
  565. struct hw_perf_event *hwc = &event->hw;
  566. int counter = hwc->idx;
  567. ddr_perf_event_stop(event, PERF_EF_UPDATE);
  568. pmu->events[counter] = NULL;
  569. pmu->active_events--;
  570. hwc->idx = -1;
  571. }
  572. static void ddr_perf_pmu_enable(struct pmu *pmu)
  573. {
  574. struct ddr_pmu *ddr_pmu = to_ddr_pmu(pmu);
  575. ddr_perf_counter_global_config(ddr_pmu, true);
  576. }
  577. static void ddr_perf_pmu_disable(struct pmu *pmu)
  578. {
  579. struct ddr_pmu *ddr_pmu = to_ddr_pmu(pmu);
  580. ddr_perf_counter_global_config(ddr_pmu, false);
  581. }
  582. static void ddr_perf_init(struct ddr_pmu *pmu, void __iomem *base,
  583. struct device *dev)
  584. {
  585. *pmu = (struct ddr_pmu) {
  586. .pmu = (struct pmu) {
  587. .module = THIS_MODULE,
  588. .capabilities = PERF_PMU_CAP_NO_EXCLUDE,
  589. .task_ctx_nr = perf_invalid_context,
  590. .attr_groups = attr_groups,
  591. .event_init = ddr_perf_event_init,
  592. .add = ddr_perf_event_add,
  593. .del = ddr_perf_event_del,
  594. .start = ddr_perf_event_start,
  595. .stop = ddr_perf_event_stop,
  596. .read = ddr_perf_event_update,
  597. .pmu_enable = ddr_perf_pmu_enable,
  598. .pmu_disable = ddr_perf_pmu_disable,
  599. },
  600. .base = base,
  601. .dev = dev,
  602. };
  603. }
  604. static irqreturn_t ddr_perf_irq_handler(int irq, void *p)
  605. {
  606. struct ddr_pmu *pmu = (struct ddr_pmu *)p;
  607. struct perf_event *event;
  608. int i;
  609. /*
  610. * Counters can generate an interrupt on an overflow when msb of a
  611. * counter changes from 0 to 1. For the interrupt to be signalled,
  612. * below condition mush be satisfied:
  613. * PMGC0[PMIE] = 1, PMGC0[FCECE] = 1, PMLCAn[CE] = 1
  614. * When an interrupt is signalled, PMGC0[FAC] is set by hardware and
  615. * all of the registers are frozen.
  616. * Software can clear the interrupt condition by resetting the performance
  617. * monitor and clearing the most significant bit of the counter that
  618. * generate the overflow.
  619. */
  620. for (i = 0; i < NUM_COUNTERS; i++) {
  621. if (!pmu->events[i])
  622. continue;
  623. event = pmu->events[i];
  624. ddr_perf_event_update(event);
  625. }
  626. ddr_perf_counter_global_config(pmu, true);
  627. return IRQ_HANDLED;
  628. }
  629. static int ddr_perf_offline_cpu(unsigned int cpu, struct hlist_node *node)
  630. {
  631. struct ddr_pmu *pmu = hlist_entry_safe(node, struct ddr_pmu, node);
  632. int target;
  633. if (cpu != pmu->cpu)
  634. return 0;
  635. target = cpumask_any_but(cpu_online_mask, cpu);
  636. if (target >= nr_cpu_ids)
  637. return 0;
  638. perf_pmu_migrate_context(&pmu->pmu, cpu, target);
  639. pmu->cpu = target;
  640. WARN_ON(irq_set_affinity(pmu->irq, cpumask_of(pmu->cpu)));
  641. return 0;
  642. }
  643. static int ddr_perf_probe(struct platform_device *pdev)
  644. {
  645. struct ddr_pmu *pmu;
  646. void __iomem *base;
  647. int ret, irq;
  648. char *name;
  649. base = devm_platform_ioremap_resource(pdev, 0);
  650. if (IS_ERR(base))
  651. return PTR_ERR(base);
  652. pmu = devm_kzalloc(&pdev->dev, sizeof(*pmu), GFP_KERNEL);
  653. if (!pmu)
  654. return -ENOMEM;
  655. ddr_perf_init(pmu, base, &pdev->dev);
  656. pmu->devtype_data = of_device_get_match_data(&pdev->dev);
  657. platform_set_drvdata(pdev, pmu);
  658. pmu->id = ida_alloc(&ddr_ida, GFP_KERNEL);
  659. name = devm_kasprintf(&pdev->dev, GFP_KERNEL, DDR_PERF_DEV_NAME "%d", pmu->id);
  660. if (!name) {
  661. ret = -ENOMEM;
  662. goto format_string_err;
  663. }
  664. pmu->cpu = raw_smp_processor_id();
  665. ret = cpuhp_setup_state_multi(CPUHP_AP_ONLINE_DYN, DDR_CPUHP_CB_NAME,
  666. NULL, ddr_perf_offline_cpu);
  667. if (ret < 0) {
  668. dev_err(&pdev->dev, "Failed to add callbacks for multi state\n");
  669. goto cpuhp_state_err;
  670. }
  671. pmu->cpuhp_state = ret;
  672. /* Register the pmu instance for cpu hotplug */
  673. ret = cpuhp_state_add_instance_nocalls(pmu->cpuhp_state, &pmu->node);
  674. if (ret) {
  675. dev_err(&pdev->dev, "Error %d registering hotplug\n", ret);
  676. goto cpuhp_instance_err;
  677. }
  678. /* Request irq */
  679. irq = platform_get_irq(pdev, 0);
  680. if (irq < 0) {
  681. ret = irq;
  682. goto ddr_perf_err;
  683. }
  684. ret = devm_request_irq(&pdev->dev, irq, ddr_perf_irq_handler,
  685. IRQF_NOBALANCING | IRQF_NO_THREAD,
  686. DDR_CPUHP_CB_NAME, pmu);
  687. if (ret < 0) {
  688. dev_err(&pdev->dev, "Request irq failed: %d", ret);
  689. goto ddr_perf_err;
  690. }
  691. pmu->irq = irq;
  692. ret = irq_set_affinity(pmu->irq, cpumask_of(pmu->cpu));
  693. if (ret) {
  694. dev_err(pmu->dev, "Failed to set interrupt affinity\n");
  695. goto ddr_perf_err;
  696. }
  697. ret = perf_pmu_register(&pmu->pmu, name, -1);
  698. if (ret)
  699. goto ddr_perf_err;
  700. return 0;
  701. ddr_perf_err:
  702. cpuhp_state_remove_instance_nocalls(pmu->cpuhp_state, &pmu->node);
  703. cpuhp_instance_err:
  704. cpuhp_remove_multi_state(pmu->cpuhp_state);
  705. cpuhp_state_err:
  706. format_string_err:
  707. ida_free(&ddr_ida, pmu->id);
  708. dev_warn(&pdev->dev, "i.MX9 DDR Perf PMU failed (%d), disabled\n", ret);
  709. return ret;
  710. }
  711. static void ddr_perf_remove(struct platform_device *pdev)
  712. {
  713. struct ddr_pmu *pmu = platform_get_drvdata(pdev);
  714. cpuhp_state_remove_instance_nocalls(pmu->cpuhp_state, &pmu->node);
  715. cpuhp_remove_multi_state(pmu->cpuhp_state);
  716. perf_pmu_unregister(&pmu->pmu);
  717. ida_free(&ddr_ida, pmu->id);
  718. }
  719. static struct platform_driver imx_ddr_pmu_driver = {
  720. .driver = {
  721. .name = "imx9-ddr-pmu",
  722. .of_match_table = imx_ddr_pmu_dt_ids,
  723. .suppress_bind_attrs = true,
  724. },
  725. .probe = ddr_perf_probe,
  726. .remove = ddr_perf_remove,
  727. };
  728. module_platform_driver(imx_ddr_pmu_driver);
  729. MODULE_AUTHOR("Xu Yang <xu.yang_2@nxp.com>");
  730. MODULE_LICENSE("GPL v2");
  731. MODULE_DESCRIPTION("DDRC PerfMon for i.MX9 SoCs");