core-fsl-emb.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696
  1. // SPDX-License-Identifier: GPL-2.0-or-later
  2. /*
  3. * Performance event support - Freescale Embedded Performance Monitor
  4. *
  5. * Copyright 2008-2009 Paul Mackerras, IBM Corporation.
  6. * Copyright 2010 Freescale Semiconductor, Inc.
  7. */
  8. #include <linux/kernel.h>
  9. #include <linux/sched.h>
  10. #include <linux/perf_event.h>
  11. #include <linux/percpu.h>
  12. #include <linux/hardirq.h>
  13. #include <asm/reg_fsl_emb.h>
  14. #include <asm/pmc.h>
  15. #include <asm/machdep.h>
  16. #include <asm/firmware.h>
  17. #include <asm/ptrace.h>
  18. struct cpu_hw_events {
  19. int n_events;
  20. int disabled;
  21. u8 pmcs_enabled;
  22. struct perf_event *event[MAX_HWEVENTS];
  23. };
  24. static DEFINE_PER_CPU(struct cpu_hw_events, cpu_hw_events);
  25. static struct fsl_emb_pmu *ppmu;
  26. /* Number of perf_events counting hardware events */
  27. static atomic_t num_events;
  28. /* Used to avoid races in calling reserve/release_pmc_hardware */
  29. static DEFINE_MUTEX(pmc_reserve_mutex);
  30. static void perf_event_interrupt(struct pt_regs *regs);
  31. /*
  32. * Read one performance monitor counter (PMC).
  33. */
  34. static unsigned long read_pmc(int idx)
  35. {
  36. unsigned long val;
  37. switch (idx) {
  38. case 0:
  39. val = mfpmr(PMRN_PMC0);
  40. break;
  41. case 1:
  42. val = mfpmr(PMRN_PMC1);
  43. break;
  44. case 2:
  45. val = mfpmr(PMRN_PMC2);
  46. break;
  47. case 3:
  48. val = mfpmr(PMRN_PMC3);
  49. break;
  50. case 4:
  51. val = mfpmr(PMRN_PMC4);
  52. break;
  53. case 5:
  54. val = mfpmr(PMRN_PMC5);
  55. break;
  56. default:
  57. printk(KERN_ERR "oops trying to read PMC%d\n", idx);
  58. val = 0;
  59. }
  60. return val;
  61. }
  62. /*
  63. * Write one PMC.
  64. */
  65. static void write_pmc(int idx, unsigned long val)
  66. {
  67. switch (idx) {
  68. case 0:
  69. mtpmr(PMRN_PMC0, val);
  70. break;
  71. case 1:
  72. mtpmr(PMRN_PMC1, val);
  73. break;
  74. case 2:
  75. mtpmr(PMRN_PMC2, val);
  76. break;
  77. case 3:
  78. mtpmr(PMRN_PMC3, val);
  79. break;
  80. case 4:
  81. mtpmr(PMRN_PMC4, val);
  82. break;
  83. case 5:
  84. mtpmr(PMRN_PMC5, val);
  85. break;
  86. default:
  87. printk(KERN_ERR "oops trying to write PMC%d\n", idx);
  88. }
  89. isync();
  90. }
  91. /*
  92. * Write one local control A register
  93. */
  94. static void write_pmlca(int idx, unsigned long val)
  95. {
  96. switch (idx) {
  97. case 0:
  98. mtpmr(PMRN_PMLCA0, val);
  99. break;
  100. case 1:
  101. mtpmr(PMRN_PMLCA1, val);
  102. break;
  103. case 2:
  104. mtpmr(PMRN_PMLCA2, val);
  105. break;
  106. case 3:
  107. mtpmr(PMRN_PMLCA3, val);
  108. break;
  109. case 4:
  110. mtpmr(PMRN_PMLCA4, val);
  111. break;
  112. case 5:
  113. mtpmr(PMRN_PMLCA5, val);
  114. break;
  115. default:
  116. printk(KERN_ERR "oops trying to write PMLCA%d\n", idx);
  117. }
  118. isync();
  119. }
  120. /*
  121. * Write one local control B register
  122. */
  123. static void write_pmlcb(int idx, unsigned long val)
  124. {
  125. switch (idx) {
  126. case 0:
  127. mtpmr(PMRN_PMLCB0, val);
  128. break;
  129. case 1:
  130. mtpmr(PMRN_PMLCB1, val);
  131. break;
  132. case 2:
  133. mtpmr(PMRN_PMLCB2, val);
  134. break;
  135. case 3:
  136. mtpmr(PMRN_PMLCB3, val);
  137. break;
  138. case 4:
  139. mtpmr(PMRN_PMLCB4, val);
  140. break;
  141. case 5:
  142. mtpmr(PMRN_PMLCB5, val);
  143. break;
  144. default:
  145. printk(KERN_ERR "oops trying to write PMLCB%d\n", idx);
  146. }
  147. isync();
  148. }
  149. static void fsl_emb_pmu_read(struct perf_event *event)
  150. {
  151. s64 val, delta, prev;
  152. if (event->hw.state & PERF_HES_STOPPED)
  153. return;
  154. /*
  155. * Performance monitor interrupts come even when interrupts
  156. * are soft-disabled, as long as interrupts are hard-enabled.
  157. * Therefore we treat them like NMIs.
  158. */
  159. do {
  160. prev = local64_read(&event->hw.prev_count);
  161. barrier();
  162. val = read_pmc(event->hw.idx);
  163. } while (local64_cmpxchg(&event->hw.prev_count, prev, val) != prev);
  164. /* The counters are only 32 bits wide */
  165. delta = (val - prev) & 0xfffffffful;
  166. local64_add(delta, &event->count);
  167. local64_sub(delta, &event->hw.period_left);
  168. }
  169. /*
  170. * Disable all events to prevent PMU interrupts and to allow
  171. * events to be added or removed.
  172. */
  173. static void fsl_emb_pmu_disable(struct pmu *pmu)
  174. {
  175. struct cpu_hw_events *cpuhw;
  176. unsigned long flags;
  177. local_irq_save(flags);
  178. cpuhw = this_cpu_ptr(&cpu_hw_events);
  179. if (!cpuhw->disabled) {
  180. cpuhw->disabled = 1;
  181. /*
  182. * Check if we ever enabled the PMU on this cpu.
  183. */
  184. if (!cpuhw->pmcs_enabled) {
  185. ppc_enable_pmcs();
  186. cpuhw->pmcs_enabled = 1;
  187. }
  188. if (atomic_read(&num_events)) {
  189. /*
  190. * Set the 'freeze all counters' bit, and disable
  191. * interrupts. The barrier is to make sure the
  192. * mtpmr has been executed and the PMU has frozen
  193. * the events before we return.
  194. */
  195. mtpmr(PMRN_PMGC0, PMGC0_FAC);
  196. isync();
  197. }
  198. }
  199. local_irq_restore(flags);
  200. }
  201. /*
  202. * Re-enable all events if disable == 0.
  203. * If we were previously disabled and events were added, then
  204. * put the new config on the PMU.
  205. */
  206. static void fsl_emb_pmu_enable(struct pmu *pmu)
  207. {
  208. struct cpu_hw_events *cpuhw;
  209. unsigned long flags;
  210. local_irq_save(flags);
  211. cpuhw = this_cpu_ptr(&cpu_hw_events);
  212. if (!cpuhw->disabled)
  213. goto out;
  214. cpuhw->disabled = 0;
  215. ppc_set_pmu_inuse(cpuhw->n_events != 0);
  216. if (cpuhw->n_events > 0) {
  217. mtpmr(PMRN_PMGC0, PMGC0_PMIE | PMGC0_FCECE);
  218. isync();
  219. }
  220. out:
  221. local_irq_restore(flags);
  222. }
  223. static int collect_events(struct perf_event *group, int max_count,
  224. struct perf_event *ctrs[])
  225. {
  226. int n = 0;
  227. struct perf_event *event;
  228. if (!is_software_event(group)) {
  229. if (n >= max_count)
  230. return -1;
  231. ctrs[n] = group;
  232. n++;
  233. }
  234. for_each_sibling_event(event, group) {
  235. if (!is_software_event(event) &&
  236. event->state != PERF_EVENT_STATE_OFF) {
  237. if (n >= max_count)
  238. return -1;
  239. ctrs[n] = event;
  240. n++;
  241. }
  242. }
  243. return n;
  244. }
  245. /* context locked on entry */
  246. static int fsl_emb_pmu_add(struct perf_event *event, int flags)
  247. {
  248. struct cpu_hw_events *cpuhw;
  249. int ret = -EAGAIN;
  250. int num_counters = ppmu->n_counter;
  251. u64 val;
  252. int i;
  253. perf_pmu_disable(event->pmu);
  254. cpuhw = &get_cpu_var(cpu_hw_events);
  255. if (event->hw.config & FSL_EMB_EVENT_RESTRICTED)
  256. num_counters = ppmu->n_restricted;
  257. /*
  258. * Allocate counters from top-down, so that restricted-capable
  259. * counters are kept free as long as possible.
  260. */
  261. for (i = num_counters - 1; i >= 0; i--) {
  262. if (cpuhw->event[i])
  263. continue;
  264. break;
  265. }
  266. if (i < 0)
  267. goto out;
  268. event->hw.idx = i;
  269. cpuhw->event[i] = event;
  270. ++cpuhw->n_events;
  271. val = 0;
  272. if (event->hw.sample_period) {
  273. s64 left = local64_read(&event->hw.period_left);
  274. if (left < 0x80000000L)
  275. val = 0x80000000L - left;
  276. }
  277. local64_set(&event->hw.prev_count, val);
  278. if (unlikely(!(flags & PERF_EF_START))) {
  279. event->hw.state = PERF_HES_STOPPED | PERF_HES_UPTODATE;
  280. val = 0;
  281. } else {
  282. event->hw.state &= ~(PERF_HES_STOPPED | PERF_HES_UPTODATE);
  283. }
  284. write_pmc(i, val);
  285. perf_event_update_userpage(event);
  286. write_pmlcb(i, event->hw.config >> 32);
  287. write_pmlca(i, event->hw.config_base);
  288. ret = 0;
  289. out:
  290. put_cpu_var(cpu_hw_events);
  291. perf_pmu_enable(event->pmu);
  292. return ret;
  293. }
  294. /* context locked on entry */
  295. static void fsl_emb_pmu_del(struct perf_event *event, int flags)
  296. {
  297. struct cpu_hw_events *cpuhw;
  298. int i = event->hw.idx;
  299. perf_pmu_disable(event->pmu);
  300. if (i < 0)
  301. goto out;
  302. fsl_emb_pmu_read(event);
  303. cpuhw = &get_cpu_var(cpu_hw_events);
  304. WARN_ON(event != cpuhw->event[event->hw.idx]);
  305. write_pmlca(i, 0);
  306. write_pmlcb(i, 0);
  307. write_pmc(i, 0);
  308. cpuhw->event[i] = NULL;
  309. event->hw.idx = -1;
  310. /*
  311. * TODO: if at least one restricted event exists, and we
  312. * just freed up a non-restricted-capable counter, and
  313. * there is a restricted-capable counter occupied by
  314. * a non-restricted event, migrate that event to the
  315. * vacated counter.
  316. */
  317. cpuhw->n_events--;
  318. out:
  319. perf_pmu_enable(event->pmu);
  320. put_cpu_var(cpu_hw_events);
  321. }
  322. static void fsl_emb_pmu_start(struct perf_event *event, int ef_flags)
  323. {
  324. unsigned long flags;
  325. unsigned long val;
  326. s64 left;
  327. if (event->hw.idx < 0 || !event->hw.sample_period)
  328. return;
  329. if (!(event->hw.state & PERF_HES_STOPPED))
  330. return;
  331. if (ef_flags & PERF_EF_RELOAD)
  332. WARN_ON_ONCE(!(event->hw.state & PERF_HES_UPTODATE));
  333. local_irq_save(flags);
  334. perf_pmu_disable(event->pmu);
  335. event->hw.state = 0;
  336. left = local64_read(&event->hw.period_left);
  337. val = 0;
  338. if (left < 0x80000000L)
  339. val = 0x80000000L - left;
  340. write_pmc(event->hw.idx, val);
  341. perf_event_update_userpage(event);
  342. perf_pmu_enable(event->pmu);
  343. local_irq_restore(flags);
  344. }
  345. static void fsl_emb_pmu_stop(struct perf_event *event, int ef_flags)
  346. {
  347. unsigned long flags;
  348. if (event->hw.idx < 0 || !event->hw.sample_period)
  349. return;
  350. if (event->hw.state & PERF_HES_STOPPED)
  351. return;
  352. local_irq_save(flags);
  353. perf_pmu_disable(event->pmu);
  354. fsl_emb_pmu_read(event);
  355. event->hw.state |= PERF_HES_STOPPED | PERF_HES_UPTODATE;
  356. write_pmc(event->hw.idx, 0);
  357. perf_event_update_userpage(event);
  358. perf_pmu_enable(event->pmu);
  359. local_irq_restore(flags);
  360. }
  361. /*
  362. * Release the PMU if this is the last perf_event.
  363. */
  364. static void hw_perf_event_destroy(struct perf_event *event)
  365. {
  366. if (!atomic_add_unless(&num_events, -1, 1)) {
  367. mutex_lock(&pmc_reserve_mutex);
  368. if (atomic_dec_return(&num_events) == 0)
  369. release_pmc_hardware();
  370. mutex_unlock(&pmc_reserve_mutex);
  371. }
  372. }
  373. /*
  374. * Translate a generic cache event_id config to a raw event_id code.
  375. */
  376. static int hw_perf_cache_event(u64 config, u64 *eventp)
  377. {
  378. unsigned long type, op, result;
  379. int ev;
  380. if (!ppmu->cache_events)
  381. return -EINVAL;
  382. /* unpack config */
  383. type = config & 0xff;
  384. op = (config >> 8) & 0xff;
  385. result = (config >> 16) & 0xff;
  386. if (type >= PERF_COUNT_HW_CACHE_MAX ||
  387. op >= PERF_COUNT_HW_CACHE_OP_MAX ||
  388. result >= PERF_COUNT_HW_CACHE_RESULT_MAX)
  389. return -EINVAL;
  390. ev = (*ppmu->cache_events)[type][op][result];
  391. if (ev == 0)
  392. return -EOPNOTSUPP;
  393. if (ev == -1)
  394. return -EINVAL;
  395. *eventp = ev;
  396. return 0;
  397. }
  398. static int fsl_emb_pmu_event_init(struct perf_event *event)
  399. {
  400. u64 ev;
  401. struct perf_event *events[MAX_HWEVENTS];
  402. int n;
  403. int err;
  404. int num_restricted;
  405. int i;
  406. if (ppmu->n_counter > MAX_HWEVENTS) {
  407. WARN(1, "No. of perf counters (%d) is higher than max array size(%d)\n",
  408. ppmu->n_counter, MAX_HWEVENTS);
  409. ppmu->n_counter = MAX_HWEVENTS;
  410. }
  411. switch (event->attr.type) {
  412. case PERF_TYPE_HARDWARE:
  413. ev = event->attr.config;
  414. if (ev >= ppmu->n_generic || ppmu->generic_events[ev] == 0)
  415. return -EOPNOTSUPP;
  416. ev = ppmu->generic_events[ev];
  417. break;
  418. case PERF_TYPE_HW_CACHE:
  419. err = hw_perf_cache_event(event->attr.config, &ev);
  420. if (err)
  421. return err;
  422. break;
  423. case PERF_TYPE_RAW:
  424. ev = event->attr.config;
  425. break;
  426. default:
  427. return -ENOENT;
  428. }
  429. event->hw.config = ppmu->xlate_event(ev);
  430. if (!(event->hw.config & FSL_EMB_EVENT_VALID))
  431. return -EINVAL;
  432. /*
  433. * If this is in a group, check if it can go on with all the
  434. * other hardware events in the group. We assume the event
  435. * hasn't been linked into its leader's sibling list at this point.
  436. */
  437. n = 0;
  438. if (event->group_leader != event) {
  439. n = collect_events(event->group_leader,
  440. ppmu->n_counter - 1, events);
  441. if (n < 0)
  442. return -EINVAL;
  443. }
  444. if (event->hw.config & FSL_EMB_EVENT_RESTRICTED) {
  445. num_restricted = 0;
  446. for (i = 0; i < n; i++) {
  447. if (events[i]->hw.config & FSL_EMB_EVENT_RESTRICTED)
  448. num_restricted++;
  449. }
  450. if (num_restricted >= ppmu->n_restricted)
  451. return -EINVAL;
  452. }
  453. event->hw.idx = -1;
  454. event->hw.config_base = PMLCA_CE | PMLCA_FCM1 |
  455. (u32)((ev << 16) & PMLCA_EVENT_MASK);
  456. if (event->attr.exclude_user)
  457. event->hw.config_base |= PMLCA_FCU;
  458. if (event->attr.exclude_kernel)
  459. event->hw.config_base |= PMLCA_FCS;
  460. if (event->attr.exclude_idle)
  461. return -ENOTSUPP;
  462. event->hw.last_period = event->hw.sample_period;
  463. local64_set(&event->hw.period_left, event->hw.last_period);
  464. /*
  465. * See if we need to reserve the PMU.
  466. * If no events are currently in use, then we have to take a
  467. * mutex to ensure that we don't race with another task doing
  468. * reserve_pmc_hardware or release_pmc_hardware.
  469. */
  470. err = 0;
  471. if (!atomic_inc_not_zero(&num_events)) {
  472. mutex_lock(&pmc_reserve_mutex);
  473. if (atomic_read(&num_events) == 0 &&
  474. reserve_pmc_hardware(perf_event_interrupt))
  475. err = -EBUSY;
  476. else
  477. atomic_inc(&num_events);
  478. mutex_unlock(&pmc_reserve_mutex);
  479. mtpmr(PMRN_PMGC0, PMGC0_FAC);
  480. isync();
  481. }
  482. event->destroy = hw_perf_event_destroy;
  483. return err;
  484. }
  485. static struct pmu fsl_emb_pmu = {
  486. .pmu_enable = fsl_emb_pmu_enable,
  487. .pmu_disable = fsl_emb_pmu_disable,
  488. .event_init = fsl_emb_pmu_event_init,
  489. .add = fsl_emb_pmu_add,
  490. .del = fsl_emb_pmu_del,
  491. .start = fsl_emb_pmu_start,
  492. .stop = fsl_emb_pmu_stop,
  493. .read = fsl_emb_pmu_read,
  494. };
  495. /*
  496. * A counter has overflowed; update its count and record
  497. * things if requested. Note that interrupts are hard-disabled
  498. * here so there is no possibility of being interrupted.
  499. */
  500. static void record_and_restart(struct perf_event *event, unsigned long val,
  501. struct pt_regs *regs)
  502. {
  503. u64 period = event->hw.sample_period;
  504. const u64 last_period = event->hw.last_period;
  505. s64 prev, delta, left;
  506. int record = 0;
  507. if (event->hw.state & PERF_HES_STOPPED) {
  508. write_pmc(event->hw.idx, 0);
  509. return;
  510. }
  511. /* we don't have to worry about interrupts here */
  512. prev = local64_read(&event->hw.prev_count);
  513. delta = (val - prev) & 0xfffffffful;
  514. local64_add(delta, &event->count);
  515. /*
  516. * See if the total period for this event has expired,
  517. * and update for the next period.
  518. */
  519. val = 0;
  520. left = local64_read(&event->hw.period_left) - delta;
  521. if (period) {
  522. if (left <= 0) {
  523. left += period;
  524. if (left <= 0)
  525. left = period;
  526. record = 1;
  527. event->hw.last_period = event->hw.sample_period;
  528. }
  529. if (left < 0x80000000LL)
  530. val = 0x80000000LL - left;
  531. }
  532. write_pmc(event->hw.idx, val);
  533. local64_set(&event->hw.prev_count, val);
  534. local64_set(&event->hw.period_left, left);
  535. perf_event_update_userpage(event);
  536. /*
  537. * Finally record data if requested.
  538. */
  539. if (record) {
  540. struct perf_sample_data data;
  541. perf_sample_data_init(&data, 0, last_period);
  542. perf_event_overflow(event, &data, regs);
  543. }
  544. }
  545. static void perf_event_interrupt(struct pt_regs *regs)
  546. {
  547. int i;
  548. struct cpu_hw_events *cpuhw = this_cpu_ptr(&cpu_hw_events);
  549. struct perf_event *event;
  550. unsigned long val;
  551. for (i = 0; i < ppmu->n_counter; ++i) {
  552. event = cpuhw->event[i];
  553. val = read_pmc(i);
  554. if ((int)val < 0) {
  555. if (event) {
  556. /* event has overflowed */
  557. record_and_restart(event, val, regs);
  558. } else {
  559. /*
  560. * Disabled counter is negative,
  561. * reset it just in case.
  562. */
  563. write_pmc(i, 0);
  564. }
  565. }
  566. }
  567. /* PMM will keep counters frozen until we return from the interrupt. */
  568. mtmsr(mfmsr() | MSR_PMM);
  569. mtpmr(PMRN_PMGC0, PMGC0_PMIE | PMGC0_FCECE);
  570. isync();
  571. }
  572. static int fsl_emb_pmu_prepare_cpu(unsigned int cpu)
  573. {
  574. struct cpu_hw_events *cpuhw = &per_cpu(cpu_hw_events, cpu);
  575. memset(cpuhw, 0, sizeof(*cpuhw));
  576. return 0;
  577. }
  578. int register_fsl_emb_pmu(struct fsl_emb_pmu *pmu)
  579. {
  580. if (ppmu)
  581. return -EBUSY; /* something's already registered */
  582. ppmu = pmu;
  583. pr_info("%s performance monitor hardware support registered\n",
  584. pmu->name);
  585. perf_pmu_register(&fsl_emb_pmu, "cpu", PERF_TYPE_RAW);
  586. cpuhp_setup_state(CPUHP_PERF_POWER, "perf/powerpc:prepare",
  587. fsl_emb_pmu_prepare_cpu, NULL);
  588. return 0;
  589. }