tegra186-cpufreq.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (c) 2017, NVIDIA CORPORATION. All rights reserved
  4. */
  5. #include <linux/cpufreq.h>
  6. #include <linux/dma-mapping.h>
  7. #include <linux/module.h>
  8. #include <linux/of.h>
  9. #include <linux/platform_device.h>
  10. #include <linux/units.h>
  11. #include <soc/tegra/bpmp.h>
  12. #include <soc/tegra/bpmp-abi.h>
  13. #define TEGRA186_NUM_CLUSTERS 2
  14. #define EDVD_OFFSET_A57(core) ((SZ_64K * 6) + (0x20 + (core) * 0x4))
  15. #define EDVD_OFFSET_DENVER(core) ((SZ_64K * 7) + (0x20 + (core) * 0x4))
  16. #define EDVD_CORE_VOLT_FREQ_F_SHIFT 0
  17. #define EDVD_CORE_VOLT_FREQ_F_MASK 0xffff
  18. #define EDVD_CORE_VOLT_FREQ_V_SHIFT 16
  19. struct tegra186_cpufreq_cpu {
  20. unsigned int bpmp_cluster_id;
  21. unsigned int edvd_offset;
  22. };
  23. static const struct tegra186_cpufreq_cpu tegra186_cpus[] = {
  24. /* CPU0 - A57 Cluster */
  25. {
  26. .bpmp_cluster_id = 1,
  27. .edvd_offset = EDVD_OFFSET_A57(0)
  28. },
  29. /* CPU1 - Denver Cluster */
  30. {
  31. .bpmp_cluster_id = 0,
  32. .edvd_offset = EDVD_OFFSET_DENVER(0)
  33. },
  34. /* CPU2 - Denver Cluster */
  35. {
  36. .bpmp_cluster_id = 0,
  37. .edvd_offset = EDVD_OFFSET_DENVER(1)
  38. },
  39. /* CPU3 - A57 Cluster */
  40. {
  41. .bpmp_cluster_id = 1,
  42. .edvd_offset = EDVD_OFFSET_A57(1)
  43. },
  44. /* CPU4 - A57 Cluster */
  45. {
  46. .bpmp_cluster_id = 1,
  47. .edvd_offset = EDVD_OFFSET_A57(2)
  48. },
  49. /* CPU5 - A57 Cluster */
  50. {
  51. .bpmp_cluster_id = 1,
  52. .edvd_offset = EDVD_OFFSET_A57(3)
  53. },
  54. };
  55. struct tegra186_cpufreq_cluster {
  56. struct cpufreq_frequency_table *bpmp_lut;
  57. u32 ref_clk_khz;
  58. u32 div;
  59. };
  60. struct tegra186_cpufreq_data {
  61. void __iomem *regs;
  62. const struct tegra186_cpufreq_cpu *cpus;
  63. bool icc_dram_bw_scaling;
  64. struct tegra186_cpufreq_cluster clusters[];
  65. };
  66. static int tegra_cpufreq_set_bw(struct cpufreq_policy *policy, unsigned long freq_khz)
  67. {
  68. struct tegra186_cpufreq_data *data = cpufreq_get_driver_data();
  69. struct device *dev;
  70. int ret;
  71. dev = get_cpu_device(policy->cpu);
  72. if (!dev)
  73. return -ENODEV;
  74. struct dev_pm_opp *opp __free(put_opp) =
  75. dev_pm_opp_find_freq_exact(dev, freq_khz * HZ_PER_KHZ, true);
  76. if (IS_ERR(opp))
  77. return PTR_ERR(opp);
  78. ret = dev_pm_opp_set_opp(dev, opp);
  79. if (ret)
  80. data->icc_dram_bw_scaling = false;
  81. return ret;
  82. }
  83. static int tegra_cpufreq_init_cpufreq_table(struct cpufreq_policy *policy,
  84. struct cpufreq_frequency_table *bpmp_lut,
  85. struct cpufreq_frequency_table **opp_table)
  86. {
  87. struct tegra186_cpufreq_data *data = cpufreq_get_driver_data();
  88. struct cpufreq_frequency_table *freq_table = NULL;
  89. struct cpufreq_frequency_table *pos;
  90. struct device *cpu_dev;
  91. unsigned long rate;
  92. int ret, max_opps;
  93. int j = 0;
  94. cpu_dev = get_cpu_device(policy->cpu);
  95. if (!cpu_dev) {
  96. pr_err("%s: failed to get cpu%d device\n", __func__, policy->cpu);
  97. return -ENODEV;
  98. }
  99. /* Initialize OPP table mentioned in operating-points-v2 property in DT */
  100. ret = dev_pm_opp_of_add_table_indexed(cpu_dev, 0);
  101. if (ret) {
  102. dev_err(cpu_dev, "Invalid or empty opp table in device tree\n");
  103. data->icc_dram_bw_scaling = false;
  104. return ret;
  105. }
  106. max_opps = dev_pm_opp_get_opp_count(cpu_dev);
  107. if (max_opps <= 0) {
  108. dev_err(cpu_dev, "Failed to add OPPs\n");
  109. return max_opps;
  110. }
  111. /* Disable all opps and cross-validate against LUT later */
  112. for (rate = 0; ; rate++) {
  113. struct dev_pm_opp *opp __free(put_opp) =
  114. dev_pm_opp_find_freq_ceil(cpu_dev, &rate);
  115. if (IS_ERR(opp))
  116. break;
  117. dev_pm_opp_disable(cpu_dev, rate);
  118. }
  119. freq_table = kzalloc_objs(*freq_table, (max_opps + 1));
  120. if (!freq_table)
  121. return -ENOMEM;
  122. /*
  123. * Cross check the frequencies from BPMP-FW LUT against the OPP's present in DT.
  124. * Enable only those DT OPP's which are present in LUT also.
  125. */
  126. cpufreq_for_each_valid_entry(pos, bpmp_lut) {
  127. struct dev_pm_opp *opp __free(put_opp) =
  128. dev_pm_opp_find_freq_exact(cpu_dev, pos->frequency * HZ_PER_KHZ, false);
  129. if (IS_ERR(opp))
  130. continue;
  131. ret = dev_pm_opp_enable(cpu_dev, pos->frequency * HZ_PER_KHZ);
  132. if (ret < 0)
  133. return ret;
  134. freq_table[j].driver_data = pos->driver_data;
  135. freq_table[j].frequency = pos->frequency;
  136. j++;
  137. }
  138. freq_table[j].driver_data = pos->driver_data;
  139. freq_table[j].frequency = CPUFREQ_TABLE_END;
  140. *opp_table = &freq_table[0];
  141. dev_pm_opp_set_sharing_cpus(cpu_dev, policy->cpus);
  142. /* Prime interconnect data */
  143. tegra_cpufreq_set_bw(policy, freq_table[j - 1].frequency);
  144. return ret;
  145. }
  146. static int tegra186_cpufreq_init(struct cpufreq_policy *policy)
  147. {
  148. struct tegra186_cpufreq_data *data = cpufreq_get_driver_data();
  149. unsigned int cluster = data->cpus[policy->cpu].bpmp_cluster_id;
  150. struct cpufreq_frequency_table *freq_table;
  151. struct cpufreq_frequency_table *bpmp_lut;
  152. u32 cpu;
  153. int ret;
  154. policy->cpuinfo.transition_latency = 300 * 1000;
  155. policy->driver_data = NULL;
  156. /* set same policy for all cpus in a cluster */
  157. for (cpu = 0; cpu < ARRAY_SIZE(tegra186_cpus); cpu++) {
  158. if (data->cpus[cpu].bpmp_cluster_id == cluster)
  159. cpumask_set_cpu(cpu, policy->cpus);
  160. }
  161. bpmp_lut = data->clusters[cluster].bpmp_lut;
  162. if (data->icc_dram_bw_scaling) {
  163. ret = tegra_cpufreq_init_cpufreq_table(policy, bpmp_lut, &freq_table);
  164. if (!ret) {
  165. policy->freq_table = freq_table;
  166. return 0;
  167. }
  168. }
  169. data->icc_dram_bw_scaling = false;
  170. policy->freq_table = bpmp_lut;
  171. pr_info("OPP tables missing from DT, EMC frequency scaling disabled\n");
  172. return 0;
  173. }
  174. static int tegra186_cpufreq_set_target(struct cpufreq_policy *policy,
  175. unsigned int index)
  176. {
  177. struct tegra186_cpufreq_data *data = cpufreq_get_driver_data();
  178. struct cpufreq_frequency_table *tbl = policy->freq_table + index;
  179. unsigned int edvd_offset;
  180. u32 edvd_val = tbl->driver_data;
  181. u32 cpu;
  182. for_each_cpu(cpu, policy->cpus) {
  183. edvd_offset = data->cpus[cpu].edvd_offset;
  184. writel(edvd_val, data->regs + edvd_offset);
  185. }
  186. if (data->icc_dram_bw_scaling)
  187. tegra_cpufreq_set_bw(policy, tbl->frequency);
  188. return 0;
  189. }
  190. static unsigned int tegra186_cpufreq_get(unsigned int cpu)
  191. {
  192. struct cpufreq_policy *policy __free(put_cpufreq_policy) = cpufreq_cpu_get(cpu);
  193. struct tegra186_cpufreq_data *data = cpufreq_get_driver_data();
  194. struct tegra186_cpufreq_cluster *cluster;
  195. unsigned int edvd_offset, cluster_id;
  196. u32 ndiv;
  197. if (!policy)
  198. return 0;
  199. edvd_offset = data->cpus[policy->cpu].edvd_offset;
  200. ndiv = readl(data->regs + edvd_offset) & EDVD_CORE_VOLT_FREQ_F_MASK;
  201. cluster_id = data->cpus[policy->cpu].bpmp_cluster_id;
  202. cluster = &data->clusters[cluster_id];
  203. return (cluster->ref_clk_khz * ndiv) / cluster->div;
  204. }
  205. static struct cpufreq_driver tegra186_cpufreq_driver = {
  206. .name = "tegra186",
  207. .flags = CPUFREQ_HAVE_GOVERNOR_PER_POLICY |
  208. CPUFREQ_NEED_INITIAL_FREQ_CHECK,
  209. .get = tegra186_cpufreq_get,
  210. .verify = cpufreq_generic_frequency_table_verify,
  211. .target_index = tegra186_cpufreq_set_target,
  212. .init = tegra186_cpufreq_init,
  213. };
  214. static struct cpufreq_frequency_table *tegra_cpufreq_bpmp_read_lut(
  215. struct platform_device *pdev, struct tegra_bpmp *bpmp,
  216. struct tegra186_cpufreq_cluster *cluster, unsigned int cluster_id,
  217. int *num_rates)
  218. {
  219. struct cpufreq_frequency_table *table;
  220. struct mrq_cpu_vhint_request req;
  221. struct tegra_bpmp_message msg;
  222. struct cpu_vhint_data *data;
  223. int err, i, j;
  224. dma_addr_t phys;
  225. void *virt;
  226. virt = dma_alloc_coherent(bpmp->dev, sizeof(*data), &phys,
  227. GFP_KERNEL);
  228. if (!virt)
  229. return ERR_PTR(-ENOMEM);
  230. data = (struct cpu_vhint_data *)virt;
  231. memset(&req, 0, sizeof(req));
  232. req.addr = phys;
  233. req.cluster_id = cluster_id;
  234. memset(&msg, 0, sizeof(msg));
  235. msg.mrq = MRQ_CPU_VHINT;
  236. msg.tx.data = &req;
  237. msg.tx.size = sizeof(req);
  238. err = tegra_bpmp_transfer(bpmp, &msg);
  239. if (err) {
  240. table = ERR_PTR(err);
  241. goto free;
  242. }
  243. if (msg.rx.ret) {
  244. table = ERR_PTR(-EINVAL);
  245. goto free;
  246. }
  247. *num_rates = 0;
  248. for (i = data->vfloor; i <= data->vceil; i++) {
  249. u16 ndiv = data->ndiv[i];
  250. if (ndiv < data->ndiv_min || ndiv > data->ndiv_max)
  251. continue;
  252. /* Only store lowest voltage index for each rate */
  253. if (i > 0 && ndiv == data->ndiv[i - 1])
  254. continue;
  255. (*num_rates)++;
  256. }
  257. table = devm_kcalloc(&pdev->dev, *num_rates + 1, sizeof(*table),
  258. GFP_KERNEL);
  259. if (!table) {
  260. table = ERR_PTR(-ENOMEM);
  261. goto free;
  262. }
  263. cluster->ref_clk_khz = data->ref_clk_hz / 1000;
  264. cluster->div = data->pdiv * data->mdiv;
  265. for (i = data->vfloor, j = 0; i <= data->vceil; i++) {
  266. struct cpufreq_frequency_table *point;
  267. u16 ndiv = data->ndiv[i];
  268. u32 edvd_val = 0;
  269. if (ndiv < data->ndiv_min || ndiv > data->ndiv_max)
  270. continue;
  271. /* Only store lowest voltage index for each rate */
  272. if (i > 0 && ndiv == data->ndiv[i - 1])
  273. continue;
  274. edvd_val |= i << EDVD_CORE_VOLT_FREQ_V_SHIFT;
  275. edvd_val |= ndiv << EDVD_CORE_VOLT_FREQ_F_SHIFT;
  276. point = &table[j++];
  277. point->driver_data = edvd_val;
  278. point->frequency = (cluster->ref_clk_khz * ndiv) / cluster->div;
  279. }
  280. table[j].frequency = CPUFREQ_TABLE_END;
  281. free:
  282. dma_free_coherent(bpmp->dev, sizeof(*data), virt, phys);
  283. return table;
  284. }
  285. static int tegra186_cpufreq_probe(struct platform_device *pdev)
  286. {
  287. struct tegra186_cpufreq_data *data;
  288. struct tegra_bpmp *bpmp;
  289. struct device *cpu_dev;
  290. unsigned int i = 0, err, edvd_offset;
  291. int num_rates = 0;
  292. u32 edvd_val, cpu;
  293. data = devm_kzalloc(&pdev->dev,
  294. struct_size(data, clusters, TEGRA186_NUM_CLUSTERS),
  295. GFP_KERNEL);
  296. if (!data)
  297. return -ENOMEM;
  298. data->cpus = tegra186_cpus;
  299. bpmp = tegra_bpmp_get(&pdev->dev);
  300. if (IS_ERR(bpmp))
  301. return PTR_ERR(bpmp);
  302. data->regs = devm_platform_ioremap_resource(pdev, 0);
  303. if (IS_ERR(data->regs)) {
  304. err = PTR_ERR(data->regs);
  305. goto put_bpmp;
  306. }
  307. for (i = 0; i < TEGRA186_NUM_CLUSTERS; i++) {
  308. struct tegra186_cpufreq_cluster *cluster = &data->clusters[i];
  309. cluster->bpmp_lut = tegra_cpufreq_bpmp_read_lut(pdev, bpmp, cluster, i, &num_rates);
  310. if (IS_ERR(cluster->bpmp_lut)) {
  311. err = PTR_ERR(cluster->bpmp_lut);
  312. goto put_bpmp;
  313. } else if (!num_rates) {
  314. err = -EINVAL;
  315. goto put_bpmp;
  316. }
  317. for (cpu = 0; cpu < ARRAY_SIZE(tegra186_cpus); cpu++) {
  318. if (data->cpus[cpu].bpmp_cluster_id == i) {
  319. edvd_val = cluster->bpmp_lut[num_rates - 1].driver_data;
  320. edvd_offset = data->cpus[cpu].edvd_offset;
  321. writel(edvd_val, data->regs + edvd_offset);
  322. }
  323. }
  324. }
  325. tegra186_cpufreq_driver.driver_data = data;
  326. /* Check for optional OPPv2 and interconnect paths on CPU0 to enable ICC scaling */
  327. cpu_dev = get_cpu_device(0);
  328. if (!cpu_dev) {
  329. err = -EPROBE_DEFER;
  330. goto put_bpmp;
  331. }
  332. if (dev_pm_opp_of_get_opp_desc_node(cpu_dev)) {
  333. err = dev_pm_opp_of_find_icc_paths(cpu_dev, NULL);
  334. if (!err)
  335. data->icc_dram_bw_scaling = true;
  336. }
  337. err = cpufreq_register_driver(&tegra186_cpufreq_driver);
  338. put_bpmp:
  339. tegra_bpmp_put(bpmp);
  340. return err;
  341. }
  342. static void tegra186_cpufreq_remove(struct platform_device *pdev)
  343. {
  344. cpufreq_unregister_driver(&tegra186_cpufreq_driver);
  345. }
  346. static const struct of_device_id tegra186_cpufreq_of_match[] = {
  347. { .compatible = "nvidia,tegra186-ccplex-cluster", },
  348. { }
  349. };
  350. MODULE_DEVICE_TABLE(of, tegra186_cpufreq_of_match);
  351. static struct platform_driver tegra186_cpufreq_platform_driver = {
  352. .driver = {
  353. .name = "tegra186-cpufreq",
  354. .of_match_table = tegra186_cpufreq_of_match,
  355. },
  356. .probe = tegra186_cpufreq_probe,
  357. .remove = tegra186_cpufreq_remove,
  358. };
  359. module_platform_driver(tegra186_cpufreq_platform_driver);
  360. MODULE_AUTHOR("Mikko Perttunen <mperttunen@nvidia.com>");
  361. MODULE_DESCRIPTION("NVIDIA Tegra186 cpufreq driver");
  362. MODULE_LICENSE("GPL v2");