selftest_slpc.c 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557
  1. // SPDX-License-Identifier: MIT
  2. /*
  3. * Copyright © 2021 Intel Corporation
  4. */
  5. #define NUM_STEPS 5
  6. #define H2G_DELAY 50000
  7. #define delay_for_h2g() usleep_range(H2G_DELAY, H2G_DELAY + 10000)
  8. #define FREQUENCY_REQ_UNIT DIV_ROUND_CLOSEST(GT_FREQUENCY_MULTIPLIER, \
  9. GEN9_FREQ_SCALER)
  10. enum test_type {
  11. VARY_MIN,
  12. VARY_MAX,
  13. MAX_GRANTED,
  14. SLPC_POWER,
  15. TILE_INTERACTION,
  16. };
  17. struct slpc_thread {
  18. struct kthread_worker *worker;
  19. struct kthread_work work;
  20. struct intel_gt *gt;
  21. int result;
  22. };
  23. static int slpc_set_min_freq(struct intel_guc_slpc *slpc, u32 freq)
  24. {
  25. int ret;
  26. ret = intel_guc_slpc_set_min_freq(slpc, freq);
  27. if (ret)
  28. pr_err("Could not set min frequency to [%u]\n", freq);
  29. else /* Delay to ensure h2g completes */
  30. delay_for_h2g();
  31. return ret;
  32. }
  33. static int slpc_set_max_freq(struct intel_guc_slpc *slpc, u32 freq)
  34. {
  35. int ret;
  36. ret = intel_guc_slpc_set_max_freq(slpc, freq);
  37. if (ret)
  38. pr_err("Could not set maximum frequency [%u]\n",
  39. freq);
  40. else /* Delay to ensure h2g completes */
  41. delay_for_h2g();
  42. return ret;
  43. }
  44. static int slpc_set_freq(struct intel_gt *gt, u32 freq)
  45. {
  46. int err;
  47. struct intel_guc_slpc *slpc = &gt_to_guc(gt)->slpc;
  48. err = slpc_set_max_freq(slpc, freq);
  49. if (err) {
  50. pr_err("Unable to update max freq");
  51. return err;
  52. }
  53. err = slpc_set_min_freq(slpc, freq);
  54. if (err) {
  55. pr_err("Unable to update min freq");
  56. return err;
  57. }
  58. return err;
  59. }
  60. static int slpc_restore_freq(struct intel_guc_slpc *slpc, u32 min, u32 max)
  61. {
  62. int err;
  63. err = slpc_set_max_freq(slpc, max);
  64. if (err) {
  65. pr_err("Unable to restore max freq");
  66. return err;
  67. }
  68. err = slpc_set_min_freq(slpc, min);
  69. if (err) {
  70. pr_err("Unable to restore min freq");
  71. return err;
  72. }
  73. err = intel_guc_slpc_set_ignore_eff_freq(slpc, false);
  74. if (err) {
  75. pr_err("Unable to restore efficient freq");
  76. return err;
  77. }
  78. return 0;
  79. }
  80. static u64 slpc_measure_power(struct intel_rps *rps, int *freq)
  81. {
  82. u64 x[5];
  83. int i;
  84. for (i = 0; i < 5; i++)
  85. x[i] = __measure_power(5);
  86. *freq = (*freq + intel_rps_read_actual_frequency(rps)) / 2;
  87. /* A simple triangle filter for better result stability */
  88. sort(x, 5, sizeof(*x), cmp_u64, NULL);
  89. return div_u64(x[1] + 2 * x[2] + x[3], 4);
  90. }
  91. static u64 measure_power_at_freq(struct intel_gt *gt, int *freq, u64 *power)
  92. {
  93. int err = 0;
  94. err = slpc_set_freq(gt, *freq);
  95. if (err)
  96. return err;
  97. *freq = intel_rps_read_actual_frequency(&gt->rps);
  98. *power = slpc_measure_power(&gt->rps, freq);
  99. return err;
  100. }
  101. static int vary_max_freq(struct intel_guc_slpc *slpc, struct intel_rps *rps,
  102. u32 *max_act_freq)
  103. {
  104. u32 step, max_freq, req_freq;
  105. u32 act_freq;
  106. int err = 0;
  107. /* Go from max to min in 5 steps */
  108. step = (slpc->rp0_freq - slpc->min_freq) / NUM_STEPS;
  109. *max_act_freq = slpc->min_freq;
  110. for (max_freq = slpc->rp0_freq; max_freq > slpc->min_freq;
  111. max_freq -= step) {
  112. err = slpc_set_max_freq(slpc, max_freq);
  113. if (err)
  114. break;
  115. req_freq = intel_rps_read_punit_req_frequency(rps);
  116. /* GuC requests freq in multiples of 50/3 MHz */
  117. if (req_freq > (max_freq + FREQUENCY_REQ_UNIT)) {
  118. pr_err("SWReq is %d, should be at most %d\n", req_freq,
  119. max_freq + FREQUENCY_REQ_UNIT);
  120. err = -EINVAL;
  121. }
  122. act_freq = intel_rps_read_actual_frequency(rps);
  123. if (act_freq > *max_act_freq)
  124. *max_act_freq = act_freq;
  125. if (err)
  126. break;
  127. }
  128. return err;
  129. }
  130. static int vary_min_freq(struct intel_guc_slpc *slpc, struct intel_rps *rps,
  131. u32 *max_act_freq)
  132. {
  133. u32 step, min_freq, req_freq;
  134. u32 act_freq;
  135. int err = 0;
  136. /* Go from min to max in 5 steps */
  137. step = (slpc->rp0_freq - slpc->min_freq) / NUM_STEPS;
  138. *max_act_freq = slpc->min_freq;
  139. for (min_freq = slpc->min_freq; min_freq < slpc->rp0_freq;
  140. min_freq += step) {
  141. err = slpc_set_min_freq(slpc, min_freq);
  142. if (err)
  143. break;
  144. req_freq = intel_rps_read_punit_req_frequency(rps);
  145. /* GuC requests freq in multiples of 50/3 MHz */
  146. if (req_freq < (min_freq - FREQUENCY_REQ_UNIT)) {
  147. pr_err("SWReq is %d, should be at least %d\n", req_freq,
  148. min_freq - FREQUENCY_REQ_UNIT);
  149. err = -EINVAL;
  150. }
  151. act_freq = intel_rps_read_actual_frequency(rps);
  152. if (act_freq > *max_act_freq)
  153. *max_act_freq = act_freq;
  154. if (err)
  155. break;
  156. }
  157. return err;
  158. }
  159. static int slpc_power(struct intel_gt *gt, struct intel_engine_cs *engine)
  160. {
  161. struct intel_guc_slpc *slpc = &gt_to_guc(gt)->slpc;
  162. struct {
  163. u64 power;
  164. int freq;
  165. } min, max;
  166. int err = 0;
  167. /*
  168. * Our fundamental assumption is that running at lower frequency
  169. * actually saves power. Let's see if our RAPL measurement supports
  170. * that theory.
  171. */
  172. if (!librapl_supported(gt->i915))
  173. return 0;
  174. min.freq = slpc->min_freq;
  175. err = measure_power_at_freq(gt, &min.freq, &min.power);
  176. if (err)
  177. return err;
  178. max.freq = slpc->rp0_freq;
  179. err = measure_power_at_freq(gt, &max.freq, &max.power);
  180. if (err)
  181. return err;
  182. pr_info("%s: min:%llumW @ %uMHz, max:%llumW @ %uMHz\n",
  183. engine->name,
  184. min.power, min.freq,
  185. max.power, max.freq);
  186. if (10 * min.freq >= 9 * max.freq) {
  187. pr_notice("Could not control frequency, ran at [%uMHz, %uMhz]\n",
  188. min.freq, max.freq);
  189. }
  190. if (11 * min.power > 10 * max.power) {
  191. pr_err("%s: did not conserve power when setting lower frequency!\n",
  192. engine->name);
  193. err = -EINVAL;
  194. }
  195. /* Restore min/max frequencies */
  196. slpc_set_max_freq(slpc, slpc->rp0_freq);
  197. slpc_set_min_freq(slpc, slpc->min_freq);
  198. return err;
  199. }
  200. static int max_granted_freq(struct intel_guc_slpc *slpc, struct intel_rps *rps, u32 *max_act_freq)
  201. {
  202. struct intel_gt *gt = rps_to_gt(rps);
  203. u32 perf_limit_reasons;
  204. int err = 0;
  205. err = slpc_set_min_freq(slpc, slpc->rp0_freq);
  206. if (err)
  207. return err;
  208. *max_act_freq = intel_rps_read_actual_frequency(rps);
  209. if (*max_act_freq != slpc->rp0_freq) {
  210. /* Check if there was some throttling by pcode */
  211. perf_limit_reasons = intel_uncore_read(gt->uncore,
  212. intel_gt_perf_limit_reasons_reg(gt));
  213. /* If not, this is an error */
  214. if (!(perf_limit_reasons & GT0_PERF_LIMIT_REASONS_MASK)) {
  215. pr_err("Pcode did not grant max freq\n");
  216. err = -EINVAL;
  217. } else {
  218. pr_info("Pcode throttled frequency 0x%x\n", perf_limit_reasons);
  219. }
  220. }
  221. return err;
  222. }
  223. static int run_test(struct intel_gt *gt, int test_type)
  224. {
  225. struct intel_guc_slpc *slpc = &gt_to_guc(gt)->slpc;
  226. struct intel_rps *rps = &gt->rps;
  227. struct intel_engine_cs *engine;
  228. enum intel_engine_id id;
  229. intel_wakeref_t wakeref;
  230. struct igt_spinner spin;
  231. u32 slpc_min_freq, slpc_max_freq;
  232. int err = 0;
  233. if (!intel_uc_uses_guc_slpc(&gt->uc))
  234. return 0;
  235. if (slpc->min_freq == slpc->rp0_freq) {
  236. pr_err("Min/Max are fused to the same value\n");
  237. return -EINVAL;
  238. }
  239. if (igt_spinner_init(&spin, gt))
  240. return -ENOMEM;
  241. if (intel_guc_slpc_get_max_freq(slpc, &slpc_max_freq)) {
  242. pr_err("Could not get SLPC max freq\n");
  243. return -EIO;
  244. }
  245. if (intel_guc_slpc_get_min_freq(slpc, &slpc_min_freq)) {
  246. pr_err("Could not get SLPC min freq\n");
  247. return -EIO;
  248. }
  249. /*
  250. * Set min frequency to RPn so that we can test the whole
  251. * range of RPn-RP0.
  252. */
  253. err = slpc_set_min_freq(slpc, slpc->min_freq);
  254. if (err) {
  255. pr_err("Unable to update min freq!");
  256. return err;
  257. }
  258. /*
  259. * Turn off efficient frequency so RPn/RP0 ranges are obeyed.
  260. */
  261. err = intel_guc_slpc_set_ignore_eff_freq(slpc, true);
  262. if (err) {
  263. pr_err("Unable to turn off efficient freq!");
  264. return err;
  265. }
  266. intel_gt_pm_wait_for_idle(gt);
  267. wakeref = intel_gt_pm_get(gt);
  268. for_each_engine(engine, gt, id) {
  269. struct i915_request *rq;
  270. u32 max_act_freq;
  271. if (!intel_engine_can_store_dword(engine))
  272. continue;
  273. st_engine_heartbeat_disable(engine);
  274. rq = igt_spinner_create_request(&spin,
  275. engine->kernel_context,
  276. MI_NOOP);
  277. if (IS_ERR(rq)) {
  278. err = PTR_ERR(rq);
  279. st_engine_heartbeat_enable(engine);
  280. break;
  281. }
  282. i915_request_add(rq);
  283. if (!igt_wait_for_spinner(&spin, rq)) {
  284. pr_err("%s: Spinner did not start\n",
  285. engine->name);
  286. igt_spinner_end(&spin);
  287. st_engine_heartbeat_enable(engine);
  288. intel_gt_set_wedged(engine->gt);
  289. err = -EIO;
  290. break;
  291. }
  292. switch (test_type) {
  293. case VARY_MIN:
  294. err = vary_min_freq(slpc, rps, &max_act_freq);
  295. break;
  296. case VARY_MAX:
  297. err = vary_max_freq(slpc, rps, &max_act_freq);
  298. break;
  299. case MAX_GRANTED:
  300. case TILE_INTERACTION:
  301. /* Media engines have a different RP0 */
  302. if (gt->type != GT_MEDIA && (engine->class == VIDEO_DECODE_CLASS ||
  303. engine->class == VIDEO_ENHANCEMENT_CLASS)) {
  304. igt_spinner_end(&spin);
  305. st_engine_heartbeat_enable(engine);
  306. err = 0;
  307. continue;
  308. }
  309. err = max_granted_freq(slpc, rps, &max_act_freq);
  310. break;
  311. case SLPC_POWER:
  312. err = slpc_power(gt, engine);
  313. break;
  314. }
  315. if (test_type != SLPC_POWER) {
  316. pr_info("Max actual frequency for %s was %d\n",
  317. engine->name, max_act_freq);
  318. /* Actual frequency should rise above min */
  319. if (max_act_freq <= slpc->min_freq) {
  320. pr_err("Actual freq did not rise above min\n");
  321. pr_err("Perf Limit Reasons: 0x%x\n",
  322. intel_uncore_read(gt->uncore,
  323. intel_gt_perf_limit_reasons_reg(gt)));
  324. err = -EINVAL;
  325. }
  326. }
  327. igt_spinner_end(&spin);
  328. st_engine_heartbeat_enable(engine);
  329. if (err)
  330. break;
  331. }
  332. /* Restore min/max/efficient frequencies */
  333. err = slpc_restore_freq(slpc, slpc_min_freq, slpc_max_freq);
  334. if (igt_flush_test(gt->i915))
  335. err = -EIO;
  336. intel_gt_pm_put(gt, wakeref);
  337. igt_spinner_fini(&spin);
  338. intel_gt_pm_wait_for_idle(gt);
  339. return err;
  340. }
  341. static int live_slpc_vary_min(void *arg)
  342. {
  343. struct drm_i915_private *i915 = arg;
  344. struct intel_gt *gt;
  345. unsigned int i;
  346. int ret;
  347. for_each_gt(gt, i915, i) {
  348. ret = run_test(gt, VARY_MIN);
  349. if (ret)
  350. return ret;
  351. }
  352. return ret;
  353. }
  354. static int live_slpc_vary_max(void *arg)
  355. {
  356. struct drm_i915_private *i915 = arg;
  357. struct intel_gt *gt;
  358. unsigned int i;
  359. int ret;
  360. for_each_gt(gt, i915, i) {
  361. ret = run_test(gt, VARY_MAX);
  362. if (ret)
  363. return ret;
  364. }
  365. return ret;
  366. }
  367. /* check if pcode can grant RP0 */
  368. static int live_slpc_max_granted(void *arg)
  369. {
  370. struct drm_i915_private *i915 = arg;
  371. struct intel_gt *gt;
  372. unsigned int i;
  373. int ret;
  374. for_each_gt(gt, i915, i) {
  375. ret = run_test(gt, MAX_GRANTED);
  376. if (ret)
  377. return ret;
  378. }
  379. return ret;
  380. }
  381. static int live_slpc_power(void *arg)
  382. {
  383. struct drm_i915_private *i915 = arg;
  384. struct intel_gt *gt;
  385. unsigned int i;
  386. int ret;
  387. for_each_gt(gt, i915, i) {
  388. ret = run_test(gt, SLPC_POWER);
  389. if (ret)
  390. return ret;
  391. }
  392. return ret;
  393. }
  394. static void slpc_spinner_thread(struct kthread_work *work)
  395. {
  396. struct slpc_thread *thread = container_of(work, typeof(*thread), work);
  397. thread->result = run_test(thread->gt, TILE_INTERACTION);
  398. }
  399. static int live_slpc_tile_interaction(void *arg)
  400. {
  401. struct drm_i915_private *i915 = arg;
  402. struct intel_gt *gt;
  403. struct slpc_thread *threads;
  404. int i = 0, ret = 0;
  405. threads = kzalloc_objs(*threads, I915_MAX_GT);
  406. if (!threads)
  407. return -ENOMEM;
  408. for_each_gt(gt, i915, i) {
  409. threads[i].worker = kthread_run_worker(0, "igt/slpc_parallel:%d", gt->info.id);
  410. if (IS_ERR(threads[i].worker)) {
  411. ret = PTR_ERR(threads[i].worker);
  412. break;
  413. }
  414. threads[i].gt = gt;
  415. kthread_init_work(&threads[i].work, slpc_spinner_thread);
  416. kthread_queue_work(threads[i].worker, &threads[i].work);
  417. }
  418. for_each_gt(gt, i915, i) {
  419. int status;
  420. if (IS_ERR_OR_NULL(threads[i].worker))
  421. continue;
  422. kthread_flush_work(&threads[i].work);
  423. status = READ_ONCE(threads[i].result);
  424. if (status && !ret) {
  425. pr_err("%s GT %d failed ", __func__, gt->info.id);
  426. ret = status;
  427. }
  428. kthread_destroy_worker(threads[i].worker);
  429. }
  430. kfree(threads);
  431. return ret;
  432. }
  433. int intel_slpc_live_selftests(struct drm_i915_private *i915)
  434. {
  435. static const struct i915_subtest tests[] = {
  436. SUBTEST(live_slpc_vary_max),
  437. SUBTEST(live_slpc_vary_min),
  438. SUBTEST(live_slpc_max_granted),
  439. SUBTEST(live_slpc_power),
  440. SUBTEST(live_slpc_tile_interaction),
  441. };
  442. struct intel_gt *gt;
  443. unsigned int i;
  444. for_each_gt(gt, i915, i) {
  445. if (intel_gt_is_wedged(gt))
  446. return 0;
  447. }
  448. return i915_live_subtests(tests, i915);
  449. }