st-dma-fence-chain.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704
  1. // SPDX-License-Identifier: MIT
  2. /*
  3. * Copyright © 2019 Intel Corporation
  4. */
  5. #include <linux/delay.h>
  6. #include <linux/dma-fence.h>
  7. #include <linux/dma-fence-chain.h>
  8. #include <linux/kernel.h>
  9. #include <linux/kthread.h>
  10. #include <linux/mm.h>
  11. #include <linux/sched/signal.h>
  12. #include <linux/slab.h>
  13. #include <linux/spinlock.h>
  14. #include <linux/random.h>
  15. #include "selftest.h"
  16. #define CHAIN_SZ (4 << 10)
  17. static struct kmem_cache *slab_fences;
  18. static inline struct mock_fence {
  19. struct dma_fence base;
  20. spinlock_t lock;
  21. } *to_mock_fence(struct dma_fence *f) {
  22. return container_of(f, struct mock_fence, base);
  23. }
  24. static const char *mock_name(struct dma_fence *f)
  25. {
  26. return "mock";
  27. }
  28. static void mock_fence_release(struct dma_fence *f)
  29. {
  30. kmem_cache_free(slab_fences, to_mock_fence(f));
  31. }
  32. static const struct dma_fence_ops mock_ops = {
  33. .get_driver_name = mock_name,
  34. .get_timeline_name = mock_name,
  35. .release = mock_fence_release,
  36. };
  37. static struct dma_fence *mock_fence(void)
  38. {
  39. struct mock_fence *f;
  40. f = kmem_cache_alloc(slab_fences, GFP_KERNEL);
  41. if (!f)
  42. return NULL;
  43. spin_lock_init(&f->lock);
  44. dma_fence_init(&f->base, &mock_ops, &f->lock, 0, 0);
  45. return &f->base;
  46. }
  47. static struct dma_fence *mock_chain(struct dma_fence *prev,
  48. struct dma_fence *fence,
  49. u64 seqno)
  50. {
  51. struct dma_fence_chain *f;
  52. f = dma_fence_chain_alloc();
  53. if (!f)
  54. return NULL;
  55. dma_fence_chain_init(f, dma_fence_get(prev), dma_fence_get(fence),
  56. seqno);
  57. return &f->base;
  58. }
  59. static int sanitycheck(void *arg)
  60. {
  61. struct dma_fence *f, *chain;
  62. int err = 0;
  63. f = mock_fence();
  64. if (!f)
  65. return -ENOMEM;
  66. chain = mock_chain(NULL, f, 1);
  67. if (chain)
  68. dma_fence_enable_sw_signaling(chain);
  69. else
  70. err = -ENOMEM;
  71. dma_fence_signal(f);
  72. dma_fence_put(f);
  73. dma_fence_put(chain);
  74. return err;
  75. }
  76. struct fence_chains {
  77. unsigned int chain_length;
  78. struct dma_fence **fences;
  79. struct dma_fence **chains;
  80. struct dma_fence *tail;
  81. };
  82. static uint64_t seqno_inc(unsigned int i)
  83. {
  84. return i + 1;
  85. }
  86. static int fence_chains_init(struct fence_chains *fc, unsigned int count,
  87. uint64_t (*seqno_fn)(unsigned int))
  88. {
  89. unsigned int i;
  90. int err = 0;
  91. fc->chains = kvmalloc_objs(*fc->chains, count, GFP_KERNEL | __GFP_ZERO);
  92. if (!fc->chains)
  93. return -ENOMEM;
  94. fc->fences = kvmalloc_objs(*fc->fences, count, GFP_KERNEL | __GFP_ZERO);
  95. if (!fc->fences) {
  96. err = -ENOMEM;
  97. goto err_chains;
  98. }
  99. fc->tail = NULL;
  100. for (i = 0; i < count; i++) {
  101. fc->fences[i] = mock_fence();
  102. if (!fc->fences[i]) {
  103. err = -ENOMEM;
  104. goto unwind;
  105. }
  106. fc->chains[i] = mock_chain(fc->tail,
  107. fc->fences[i],
  108. seqno_fn(i));
  109. if (!fc->chains[i]) {
  110. err = -ENOMEM;
  111. goto unwind;
  112. }
  113. fc->tail = fc->chains[i];
  114. dma_fence_enable_sw_signaling(fc->chains[i]);
  115. }
  116. fc->chain_length = i;
  117. return 0;
  118. unwind:
  119. for (i = 0; i < count; i++) {
  120. dma_fence_put(fc->fences[i]);
  121. dma_fence_put(fc->chains[i]);
  122. }
  123. kvfree(fc->fences);
  124. err_chains:
  125. kvfree(fc->chains);
  126. return err;
  127. }
  128. static void fence_chains_fini(struct fence_chains *fc)
  129. {
  130. unsigned int i;
  131. for (i = 0; i < fc->chain_length; i++) {
  132. dma_fence_signal(fc->fences[i]);
  133. dma_fence_put(fc->fences[i]);
  134. }
  135. kvfree(fc->fences);
  136. for (i = 0; i < fc->chain_length; i++)
  137. dma_fence_put(fc->chains[i]);
  138. kvfree(fc->chains);
  139. }
  140. static int find_seqno(void *arg)
  141. {
  142. struct fence_chains fc;
  143. struct dma_fence *fence;
  144. int err;
  145. int i;
  146. err = fence_chains_init(&fc, 64, seqno_inc);
  147. if (err)
  148. return err;
  149. fence = dma_fence_get(fc.tail);
  150. err = dma_fence_chain_find_seqno(&fence, 0);
  151. dma_fence_put(fence);
  152. if (err) {
  153. pr_err("Reported %d for find_seqno(0)!\n", err);
  154. goto err;
  155. }
  156. for (i = 0; i < fc.chain_length; i++) {
  157. fence = dma_fence_get(fc.tail);
  158. err = dma_fence_chain_find_seqno(&fence, i + 1);
  159. dma_fence_put(fence);
  160. if (err) {
  161. pr_err("Reported %d for find_seqno(%d:%d)!\n",
  162. err, fc.chain_length + 1, i + 1);
  163. goto err;
  164. }
  165. if (fence != fc.chains[i]) {
  166. pr_err("Incorrect fence reported by find_seqno(%d:%d)\n",
  167. fc.chain_length + 1, i + 1);
  168. err = -EINVAL;
  169. goto err;
  170. }
  171. dma_fence_get(fence);
  172. err = dma_fence_chain_find_seqno(&fence, i + 1);
  173. dma_fence_put(fence);
  174. if (err) {
  175. pr_err("Error reported for finding self\n");
  176. goto err;
  177. }
  178. if (fence != fc.chains[i]) {
  179. pr_err("Incorrect fence reported by find self\n");
  180. err = -EINVAL;
  181. goto err;
  182. }
  183. dma_fence_get(fence);
  184. err = dma_fence_chain_find_seqno(&fence, i + 2);
  185. dma_fence_put(fence);
  186. if (!err) {
  187. pr_err("Error not reported for future fence: find_seqno(%d:%d)!\n",
  188. i + 1, i + 2);
  189. err = -EINVAL;
  190. goto err;
  191. }
  192. dma_fence_get(fence);
  193. err = dma_fence_chain_find_seqno(&fence, i);
  194. dma_fence_put(fence);
  195. if (err) {
  196. pr_err("Error reported for previous fence!\n");
  197. goto err;
  198. }
  199. if (i > 0 && fence != fc.chains[i - 1]) {
  200. pr_err("Incorrect fence reported by find_seqno(%d:%d)\n",
  201. i + 1, i);
  202. err = -EINVAL;
  203. goto err;
  204. }
  205. }
  206. err:
  207. fence_chains_fini(&fc);
  208. return err;
  209. }
  210. static int find_signaled(void *arg)
  211. {
  212. struct fence_chains fc;
  213. struct dma_fence *fence;
  214. int err;
  215. err = fence_chains_init(&fc, 2, seqno_inc);
  216. if (err)
  217. return err;
  218. dma_fence_signal(fc.fences[0]);
  219. fence = dma_fence_get(fc.tail);
  220. err = dma_fence_chain_find_seqno(&fence, 1);
  221. dma_fence_put(fence);
  222. if (err) {
  223. pr_err("Reported %d for find_seqno()!\n", err);
  224. goto err;
  225. }
  226. if (fence && fence != fc.chains[0]) {
  227. pr_err("Incorrect chain-fence.seqno:%lld reported for completed seqno:1\n",
  228. fence->seqno);
  229. dma_fence_get(fence);
  230. err = dma_fence_chain_find_seqno(&fence, 1);
  231. dma_fence_put(fence);
  232. if (err)
  233. pr_err("Reported %d for finding self!\n", err);
  234. err = -EINVAL;
  235. }
  236. err:
  237. fence_chains_fini(&fc);
  238. return err;
  239. }
  240. static int find_out_of_order(void *arg)
  241. {
  242. struct fence_chains fc;
  243. struct dma_fence *fence;
  244. int err;
  245. err = fence_chains_init(&fc, 3, seqno_inc);
  246. if (err)
  247. return err;
  248. dma_fence_signal(fc.fences[1]);
  249. fence = dma_fence_get(fc.tail);
  250. err = dma_fence_chain_find_seqno(&fence, 2);
  251. dma_fence_put(fence);
  252. if (err) {
  253. pr_err("Reported %d for find_seqno()!\n", err);
  254. goto err;
  255. }
  256. /*
  257. * We signaled the middle fence (2) of the 1-2-3 chain. The behavior
  258. * of the dma-fence-chain is to make us wait for all the fences up to
  259. * the point we want. Since fence 1 is still not signaled, this what
  260. * we should get as fence to wait upon (fence 2 being garbage
  261. * collected during the traversal of the chain).
  262. */
  263. if (fence != fc.chains[0]) {
  264. pr_err("Incorrect chain-fence.seqno:%lld reported for completed seqno:2\n",
  265. fence ? fence->seqno : 0);
  266. err = -EINVAL;
  267. }
  268. err:
  269. fence_chains_fini(&fc);
  270. return err;
  271. }
  272. static uint64_t seqno_inc2(unsigned int i)
  273. {
  274. return 2 * i + 2;
  275. }
  276. static int find_gap(void *arg)
  277. {
  278. struct fence_chains fc;
  279. struct dma_fence *fence;
  280. int err;
  281. int i;
  282. err = fence_chains_init(&fc, 64, seqno_inc2);
  283. if (err)
  284. return err;
  285. for (i = 0; i < fc.chain_length; i++) {
  286. fence = dma_fence_get(fc.tail);
  287. err = dma_fence_chain_find_seqno(&fence, 2 * i + 1);
  288. dma_fence_put(fence);
  289. if (err) {
  290. pr_err("Reported %d for find_seqno(%d:%d)!\n",
  291. err, fc.chain_length + 1, 2 * i + 1);
  292. goto err;
  293. }
  294. if (fence != fc.chains[i]) {
  295. pr_err("Incorrect fence.seqno:%lld reported by find_seqno(%d:%d)\n",
  296. fence->seqno,
  297. fc.chain_length + 1,
  298. 2 * i + 1);
  299. err = -EINVAL;
  300. goto err;
  301. }
  302. dma_fence_get(fence);
  303. err = dma_fence_chain_find_seqno(&fence, 2 * i + 2);
  304. dma_fence_put(fence);
  305. if (err) {
  306. pr_err("Error reported for finding self\n");
  307. goto err;
  308. }
  309. if (fence != fc.chains[i]) {
  310. pr_err("Incorrect fence reported by find self\n");
  311. err = -EINVAL;
  312. goto err;
  313. }
  314. }
  315. err:
  316. fence_chains_fini(&fc);
  317. return err;
  318. }
  319. struct find_race {
  320. struct fence_chains fc;
  321. atomic_t children;
  322. };
  323. static int __find_race(void *arg)
  324. {
  325. struct find_race *data = arg;
  326. int err = 0;
  327. while (!kthread_should_stop()) {
  328. struct dma_fence *fence = dma_fence_get(data->fc.tail);
  329. int seqno;
  330. seqno = get_random_u32_inclusive(1, data->fc.chain_length);
  331. err = dma_fence_chain_find_seqno(&fence, seqno);
  332. if (err) {
  333. pr_err("Failed to find fence seqno:%d\n",
  334. seqno);
  335. dma_fence_put(fence);
  336. break;
  337. }
  338. if (!fence)
  339. goto signal;
  340. /*
  341. * We can only find ourselves if we are on fence we were
  342. * looking for.
  343. */
  344. if (fence->seqno == seqno) {
  345. err = dma_fence_chain_find_seqno(&fence, seqno);
  346. if (err) {
  347. pr_err("Reported an invalid fence for find-self:%d\n",
  348. seqno);
  349. dma_fence_put(fence);
  350. break;
  351. }
  352. }
  353. dma_fence_put(fence);
  354. signal:
  355. seqno = get_random_u32_below(data->fc.chain_length - 1);
  356. dma_fence_signal(data->fc.fences[seqno]);
  357. cond_resched();
  358. }
  359. if (atomic_dec_and_test(&data->children))
  360. wake_up_var(&data->children);
  361. return err;
  362. }
  363. static int find_race(void *arg)
  364. {
  365. struct find_race data;
  366. int ncpus = num_online_cpus();
  367. struct task_struct **threads;
  368. unsigned long count;
  369. int err;
  370. int i;
  371. err = fence_chains_init(&data.fc, CHAIN_SZ, seqno_inc);
  372. if (err)
  373. return err;
  374. threads = kmalloc_objs(*threads, ncpus);
  375. if (!threads) {
  376. err = -ENOMEM;
  377. goto err;
  378. }
  379. atomic_set(&data.children, 0);
  380. for (i = 0; i < ncpus; i++) {
  381. threads[i] = kthread_run(__find_race, &data, "dmabuf/%d", i);
  382. if (IS_ERR(threads[i])) {
  383. ncpus = i;
  384. break;
  385. }
  386. atomic_inc(&data.children);
  387. get_task_struct(threads[i]);
  388. }
  389. wait_var_event_timeout(&data.children,
  390. !atomic_read(&data.children),
  391. 5 * HZ);
  392. for (i = 0; i < ncpus; i++) {
  393. int ret;
  394. ret = kthread_stop_put(threads[i]);
  395. if (ret && !err)
  396. err = ret;
  397. }
  398. kfree(threads);
  399. count = 0;
  400. for (i = 0; i < data.fc.chain_length; i++)
  401. if (dma_fence_is_signaled(data.fc.fences[i]))
  402. count++;
  403. pr_info("Completed %lu cycles\n", count);
  404. err:
  405. fence_chains_fini(&data.fc);
  406. return err;
  407. }
  408. static int signal_forward(void *arg)
  409. {
  410. struct fence_chains fc;
  411. int err;
  412. int i;
  413. err = fence_chains_init(&fc, 64, seqno_inc);
  414. if (err)
  415. return err;
  416. for (i = 0; i < fc.chain_length; i++) {
  417. dma_fence_signal(fc.fences[i]);
  418. if (!dma_fence_is_signaled(fc.chains[i])) {
  419. pr_err("chain[%d] not signaled!\n", i);
  420. err = -EINVAL;
  421. goto err;
  422. }
  423. if (i + 1 < fc.chain_length &&
  424. dma_fence_is_signaled(fc.chains[i + 1])) {
  425. pr_err("chain[%d] is signaled!\n", i);
  426. err = -EINVAL;
  427. goto err;
  428. }
  429. }
  430. err:
  431. fence_chains_fini(&fc);
  432. return err;
  433. }
  434. static int signal_backward(void *arg)
  435. {
  436. struct fence_chains fc;
  437. int err;
  438. int i;
  439. err = fence_chains_init(&fc, 64, seqno_inc);
  440. if (err)
  441. return err;
  442. for (i = fc.chain_length; i--; ) {
  443. dma_fence_signal(fc.fences[i]);
  444. if (i > 0 && dma_fence_is_signaled(fc.chains[i])) {
  445. pr_err("chain[%d] is signaled!\n", i);
  446. err = -EINVAL;
  447. goto err;
  448. }
  449. }
  450. for (i = 0; i < fc.chain_length; i++) {
  451. if (!dma_fence_is_signaled(fc.chains[i])) {
  452. pr_err("chain[%d] was not signaled!\n", i);
  453. err = -EINVAL;
  454. goto err;
  455. }
  456. }
  457. err:
  458. fence_chains_fini(&fc);
  459. return err;
  460. }
  461. static int __wait_fence_chains(void *arg)
  462. {
  463. struct fence_chains *fc = arg;
  464. if (dma_fence_wait(fc->tail, false))
  465. return -EIO;
  466. return 0;
  467. }
  468. static int wait_forward(void *arg)
  469. {
  470. struct fence_chains fc;
  471. struct task_struct *tsk;
  472. int err;
  473. int i;
  474. err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
  475. if (err)
  476. return err;
  477. tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
  478. if (IS_ERR(tsk)) {
  479. err = PTR_ERR(tsk);
  480. goto err;
  481. }
  482. get_task_struct(tsk);
  483. yield_to(tsk, true);
  484. for (i = 0; i < fc.chain_length; i++)
  485. dma_fence_signal(fc.fences[i]);
  486. err = kthread_stop_put(tsk);
  487. err:
  488. fence_chains_fini(&fc);
  489. return err;
  490. }
  491. static int wait_backward(void *arg)
  492. {
  493. struct fence_chains fc;
  494. struct task_struct *tsk;
  495. int err;
  496. int i;
  497. err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
  498. if (err)
  499. return err;
  500. tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
  501. if (IS_ERR(tsk)) {
  502. err = PTR_ERR(tsk);
  503. goto err;
  504. }
  505. get_task_struct(tsk);
  506. yield_to(tsk, true);
  507. for (i = fc.chain_length; i--; )
  508. dma_fence_signal(fc.fences[i]);
  509. err = kthread_stop_put(tsk);
  510. err:
  511. fence_chains_fini(&fc);
  512. return err;
  513. }
  514. static void randomise_fences(struct fence_chains *fc)
  515. {
  516. unsigned int count = fc->chain_length;
  517. /* Fisher-Yates shuffle courtesy of Knuth */
  518. while (--count) {
  519. unsigned int swp;
  520. swp = get_random_u32_below(count + 1);
  521. if (swp == count)
  522. continue;
  523. swap(fc->fences[count], fc->fences[swp]);
  524. }
  525. }
  526. static int wait_random(void *arg)
  527. {
  528. struct fence_chains fc;
  529. struct task_struct *tsk;
  530. int err;
  531. int i;
  532. err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
  533. if (err)
  534. return err;
  535. randomise_fences(&fc);
  536. tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
  537. if (IS_ERR(tsk)) {
  538. err = PTR_ERR(tsk);
  539. goto err;
  540. }
  541. get_task_struct(tsk);
  542. yield_to(tsk, true);
  543. for (i = 0; i < fc.chain_length; i++)
  544. dma_fence_signal(fc.fences[i]);
  545. err = kthread_stop_put(tsk);
  546. err:
  547. fence_chains_fini(&fc);
  548. return err;
  549. }
  550. int dma_fence_chain(void)
  551. {
  552. static const struct subtest tests[] = {
  553. SUBTEST(sanitycheck),
  554. SUBTEST(find_seqno),
  555. SUBTEST(find_signaled),
  556. SUBTEST(find_out_of_order),
  557. SUBTEST(find_gap),
  558. SUBTEST(find_race),
  559. SUBTEST(signal_forward),
  560. SUBTEST(signal_backward),
  561. SUBTEST(wait_forward),
  562. SUBTEST(wait_backward),
  563. SUBTEST(wait_random),
  564. };
  565. int ret;
  566. pr_info("sizeof(dma_fence_chain)=%zu\n",
  567. sizeof(struct dma_fence_chain));
  568. slab_fences = KMEM_CACHE(mock_fence,
  569. SLAB_TYPESAFE_BY_RCU |
  570. SLAB_HWCACHE_ALIGN);
  571. if (!slab_fences)
  572. return -ENOMEM;
  573. ret = subtests(tests, NULL);
  574. kmem_cache_destroy(slab_fences);
  575. return ret;
  576. }