ivpu_gem.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (C) 2020-2023 Intel Corporation
  4. */
  5. #include <linux/dma-buf.h>
  6. #include <linux/highmem.h>
  7. #include <linux/module.h>
  8. #include <linux/set_memory.h>
  9. #include <linux/xarray.h>
  10. #include <drm/drm_cache.h>
  11. #include <drm/drm_debugfs.h>
  12. #include <drm/drm_file.h>
  13. #include <drm/drm_utils.h>
  14. #include "ivpu_drv.h"
  15. #include "ivpu_fw.h"
  16. #include "ivpu_gem.h"
  17. #include "ivpu_hw.h"
  18. #include "ivpu_mmu.h"
  19. #include "ivpu_mmu_context.h"
  20. MODULE_IMPORT_NS("DMA_BUF");
  21. static const struct drm_gem_object_funcs ivpu_gem_funcs;
  22. static inline void ivpu_dbg_bo(struct ivpu_device *vdev, struct ivpu_bo *bo, const char *action)
  23. {
  24. ivpu_dbg(vdev, BO,
  25. "%6s: bo %8p size %9zu ctx %d vpu_addr %9llx pages %d sgt %d mmu_mapped %d wc %d imported %d\n",
  26. action, bo, ivpu_bo_size(bo), bo->ctx_id, bo->vpu_addr,
  27. (bool)bo->base.pages, (bool)bo->base.sgt, bo->mmu_mapped, bo->base.map_wc,
  28. (bool)drm_gem_is_imported(&bo->base.base));
  29. }
  30. static inline int ivpu_bo_lock(struct ivpu_bo *bo)
  31. {
  32. return dma_resv_lock(bo->base.base.resv, NULL);
  33. }
  34. static inline void ivpu_bo_unlock(struct ivpu_bo *bo)
  35. {
  36. dma_resv_unlock(bo->base.base.resv);
  37. }
  38. static struct sg_table *ivpu_bo_map_attachment(struct ivpu_device *vdev, struct ivpu_bo *bo)
  39. {
  40. struct sg_table *sgt;
  41. drm_WARN_ON(&vdev->drm, !bo->base.base.import_attach);
  42. ivpu_bo_lock(bo);
  43. sgt = bo->base.sgt;
  44. if (!sgt) {
  45. sgt = dma_buf_map_attachment(bo->base.base.import_attach, DMA_BIDIRECTIONAL);
  46. if (IS_ERR(sgt))
  47. ivpu_err(vdev, "Failed to map BO in IOMMU: %ld\n", PTR_ERR(sgt));
  48. else
  49. bo->base.sgt = sgt;
  50. }
  51. ivpu_bo_unlock(bo);
  52. return sgt;
  53. }
  54. /*
  55. * ivpu_bo_bind() - pin the backing physical pages and map them to VPU.
  56. *
  57. * This function pins physical memory pages, then maps the physical pages
  58. * to IOMMU address space and finally updates the VPU MMU page tables
  59. * to allow the VPU to translate VPU address to IOMMU address.
  60. */
  61. int __must_check ivpu_bo_bind(struct ivpu_bo *bo)
  62. {
  63. struct ivpu_device *vdev = ivpu_bo_to_vdev(bo);
  64. struct sg_table *sgt;
  65. int ret = 0;
  66. ivpu_dbg_bo(vdev, bo, "bind");
  67. if (bo->base.base.import_attach)
  68. sgt = ivpu_bo_map_attachment(vdev, bo);
  69. else
  70. sgt = drm_gem_shmem_get_pages_sgt(&bo->base);
  71. if (IS_ERR(sgt)) {
  72. ret = PTR_ERR(sgt);
  73. ivpu_err(vdev, "Failed to map BO in IOMMU: %d\n", ret);
  74. return ret;
  75. }
  76. ivpu_bo_lock(bo);
  77. if (!bo->mmu_mapped) {
  78. drm_WARN_ON(&vdev->drm, !bo->ctx);
  79. ret = ivpu_mmu_context_map_sgt(vdev, bo->ctx, bo->vpu_addr, sgt, ivpu_bo_size(bo),
  80. ivpu_bo_is_snooped(bo), ivpu_bo_is_read_only(bo));
  81. if (ret) {
  82. ivpu_err(vdev, "Failed to map BO in MMU: %d\n", ret);
  83. goto unlock;
  84. }
  85. bo->mmu_mapped = true;
  86. }
  87. unlock:
  88. ivpu_bo_unlock(bo);
  89. return ret;
  90. }
  91. static int
  92. ivpu_bo_alloc_vpu_addr(struct ivpu_bo *bo, struct ivpu_mmu_context *ctx,
  93. const struct ivpu_addr_range *range)
  94. {
  95. struct ivpu_device *vdev = ivpu_bo_to_vdev(bo);
  96. int idx, ret;
  97. if (!drm_dev_enter(&vdev->drm, &idx))
  98. return -ENODEV;
  99. ivpu_bo_lock(bo);
  100. ret = ivpu_mmu_context_insert_node(ctx, range, ivpu_bo_size(bo), &bo->mm_node);
  101. if (!ret) {
  102. bo->ctx = ctx;
  103. bo->ctx_id = ctx->id;
  104. bo->vpu_addr = bo->mm_node.start;
  105. ivpu_dbg_bo(vdev, bo, "vaddr");
  106. }
  107. ivpu_bo_unlock(bo);
  108. drm_dev_exit(idx);
  109. return ret;
  110. }
  111. static void ivpu_bo_unbind_locked(struct ivpu_bo *bo)
  112. {
  113. struct ivpu_device *vdev = ivpu_bo_to_vdev(bo);
  114. dma_resv_assert_held(bo->base.base.resv);
  115. if (bo->mmu_mapped) {
  116. drm_WARN_ON(&vdev->drm, !bo->ctx);
  117. drm_WARN_ON(&vdev->drm, !bo->vpu_addr);
  118. drm_WARN_ON(&vdev->drm, !bo->base.sgt);
  119. ivpu_mmu_context_unmap_sgt(vdev, bo->ctx, bo->vpu_addr, bo->base.sgt);
  120. bo->mmu_mapped = false;
  121. }
  122. if (bo->ctx) {
  123. ivpu_mmu_context_remove_node(bo->ctx, &bo->mm_node);
  124. bo->ctx = NULL;
  125. }
  126. if (bo->base.sgt) {
  127. if (bo->base.base.import_attach) {
  128. dma_buf_unmap_attachment(bo->base.base.import_attach,
  129. bo->base.sgt, DMA_BIDIRECTIONAL);
  130. } else {
  131. dma_unmap_sgtable(vdev->drm.dev, bo->base.sgt, DMA_BIDIRECTIONAL, 0);
  132. sg_free_table(bo->base.sgt);
  133. kfree(bo->base.sgt);
  134. }
  135. bo->base.sgt = NULL;
  136. }
  137. }
  138. void ivpu_bo_unbind_all_bos_from_context(struct ivpu_device *vdev, struct ivpu_mmu_context *ctx)
  139. {
  140. struct ivpu_bo *bo;
  141. if (drm_WARN_ON(&vdev->drm, !ctx))
  142. return;
  143. mutex_lock(&vdev->bo_list_lock);
  144. list_for_each_entry(bo, &vdev->bo_list, bo_list_node) {
  145. ivpu_bo_lock(bo);
  146. if (bo->ctx == ctx) {
  147. ivpu_dbg_bo(vdev, bo, "unbind");
  148. ivpu_bo_unbind_locked(bo);
  149. }
  150. ivpu_bo_unlock(bo);
  151. }
  152. mutex_unlock(&vdev->bo_list_lock);
  153. }
  154. struct drm_gem_object *ivpu_gem_create_object(struct drm_device *dev, size_t size)
  155. {
  156. struct ivpu_bo *bo;
  157. if (size == 0 || !PAGE_ALIGNED(size))
  158. return ERR_PTR(-EINVAL);
  159. bo = kzalloc(sizeof(*bo), GFP_KERNEL);
  160. if (!bo)
  161. return ERR_PTR(-ENOMEM);
  162. bo->base.base.funcs = &ivpu_gem_funcs;
  163. bo->base.pages_mark_dirty_on_put = true; /* VPU can dirty a BO anytime */
  164. INIT_LIST_HEAD(&bo->bo_list_node);
  165. return &bo->base.base;
  166. }
  167. struct drm_gem_object *ivpu_gem_prime_import(struct drm_device *dev,
  168. struct dma_buf *dma_buf)
  169. {
  170. struct ivpu_device *vdev = to_ivpu_device(dev);
  171. struct device *attach_dev = dev->dev;
  172. struct dma_buf_attachment *attach;
  173. struct drm_gem_object *obj;
  174. struct ivpu_bo *bo;
  175. int ret;
  176. attach = dma_buf_attach(dma_buf, attach_dev);
  177. if (IS_ERR(attach))
  178. return ERR_CAST(attach);
  179. get_dma_buf(dma_buf);
  180. obj = drm_gem_shmem_prime_import_sg_table(dev, attach, NULL);
  181. if (IS_ERR(obj)) {
  182. ret = PTR_ERR(obj);
  183. goto fail_detach;
  184. }
  185. obj->import_attach = attach;
  186. obj->resv = dma_buf->resv;
  187. bo = to_ivpu_bo(obj);
  188. mutex_lock(&vdev->bo_list_lock);
  189. list_add_tail(&bo->bo_list_node, &vdev->bo_list);
  190. mutex_unlock(&vdev->bo_list_lock);
  191. ivpu_dbg(vdev, BO, "import: bo %8p size %9zu\n", bo, ivpu_bo_size(bo));
  192. return obj;
  193. fail_detach:
  194. dma_buf_detach(dma_buf, attach);
  195. dma_buf_put(dma_buf);
  196. return ERR_PTR(ret);
  197. }
  198. static struct ivpu_bo *ivpu_bo_alloc(struct ivpu_device *vdev, u64 size, u32 flags)
  199. {
  200. struct drm_gem_shmem_object *shmem;
  201. struct ivpu_bo *bo;
  202. switch (flags & DRM_IVPU_BO_CACHE_MASK) {
  203. case DRM_IVPU_BO_CACHED:
  204. case DRM_IVPU_BO_WC:
  205. break;
  206. default:
  207. return ERR_PTR(-EINVAL);
  208. }
  209. shmem = drm_gem_shmem_create(&vdev->drm, size);
  210. if (IS_ERR(shmem))
  211. return ERR_CAST(shmem);
  212. bo = to_ivpu_bo(&shmem->base);
  213. bo->base.map_wc = flags & DRM_IVPU_BO_WC;
  214. bo->flags = flags;
  215. mutex_lock(&vdev->bo_list_lock);
  216. list_add_tail(&bo->bo_list_node, &vdev->bo_list);
  217. mutex_unlock(&vdev->bo_list_lock);
  218. ivpu_dbg(vdev, BO, " alloc: bo %8p size %9llu\n", bo, size);
  219. return bo;
  220. }
  221. static int ivpu_gem_bo_open(struct drm_gem_object *obj, struct drm_file *file)
  222. {
  223. struct ivpu_file_priv *file_priv = file->driver_priv;
  224. struct ivpu_device *vdev = file_priv->vdev;
  225. struct ivpu_bo *bo = to_ivpu_bo(obj);
  226. struct ivpu_addr_range *range;
  227. if (bo->ctx) {
  228. ivpu_dbg(vdev, IOCTL, "Can't add BO %pe to ctx %u: already in ctx %u\n",
  229. bo, file_priv->ctx.id, bo->ctx->id);
  230. return -EALREADY;
  231. }
  232. if (bo->flags & DRM_IVPU_BO_SHAVE_MEM)
  233. range = &vdev->hw->ranges.shave;
  234. else if (bo->flags & DRM_IVPU_BO_DMA_MEM)
  235. range = &vdev->hw->ranges.dma;
  236. else
  237. range = &vdev->hw->ranges.user;
  238. return ivpu_bo_alloc_vpu_addr(bo, &file_priv->ctx, range);
  239. }
  240. static void ivpu_gem_bo_free(struct drm_gem_object *obj)
  241. {
  242. struct ivpu_device *vdev = to_ivpu_device(obj->dev);
  243. struct ivpu_bo *bo = to_ivpu_bo(obj);
  244. ivpu_dbg_bo(vdev, bo, "free");
  245. drm_WARN_ON(&vdev->drm, list_empty(&bo->bo_list_node));
  246. mutex_lock(&vdev->bo_list_lock);
  247. list_del(&bo->bo_list_node);
  248. drm_WARN_ON(&vdev->drm, !drm_gem_is_imported(&bo->base.base) &&
  249. !dma_resv_test_signaled(obj->resv, DMA_RESV_USAGE_READ));
  250. drm_WARN_ON(&vdev->drm, ivpu_bo_size(bo) == 0);
  251. drm_WARN_ON(&vdev->drm, bo->base.vaddr);
  252. ivpu_bo_lock(bo);
  253. ivpu_bo_unbind_locked(bo);
  254. ivpu_bo_unlock(bo);
  255. mutex_unlock(&vdev->bo_list_lock);
  256. drm_WARN_ON(&vdev->drm, bo->mmu_mapped);
  257. drm_WARN_ON(&vdev->drm, bo->ctx);
  258. drm_WARN_ON(obj->dev, refcount_read(&bo->base.pages_use_count) > 1);
  259. drm_WARN_ON(obj->dev, bo->base.base.vma_node.vm_files.rb_node);
  260. drm_gem_shmem_free(&bo->base);
  261. }
  262. static enum drm_gem_object_status ivpu_gem_status(struct drm_gem_object *obj)
  263. {
  264. struct ivpu_bo *bo = to_ivpu_bo(obj);
  265. enum drm_gem_object_status status = 0;
  266. if (ivpu_bo_is_resident(bo))
  267. status |= DRM_GEM_OBJECT_RESIDENT;
  268. return status;
  269. }
  270. static const struct drm_gem_object_funcs ivpu_gem_funcs = {
  271. .free = ivpu_gem_bo_free,
  272. .open = ivpu_gem_bo_open,
  273. .print_info = drm_gem_shmem_object_print_info,
  274. .pin = drm_gem_shmem_object_pin,
  275. .unpin = drm_gem_shmem_object_unpin,
  276. .get_sg_table = drm_gem_shmem_object_get_sg_table,
  277. .vmap = drm_gem_shmem_object_vmap,
  278. .vunmap = drm_gem_shmem_object_vunmap,
  279. .mmap = drm_gem_shmem_object_mmap,
  280. .status = ivpu_gem_status,
  281. .vm_ops = &drm_gem_shmem_vm_ops,
  282. };
  283. int ivpu_bo_create_ioctl(struct drm_device *dev, void *data, struct drm_file *file)
  284. {
  285. struct ivpu_file_priv *file_priv = file->driver_priv;
  286. struct ivpu_device *vdev = file_priv->vdev;
  287. struct drm_ivpu_bo_create *args = data;
  288. u64 size = PAGE_ALIGN(args->size);
  289. struct ivpu_bo *bo;
  290. int ret;
  291. if (args->flags & ~DRM_IVPU_BO_FLAGS) {
  292. ivpu_dbg(vdev, IOCTL, "Invalid BO flags 0x%x\n", args->flags);
  293. return -EINVAL;
  294. }
  295. if (size == 0) {
  296. ivpu_dbg(vdev, IOCTL, "Invalid BO size %llu\n", args->size);
  297. return -EINVAL;
  298. }
  299. bo = ivpu_bo_alloc(vdev, size, args->flags);
  300. if (IS_ERR(bo)) {
  301. ivpu_dbg(vdev, IOCTL, "Failed to allocate BO: %pe ctx %u size %llu flags 0x%x\n",
  302. bo, file_priv->ctx.id, args->size, args->flags);
  303. return PTR_ERR(bo);
  304. }
  305. drm_WARN_ON(&vdev->drm, bo->base.base.handle_count != 0);
  306. ret = drm_gem_handle_create(file, &bo->base.base, &args->handle);
  307. if (ret) {
  308. ivpu_dbg(vdev, IOCTL, "Failed to create handle for BO: %pe ctx %u size %llu flags 0x%x\n",
  309. bo, file_priv->ctx.id, args->size, args->flags);
  310. } else {
  311. args->vpu_addr = bo->vpu_addr;
  312. drm_WARN_ON(&vdev->drm, bo->base.base.handle_count != 1);
  313. }
  314. drm_gem_object_put(&bo->base.base);
  315. return ret;
  316. }
  317. struct ivpu_bo *
  318. ivpu_bo_create(struct ivpu_device *vdev, struct ivpu_mmu_context *ctx,
  319. struct ivpu_addr_range *range, u64 size, u32 flags)
  320. {
  321. struct iosys_map map;
  322. struct ivpu_bo *bo;
  323. int ret;
  324. if (drm_WARN_ON(&vdev->drm, !range))
  325. return NULL;
  326. drm_WARN_ON(&vdev->drm, !PAGE_ALIGNED(range->start));
  327. drm_WARN_ON(&vdev->drm, !PAGE_ALIGNED(range->end));
  328. drm_WARN_ON(&vdev->drm, !PAGE_ALIGNED(size));
  329. bo = ivpu_bo_alloc(vdev, size, flags);
  330. if (IS_ERR(bo)) {
  331. ivpu_err(vdev, "Failed to allocate BO: %pe vpu_addr 0x%llx size %llu flags 0x%x\n",
  332. bo, range->start, size, flags);
  333. return NULL;
  334. }
  335. ret = ivpu_bo_alloc_vpu_addr(bo, ctx, range);
  336. if (ret) {
  337. ivpu_err(vdev, "Failed to allocate NPU address for BO: %pe ctx %u size %llu: %d\n",
  338. bo, ctx->id, size, ret);
  339. goto err_put;
  340. }
  341. ret = ivpu_bo_bind(bo);
  342. if (ret)
  343. goto err_put;
  344. if (flags & DRM_IVPU_BO_MAPPABLE) {
  345. ivpu_bo_lock(bo);
  346. ret = drm_gem_shmem_vmap_locked(&bo->base, &map);
  347. ivpu_bo_unlock(bo);
  348. if (ret)
  349. goto err_put;
  350. }
  351. return bo;
  352. err_put:
  353. drm_gem_object_put(&bo->base.base);
  354. return NULL;
  355. }
  356. struct ivpu_bo *ivpu_bo_create_runtime(struct ivpu_device *vdev, u64 addr, u64 size, u32 flags)
  357. {
  358. struct ivpu_addr_range range;
  359. if (!ivpu_is_within_range(addr, size, &vdev->hw->ranges.runtime)) {
  360. ivpu_err(vdev, "Invalid runtime BO address 0x%llx size %llu\n", addr, size);
  361. return NULL;
  362. }
  363. if (ivpu_hw_range_init(vdev, &range, addr, size))
  364. return NULL;
  365. return ivpu_bo_create(vdev, &vdev->gctx, &range, size, flags);
  366. }
  367. struct ivpu_bo *ivpu_bo_create_global(struct ivpu_device *vdev, u64 size, u32 flags)
  368. {
  369. return ivpu_bo_create(vdev, &vdev->gctx, &vdev->hw->ranges.global, size, flags);
  370. }
  371. void ivpu_bo_free(struct ivpu_bo *bo)
  372. {
  373. struct iosys_map map = IOSYS_MAP_INIT_VADDR(bo->base.vaddr);
  374. if (bo->flags & DRM_IVPU_BO_MAPPABLE) {
  375. ivpu_bo_lock(bo);
  376. drm_gem_shmem_vunmap_locked(&bo->base, &map);
  377. ivpu_bo_unlock(bo);
  378. }
  379. drm_gem_object_put(&bo->base.base);
  380. }
  381. int ivpu_bo_info_ioctl(struct drm_device *dev, void *data, struct drm_file *file)
  382. {
  383. struct drm_ivpu_bo_info *args = data;
  384. struct drm_gem_object *obj;
  385. struct ivpu_bo *bo;
  386. int ret = 0;
  387. obj = drm_gem_object_lookup(file, args->handle);
  388. if (!obj)
  389. return -ENOENT;
  390. bo = to_ivpu_bo(obj);
  391. ivpu_bo_lock(bo);
  392. args->flags = bo->flags;
  393. args->mmap_offset = drm_vma_node_offset_addr(&obj->vma_node);
  394. args->vpu_addr = bo->vpu_addr;
  395. args->size = obj->size;
  396. ivpu_bo_unlock(bo);
  397. drm_gem_object_put(obj);
  398. return ret;
  399. }
  400. int ivpu_bo_wait_ioctl(struct drm_device *dev, void *data, struct drm_file *file)
  401. {
  402. struct drm_ivpu_bo_wait *args = data;
  403. struct drm_gem_object *obj;
  404. unsigned long timeout;
  405. long ret;
  406. timeout = drm_timeout_abs_to_jiffies(args->timeout_ns);
  407. /* Add 1 jiffy to ensure the wait function never times out before intended timeout_ns */
  408. timeout += 1;
  409. obj = drm_gem_object_lookup(file, args->handle);
  410. if (!obj)
  411. return -EINVAL;
  412. ret = dma_resv_wait_timeout(obj->resv, DMA_RESV_USAGE_READ, true, timeout);
  413. if (ret == 0) {
  414. ret = -ETIMEDOUT;
  415. } else if (ret > 0) {
  416. ret = 0;
  417. args->job_status = to_ivpu_bo(obj)->job_status;
  418. }
  419. drm_gem_object_put(obj);
  420. return ret;
  421. }
  422. static void ivpu_bo_print_info(struct ivpu_bo *bo, struct drm_printer *p)
  423. {
  424. ivpu_bo_lock(bo);
  425. drm_printf(p, "%-9p %-3u 0x%-12llx %-10lu 0x%-8x %-4u",
  426. bo, bo->ctx_id, bo->vpu_addr, bo->base.base.size,
  427. bo->flags, kref_read(&bo->base.base.refcount));
  428. if (bo->base.pages)
  429. drm_printf(p, " has_pages");
  430. if (bo->mmu_mapped)
  431. drm_printf(p, " mmu_mapped");
  432. if (drm_gem_is_imported(&bo->base.base))
  433. drm_printf(p, " imported");
  434. drm_printf(p, "\n");
  435. ivpu_bo_unlock(bo);
  436. }
  437. void ivpu_bo_list(struct drm_device *dev, struct drm_printer *p)
  438. {
  439. struct ivpu_device *vdev = to_ivpu_device(dev);
  440. struct ivpu_bo *bo;
  441. drm_printf(p, "%-9s %-3s %-14s %-10s %-10s %-4s %s\n",
  442. "bo", "ctx", "vpu_addr", "size", "flags", "refs", "attribs");
  443. mutex_lock(&vdev->bo_list_lock);
  444. list_for_each_entry(bo, &vdev->bo_list, bo_list_node)
  445. ivpu_bo_print_info(bo, p);
  446. mutex_unlock(&vdev->bo_list_lock);
  447. }
  448. void ivpu_bo_list_print(struct drm_device *dev)
  449. {
  450. struct drm_printer p = drm_info_printer(dev->dev);
  451. ivpu_bo_list(dev, &p);
  452. }