radeon_ttm.c 23 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910
  1. /*
  2. * Copyright 2009 Jerome Glisse.
  3. * All Rights Reserved.
  4. *
  5. * Permission is hereby granted, free of charge, to any person obtaining a
  6. * copy of this software and associated documentation files (the
  7. * "Software"), to deal in the Software without restriction, including
  8. * without limitation the rights to use, copy, modify, merge, publish,
  9. * distribute, sub license, and/or sell copies of the Software, and to
  10. * permit persons to whom the Software is furnished to do so, subject to
  11. * the following conditions:
  12. *
  13. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  14. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  15. * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
  16. * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
  17. * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  18. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
  19. * USE OR OTHER DEALINGS IN THE SOFTWARE.
  20. *
  21. * The above copyright notice and this permission notice (including the
  22. * next paragraph) shall be included in all copies or substantial portions
  23. * of the Software.
  24. *
  25. */
  26. /*
  27. * Authors:
  28. * Jerome Glisse <glisse@freedesktop.org>
  29. * Thomas Hellstrom <thomas-at-tungstengraphics-dot-com>
  30. * Dave Airlie
  31. */
  32. #include <linux/debugfs.h>
  33. #include <linux/dma-mapping.h>
  34. #include <linux/pagemap.h>
  35. #include <linux/pci.h>
  36. #include <linux/seq_file.h>
  37. #include <linux/slab.h>
  38. #include <linux/swap.h>
  39. #include <drm/drm_device.h>
  40. #include <drm/drm_file.h>
  41. #include <drm/drm_prime.h>
  42. #include <drm/radeon_drm.h>
  43. #include <drm/ttm/ttm_bo.h>
  44. #include <drm/ttm/ttm_placement.h>
  45. #include <drm/ttm/ttm_range_manager.h>
  46. #include <drm/ttm/ttm_tt.h>
  47. #include "radeon_reg.h"
  48. #include "radeon.h"
  49. #include "radeon_ttm.h"
  50. static void radeon_ttm_debugfs_init(struct radeon_device *rdev);
  51. static int radeon_ttm_tt_bind(struct ttm_device *bdev, struct ttm_tt *ttm,
  52. struct ttm_resource *bo_mem);
  53. static void radeon_ttm_tt_unbind(struct ttm_device *bdev, struct ttm_tt *ttm);
  54. struct radeon_device *radeon_get_rdev(struct ttm_device *bdev)
  55. {
  56. struct radeon_mman *mman;
  57. struct radeon_device *rdev;
  58. mman = container_of(bdev, struct radeon_mman, bdev);
  59. rdev = container_of(mman, struct radeon_device, mman);
  60. return rdev;
  61. }
  62. static int radeon_ttm_init_vram(struct radeon_device *rdev)
  63. {
  64. return ttm_range_man_init(&rdev->mman.bdev, TTM_PL_VRAM,
  65. false, rdev->mc.real_vram_size >> PAGE_SHIFT);
  66. }
  67. static int radeon_ttm_init_gtt(struct radeon_device *rdev)
  68. {
  69. return ttm_range_man_init(&rdev->mman.bdev, TTM_PL_TT,
  70. true, rdev->mc.gtt_size >> PAGE_SHIFT);
  71. }
  72. static void radeon_evict_flags(struct ttm_buffer_object *bo,
  73. struct ttm_placement *placement)
  74. {
  75. static const struct ttm_place placements = {
  76. .fpfn = 0,
  77. .lpfn = 0,
  78. .mem_type = TTM_PL_SYSTEM,
  79. .flags = 0
  80. };
  81. struct radeon_bo *rbo;
  82. if (!radeon_ttm_bo_is_radeon_bo(bo)) {
  83. placement->placement = &placements;
  84. placement->num_placement = 1;
  85. return;
  86. }
  87. rbo = container_of(bo, struct radeon_bo, tbo);
  88. switch (bo->resource->mem_type) {
  89. case TTM_PL_VRAM:
  90. if (rbo->rdev->ring[radeon_copy_ring_index(rbo->rdev)].ready == false)
  91. radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_CPU);
  92. else if (rbo->rdev->mc.visible_vram_size < rbo->rdev->mc.real_vram_size &&
  93. bo->resource->start < (rbo->rdev->mc.visible_vram_size >> PAGE_SHIFT)) {
  94. unsigned fpfn = rbo->rdev->mc.visible_vram_size >> PAGE_SHIFT;
  95. int i;
  96. /* Try evicting to the CPU inaccessible part of VRAM
  97. * first, but only set GTT as busy placement, so this
  98. * BO will be evicted to GTT rather than causing other
  99. * BOs to be evicted from VRAM
  100. */
  101. radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_VRAM |
  102. RADEON_GEM_DOMAIN_GTT);
  103. for (i = 0; i < rbo->placement.num_placement; i++) {
  104. if (rbo->placements[i].mem_type == TTM_PL_VRAM) {
  105. if (rbo->placements[i].fpfn < fpfn)
  106. rbo->placements[i].fpfn = fpfn;
  107. rbo->placements[0].flags |= TTM_PL_FLAG_DESIRED;
  108. }
  109. }
  110. } else
  111. radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_GTT);
  112. break;
  113. case TTM_PL_TT:
  114. default:
  115. radeon_ttm_placement_from_domain(rbo, RADEON_GEM_DOMAIN_CPU);
  116. }
  117. *placement = rbo->placement;
  118. }
  119. static int radeon_move_blit(struct ttm_buffer_object *bo,
  120. bool evict,
  121. struct ttm_resource *new_mem,
  122. struct ttm_resource *old_mem)
  123. {
  124. struct radeon_device *rdev;
  125. uint64_t old_start, new_start;
  126. struct radeon_fence *fence;
  127. unsigned num_pages;
  128. int r, ridx;
  129. rdev = radeon_get_rdev(bo->bdev);
  130. ridx = radeon_copy_ring_index(rdev);
  131. old_start = (u64)old_mem->start << PAGE_SHIFT;
  132. new_start = (u64)new_mem->start << PAGE_SHIFT;
  133. switch (old_mem->mem_type) {
  134. case TTM_PL_VRAM:
  135. old_start += rdev->mc.vram_start;
  136. break;
  137. case TTM_PL_TT:
  138. old_start += rdev->mc.gtt_start;
  139. break;
  140. default:
  141. DRM_ERROR("Unknown placement %d\n", old_mem->mem_type);
  142. return -EINVAL;
  143. }
  144. switch (new_mem->mem_type) {
  145. case TTM_PL_VRAM:
  146. new_start += rdev->mc.vram_start;
  147. break;
  148. case TTM_PL_TT:
  149. new_start += rdev->mc.gtt_start;
  150. break;
  151. default:
  152. DRM_ERROR("Unknown placement %d\n", old_mem->mem_type);
  153. return -EINVAL;
  154. }
  155. if (!rdev->ring[ridx].ready) {
  156. DRM_ERROR("Trying to move memory with ring turned off.\n");
  157. return -EINVAL;
  158. }
  159. BUILD_BUG_ON((PAGE_SIZE % RADEON_GPU_PAGE_SIZE) != 0);
  160. num_pages = PFN_UP(new_mem->size) * (PAGE_SIZE / RADEON_GPU_PAGE_SIZE);
  161. fence = radeon_copy(rdev, old_start, new_start, num_pages, bo->base.resv);
  162. if (IS_ERR(fence))
  163. return PTR_ERR(fence);
  164. r = ttm_bo_move_accel_cleanup(bo, &fence->base, evict, false, new_mem);
  165. radeon_fence_unref(&fence);
  166. return r;
  167. }
  168. static int radeon_bo_move(struct ttm_buffer_object *bo, bool evict,
  169. struct ttm_operation_ctx *ctx,
  170. struct ttm_resource *new_mem,
  171. struct ttm_place *hop)
  172. {
  173. struct ttm_resource *old_mem = bo->resource;
  174. struct radeon_device *rdev;
  175. int r;
  176. if (new_mem->mem_type == TTM_PL_TT) {
  177. r = radeon_ttm_tt_bind(bo->bdev, bo->ttm, new_mem);
  178. if (r)
  179. return r;
  180. }
  181. r = ttm_bo_wait_ctx(bo, ctx);
  182. if (r)
  183. return r;
  184. rdev = radeon_get_rdev(bo->bdev);
  185. if (!old_mem || (old_mem->mem_type == TTM_PL_SYSTEM &&
  186. bo->ttm == NULL)) {
  187. ttm_bo_move_null(bo, new_mem);
  188. goto out;
  189. }
  190. if (old_mem->mem_type == TTM_PL_SYSTEM &&
  191. new_mem->mem_type == TTM_PL_TT) {
  192. ttm_bo_move_null(bo, new_mem);
  193. goto out;
  194. }
  195. if (old_mem->mem_type == TTM_PL_TT &&
  196. new_mem->mem_type == TTM_PL_SYSTEM) {
  197. radeon_ttm_tt_unbind(bo->bdev, bo->ttm);
  198. ttm_bo_move_null(bo, new_mem);
  199. goto out;
  200. }
  201. if (rdev->ring[radeon_copy_ring_index(rdev)].ready &&
  202. rdev->asic->copy.copy != NULL) {
  203. if ((old_mem->mem_type == TTM_PL_SYSTEM &&
  204. new_mem->mem_type == TTM_PL_VRAM) ||
  205. (old_mem->mem_type == TTM_PL_VRAM &&
  206. new_mem->mem_type == TTM_PL_SYSTEM)) {
  207. hop->fpfn = 0;
  208. hop->lpfn = 0;
  209. hop->mem_type = TTM_PL_TT;
  210. hop->flags = 0;
  211. return -EMULTIHOP;
  212. }
  213. r = radeon_move_blit(bo, evict, new_mem, old_mem);
  214. } else {
  215. r = -ENODEV;
  216. }
  217. if (r) {
  218. r = ttm_bo_move_memcpy(bo, ctx, new_mem);
  219. if (r)
  220. return r;
  221. }
  222. out:
  223. /* update statistics */
  224. atomic64_add(bo->base.size, &rdev->num_bytes_moved);
  225. radeon_bo_move_notify(bo);
  226. return 0;
  227. }
  228. static int radeon_ttm_io_mem_reserve(struct ttm_device *bdev, struct ttm_resource *mem)
  229. {
  230. struct radeon_device *rdev = radeon_get_rdev(bdev);
  231. size_t bus_size = (size_t)mem->size;
  232. switch (mem->mem_type) {
  233. case TTM_PL_SYSTEM:
  234. /* system memory */
  235. return 0;
  236. case TTM_PL_TT:
  237. #if IS_ENABLED(CONFIG_AGP)
  238. if (rdev->flags & RADEON_IS_AGP) {
  239. /* RADEON_IS_AGP is set only if AGP is active */
  240. mem->bus.offset = (mem->start << PAGE_SHIFT) +
  241. rdev->mc.agp_base;
  242. mem->bus.is_iomem = !rdev->agp->cant_use_aperture;
  243. mem->bus.caching = ttm_write_combined;
  244. }
  245. #endif
  246. break;
  247. case TTM_PL_VRAM:
  248. mem->bus.offset = mem->start << PAGE_SHIFT;
  249. /* check if it's visible */
  250. if ((mem->bus.offset + bus_size) > rdev->mc.visible_vram_size)
  251. return -EINVAL;
  252. mem->bus.offset += rdev->mc.aper_base;
  253. mem->bus.is_iomem = true;
  254. mem->bus.caching = ttm_write_combined;
  255. #ifdef __alpha__
  256. /*
  257. * Alpha: use bus.addr to hold the ioremap() return,
  258. * so we can modify bus.base below.
  259. */
  260. mem->bus.addr = ioremap_wc(mem->bus.offset, bus_size);
  261. if (!mem->bus.addr)
  262. return -ENOMEM;
  263. /*
  264. * Alpha: Use just the bus offset plus
  265. * the hose/domain memory base for bus.base.
  266. * It then can be used to build PTEs for VRAM
  267. * access, as done in ttm_bo_vm_fault().
  268. */
  269. mem->bus.offset = (mem->bus.offset & 0x0ffffffffUL) +
  270. rdev->hose->dense_mem_base;
  271. #endif
  272. break;
  273. default:
  274. return -EINVAL;
  275. }
  276. return 0;
  277. }
  278. /*
  279. * TTM backend functions.
  280. */
  281. struct radeon_ttm_tt {
  282. struct ttm_tt ttm;
  283. u64 offset;
  284. uint64_t userptr;
  285. struct mm_struct *usermm;
  286. uint32_t userflags;
  287. bool bound;
  288. };
  289. /* prepare the sg table with the user pages */
  290. static int radeon_ttm_tt_pin_userptr(struct ttm_device *bdev, struct ttm_tt *ttm)
  291. {
  292. struct radeon_device *rdev = radeon_get_rdev(bdev);
  293. struct radeon_ttm_tt *gtt = (void *)ttm;
  294. unsigned pinned = 0;
  295. int r;
  296. int write = !(gtt->userflags & RADEON_GEM_USERPTR_READONLY);
  297. enum dma_data_direction direction = write ?
  298. DMA_BIDIRECTIONAL : DMA_TO_DEVICE;
  299. if (current->mm != gtt->usermm)
  300. return -EPERM;
  301. if (gtt->userflags & RADEON_GEM_USERPTR_ANONONLY) {
  302. /* check that we only pin down anonymous memory
  303. to prevent problems with writeback */
  304. unsigned long end = gtt->userptr + (u64)ttm->num_pages * PAGE_SIZE;
  305. struct vm_area_struct *vma;
  306. vma = find_vma(gtt->usermm, gtt->userptr);
  307. if (!vma || vma->vm_file || vma->vm_end < end)
  308. return -EPERM;
  309. }
  310. do {
  311. unsigned num_pages = ttm->num_pages - pinned;
  312. uint64_t userptr = gtt->userptr + pinned * PAGE_SIZE;
  313. struct page **pages = ttm->pages + pinned;
  314. r = get_user_pages(userptr, num_pages, write ? FOLL_WRITE : 0,
  315. pages);
  316. if (r < 0)
  317. goto release_pages;
  318. pinned += r;
  319. } while (pinned < ttm->num_pages);
  320. r = sg_alloc_table_from_pages(ttm->sg, ttm->pages, ttm->num_pages, 0,
  321. (u64)ttm->num_pages << PAGE_SHIFT,
  322. GFP_KERNEL);
  323. if (r)
  324. goto release_sg;
  325. r = dma_map_sgtable(rdev->dev, ttm->sg, direction, 0);
  326. if (r)
  327. goto release_sg;
  328. drm_prime_sg_to_dma_addr_array(ttm->sg, gtt->ttm.dma_address,
  329. ttm->num_pages);
  330. return 0;
  331. release_sg:
  332. kfree(ttm->sg);
  333. release_pages:
  334. release_pages(ttm->pages, pinned);
  335. return r;
  336. }
  337. static void radeon_ttm_tt_unpin_userptr(struct ttm_device *bdev, struct ttm_tt *ttm)
  338. {
  339. struct radeon_device *rdev = radeon_get_rdev(bdev);
  340. struct radeon_ttm_tt *gtt = (void *)ttm;
  341. struct sg_page_iter sg_iter;
  342. int write = !(gtt->userflags & RADEON_GEM_USERPTR_READONLY);
  343. enum dma_data_direction direction = write ?
  344. DMA_BIDIRECTIONAL : DMA_TO_DEVICE;
  345. /* double check that we don't free the table twice */
  346. if (!ttm->sg || !ttm->sg->sgl)
  347. return;
  348. /* free the sg table and pages again */
  349. dma_unmap_sgtable(rdev->dev, ttm->sg, direction, 0);
  350. for_each_sgtable_page(ttm->sg, &sg_iter, 0) {
  351. struct page *page = sg_page_iter_page(&sg_iter);
  352. if (!(gtt->userflags & RADEON_GEM_USERPTR_READONLY))
  353. set_page_dirty(page);
  354. mark_page_accessed(page);
  355. put_page(page);
  356. }
  357. sg_free_table(ttm->sg);
  358. }
  359. static bool radeon_ttm_backend_is_bound(struct ttm_tt *ttm)
  360. {
  361. struct radeon_ttm_tt *gtt = (void*)ttm;
  362. return (gtt->bound);
  363. }
  364. static int radeon_ttm_backend_bind(struct ttm_device *bdev,
  365. struct ttm_tt *ttm,
  366. struct ttm_resource *bo_mem)
  367. {
  368. struct radeon_ttm_tt *gtt = (void*)ttm;
  369. struct radeon_device *rdev = radeon_get_rdev(bdev);
  370. uint32_t flags = RADEON_GART_PAGE_VALID | RADEON_GART_PAGE_READ |
  371. RADEON_GART_PAGE_WRITE;
  372. int r;
  373. if (gtt->bound)
  374. return 0;
  375. if (gtt->userptr) {
  376. radeon_ttm_tt_pin_userptr(bdev, ttm);
  377. flags &= ~RADEON_GART_PAGE_WRITE;
  378. }
  379. gtt->offset = (unsigned long)(bo_mem->start << PAGE_SHIFT);
  380. if (!ttm->num_pages) {
  381. WARN(1, "nothing to bind %u pages for mreg %p back %p!\n",
  382. ttm->num_pages, bo_mem, ttm);
  383. }
  384. if (ttm->caching == ttm_cached)
  385. flags |= RADEON_GART_PAGE_SNOOP;
  386. r = radeon_gart_bind(rdev, gtt->offset, ttm->num_pages,
  387. ttm->pages, gtt->ttm.dma_address, flags);
  388. if (r) {
  389. DRM_ERROR("failed to bind %u pages at 0x%08X\n",
  390. ttm->num_pages, (unsigned)gtt->offset);
  391. return r;
  392. }
  393. gtt->bound = true;
  394. return 0;
  395. }
  396. static void radeon_ttm_backend_unbind(struct ttm_device *bdev, struct ttm_tt *ttm)
  397. {
  398. struct radeon_ttm_tt *gtt = (void *)ttm;
  399. struct radeon_device *rdev = radeon_get_rdev(bdev);
  400. if (gtt->userptr)
  401. radeon_ttm_tt_unpin_userptr(bdev, ttm);
  402. if (!gtt->bound)
  403. return;
  404. radeon_gart_unbind(rdev, gtt->offset, ttm->num_pages);
  405. gtt->bound = false;
  406. }
  407. static void radeon_ttm_backend_destroy(struct ttm_device *bdev, struct ttm_tt *ttm)
  408. {
  409. struct radeon_ttm_tt *gtt = (void *)ttm;
  410. ttm_tt_fini(&gtt->ttm);
  411. kfree(gtt);
  412. }
  413. static struct ttm_tt *radeon_ttm_tt_create(struct ttm_buffer_object *bo,
  414. uint32_t page_flags)
  415. {
  416. struct radeon_ttm_tt *gtt;
  417. enum ttm_caching caching;
  418. struct radeon_bo *rbo;
  419. #if IS_ENABLED(CONFIG_AGP)
  420. struct radeon_device *rdev = radeon_get_rdev(bo->bdev);
  421. if (rdev->flags & RADEON_IS_AGP) {
  422. return ttm_agp_tt_create(bo, rdev->agp->bridge, page_flags);
  423. }
  424. #endif
  425. rbo = container_of(bo, struct radeon_bo, tbo);
  426. gtt = kzalloc_obj(struct radeon_ttm_tt);
  427. if (gtt == NULL) {
  428. return NULL;
  429. }
  430. if (rbo->flags & RADEON_GEM_GTT_UC)
  431. caching = ttm_uncached;
  432. else if (rbo->flags & RADEON_GEM_GTT_WC)
  433. caching = ttm_write_combined;
  434. else
  435. caching = ttm_cached;
  436. if (ttm_sg_tt_init(&gtt->ttm, bo, page_flags, caching)) {
  437. kfree(gtt);
  438. return NULL;
  439. }
  440. return &gtt->ttm;
  441. }
  442. static struct radeon_ttm_tt *radeon_ttm_tt_to_gtt(struct radeon_device *rdev,
  443. struct ttm_tt *ttm)
  444. {
  445. #if IS_ENABLED(CONFIG_AGP)
  446. if (rdev->flags & RADEON_IS_AGP)
  447. return NULL;
  448. #endif
  449. if (!ttm)
  450. return NULL;
  451. return container_of(ttm, struct radeon_ttm_tt, ttm);
  452. }
  453. static int radeon_ttm_tt_populate(struct ttm_device *bdev,
  454. struct ttm_tt *ttm,
  455. struct ttm_operation_ctx *ctx)
  456. {
  457. struct radeon_device *rdev = radeon_get_rdev(bdev);
  458. struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(rdev, ttm);
  459. bool slave = !!(ttm->page_flags & TTM_TT_FLAG_EXTERNAL);
  460. if (gtt && gtt->userptr) {
  461. ttm->sg = kzalloc_obj(struct sg_table);
  462. if (!ttm->sg)
  463. return -ENOMEM;
  464. ttm->page_flags |= TTM_TT_FLAG_EXTERNAL;
  465. return 0;
  466. }
  467. if (slave && ttm->sg) {
  468. drm_prime_sg_to_dma_addr_array(ttm->sg, gtt->ttm.dma_address,
  469. ttm->num_pages);
  470. return 0;
  471. }
  472. return ttm_pool_alloc(&rdev->mman.bdev.pool, ttm, ctx);
  473. }
  474. static void radeon_ttm_tt_unpopulate(struct ttm_device *bdev, struct ttm_tt *ttm)
  475. {
  476. struct radeon_device *rdev = radeon_get_rdev(bdev);
  477. struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(rdev, ttm);
  478. bool slave = !!(ttm->page_flags & TTM_TT_FLAG_EXTERNAL);
  479. radeon_ttm_tt_unbind(bdev, ttm);
  480. if (gtt && gtt->userptr) {
  481. kfree(ttm->sg);
  482. ttm->page_flags &= ~TTM_TT_FLAG_EXTERNAL;
  483. return;
  484. }
  485. if (slave)
  486. return;
  487. return ttm_pool_free(&rdev->mman.bdev.pool, ttm);
  488. }
  489. int radeon_ttm_tt_set_userptr(struct radeon_device *rdev,
  490. struct ttm_tt *ttm, uint64_t addr,
  491. uint32_t flags)
  492. {
  493. struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(rdev, ttm);
  494. if (gtt == NULL)
  495. return -EINVAL;
  496. gtt->userptr = addr;
  497. gtt->usermm = current->mm;
  498. gtt->userflags = flags;
  499. return 0;
  500. }
  501. bool radeon_ttm_tt_is_bound(struct ttm_device *bdev,
  502. struct ttm_tt *ttm)
  503. {
  504. #if IS_ENABLED(CONFIG_AGP)
  505. struct radeon_device *rdev = radeon_get_rdev(bdev);
  506. if (rdev->flags & RADEON_IS_AGP)
  507. return ttm_agp_is_bound(ttm);
  508. #endif
  509. return radeon_ttm_backend_is_bound(ttm);
  510. }
  511. static int radeon_ttm_tt_bind(struct ttm_device *bdev,
  512. struct ttm_tt *ttm,
  513. struct ttm_resource *bo_mem)
  514. {
  515. #if IS_ENABLED(CONFIG_AGP)
  516. struct radeon_device *rdev = radeon_get_rdev(bdev);
  517. #endif
  518. if (!bo_mem)
  519. return -EINVAL;
  520. #if IS_ENABLED(CONFIG_AGP)
  521. if (rdev->flags & RADEON_IS_AGP)
  522. return ttm_agp_bind(ttm, bo_mem);
  523. #endif
  524. return radeon_ttm_backend_bind(bdev, ttm, bo_mem);
  525. }
  526. static void radeon_ttm_tt_unbind(struct ttm_device *bdev,
  527. struct ttm_tt *ttm)
  528. {
  529. #if IS_ENABLED(CONFIG_AGP)
  530. struct radeon_device *rdev = radeon_get_rdev(bdev);
  531. if (rdev->flags & RADEON_IS_AGP) {
  532. ttm_agp_unbind(ttm);
  533. return;
  534. }
  535. #endif
  536. radeon_ttm_backend_unbind(bdev, ttm);
  537. }
  538. static void radeon_ttm_tt_destroy(struct ttm_device *bdev,
  539. struct ttm_tt *ttm)
  540. {
  541. #if IS_ENABLED(CONFIG_AGP)
  542. struct radeon_device *rdev = radeon_get_rdev(bdev);
  543. if (rdev->flags & RADEON_IS_AGP) {
  544. ttm_agp_destroy(ttm);
  545. return;
  546. }
  547. #endif
  548. radeon_ttm_backend_destroy(bdev, ttm);
  549. }
  550. bool radeon_ttm_tt_has_userptr(struct radeon_device *rdev,
  551. struct ttm_tt *ttm)
  552. {
  553. struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(rdev, ttm);
  554. if (gtt == NULL)
  555. return false;
  556. return !!gtt->userptr;
  557. }
  558. bool radeon_ttm_tt_is_readonly(struct radeon_device *rdev,
  559. struct ttm_tt *ttm)
  560. {
  561. struct radeon_ttm_tt *gtt = radeon_ttm_tt_to_gtt(rdev, ttm);
  562. if (gtt == NULL)
  563. return false;
  564. return !!(gtt->userflags & RADEON_GEM_USERPTR_READONLY);
  565. }
  566. static struct ttm_device_funcs radeon_bo_driver = {
  567. .ttm_tt_create = &radeon_ttm_tt_create,
  568. .ttm_tt_populate = &radeon_ttm_tt_populate,
  569. .ttm_tt_unpopulate = &radeon_ttm_tt_unpopulate,
  570. .ttm_tt_destroy = &radeon_ttm_tt_destroy,
  571. .eviction_valuable = ttm_bo_eviction_valuable,
  572. .evict_flags = &radeon_evict_flags,
  573. .move = &radeon_bo_move,
  574. .io_mem_reserve = &radeon_ttm_io_mem_reserve,
  575. };
  576. int radeon_ttm_init(struct radeon_device *rdev)
  577. {
  578. int r;
  579. /* No others user of address space so set it to 0 */
  580. r = ttm_device_init(&rdev->mman.bdev, &radeon_bo_driver, rdev->dev,
  581. rdev_to_drm(rdev)->anon_inode->i_mapping,
  582. rdev_to_drm(rdev)->vma_offset_manager,
  583. (rdev->need_swiotlb ?
  584. TTM_ALLOCATION_POOL_USE_DMA_ALLOC : 0) |
  585. (dma_addressing_limited(&rdev->pdev->dev) ?
  586. TTM_ALLOCATION_POOL_USE_DMA32 : 0));
  587. if (r) {
  588. DRM_ERROR("failed initializing buffer object driver(%d).\n", r);
  589. return r;
  590. }
  591. rdev->mman.initialized = true;
  592. r = radeon_ttm_init_vram(rdev);
  593. if (r) {
  594. DRM_ERROR("Failed initializing VRAM heap.\n");
  595. return r;
  596. }
  597. /* Change the size here instead of the init above so only lpfn is affected */
  598. radeon_ttm_set_active_vram_size(rdev, rdev->mc.visible_vram_size);
  599. r = radeon_bo_create(rdev, 256 * 1024, PAGE_SIZE, true,
  600. RADEON_GEM_DOMAIN_VRAM, 0, NULL,
  601. NULL, &rdev->stolen_vga_memory);
  602. if (r) {
  603. return r;
  604. }
  605. r = radeon_bo_reserve(rdev->stolen_vga_memory, false);
  606. if (r)
  607. return r;
  608. r = radeon_bo_pin(rdev->stolen_vga_memory, RADEON_GEM_DOMAIN_VRAM, NULL);
  609. radeon_bo_unreserve(rdev->stolen_vga_memory);
  610. if (r) {
  611. radeon_bo_unref(&rdev->stolen_vga_memory);
  612. return r;
  613. }
  614. DRM_INFO("radeon: %uM of VRAM memory ready\n",
  615. (unsigned) (rdev->mc.real_vram_size / (1024 * 1024)));
  616. r = radeon_ttm_init_gtt(rdev);
  617. if (r) {
  618. DRM_ERROR("Failed initializing GTT heap.\n");
  619. return r;
  620. }
  621. DRM_INFO("radeon: %uM of GTT memory ready.\n",
  622. (unsigned)(rdev->mc.gtt_size / (1024 * 1024)));
  623. radeon_ttm_debugfs_init(rdev);
  624. return 0;
  625. }
  626. void radeon_ttm_fini(struct radeon_device *rdev)
  627. {
  628. int r;
  629. if (!rdev->mman.initialized)
  630. return;
  631. if (rdev->stolen_vga_memory) {
  632. r = radeon_bo_reserve(rdev->stolen_vga_memory, false);
  633. if (r == 0) {
  634. radeon_bo_unpin(rdev->stolen_vga_memory);
  635. radeon_bo_unreserve(rdev->stolen_vga_memory);
  636. }
  637. radeon_bo_unref(&rdev->stolen_vga_memory);
  638. }
  639. ttm_range_man_fini(&rdev->mman.bdev, TTM_PL_VRAM);
  640. ttm_range_man_fini(&rdev->mman.bdev, TTM_PL_TT);
  641. ttm_device_fini(&rdev->mman.bdev);
  642. radeon_gart_fini(rdev);
  643. rdev->mman.initialized = false;
  644. DRM_INFO("radeon: ttm finalized\n");
  645. }
  646. /* this should only be called at bootup or when userspace
  647. * isn't running */
  648. void radeon_ttm_set_active_vram_size(struct radeon_device *rdev, u64 size)
  649. {
  650. struct ttm_resource_manager *man;
  651. if (!rdev->mman.initialized)
  652. return;
  653. man = ttm_manager_type(&rdev->mman.bdev, TTM_PL_VRAM);
  654. /* this just adjusts TTM size idea, which sets lpfn to the correct value */
  655. man->size = size >> PAGE_SHIFT;
  656. }
  657. #if defined(CONFIG_DEBUG_FS)
  658. static int radeon_ttm_page_pool_show(struct seq_file *m, void *data)
  659. {
  660. struct radeon_device *rdev = m->private;
  661. return ttm_pool_debugfs(&rdev->mman.bdev.pool, m);
  662. }
  663. DEFINE_SHOW_ATTRIBUTE(radeon_ttm_page_pool);
  664. static int radeon_ttm_vram_open(struct inode *inode, struct file *filep)
  665. {
  666. struct radeon_device *rdev = inode->i_private;
  667. i_size_write(inode, rdev->mc.mc_vram_size);
  668. filep->private_data = inode->i_private;
  669. return 0;
  670. }
  671. static ssize_t radeon_ttm_vram_read(struct file *f, char __user *buf,
  672. size_t size, loff_t *pos)
  673. {
  674. struct radeon_device *rdev = f->private_data;
  675. ssize_t result = 0;
  676. int r;
  677. if (size & 0x3 || *pos & 0x3)
  678. return -EINVAL;
  679. while (size) {
  680. unsigned long flags;
  681. uint32_t value;
  682. if (*pos >= rdev->mc.mc_vram_size)
  683. return result;
  684. spin_lock_irqsave(&rdev->mmio_idx_lock, flags);
  685. WREG32(RADEON_MM_INDEX, ((uint32_t)*pos) | 0x80000000);
  686. if (rdev->family >= CHIP_CEDAR)
  687. WREG32(EVERGREEN_MM_INDEX_HI, *pos >> 31);
  688. value = RREG32(RADEON_MM_DATA);
  689. spin_unlock_irqrestore(&rdev->mmio_idx_lock, flags);
  690. r = put_user(value, (uint32_t __user *)buf);
  691. if (r)
  692. return r;
  693. result += 4;
  694. buf += 4;
  695. *pos += 4;
  696. size -= 4;
  697. }
  698. return result;
  699. }
  700. static const struct file_operations radeon_ttm_vram_fops = {
  701. .owner = THIS_MODULE,
  702. .open = radeon_ttm_vram_open,
  703. .read = radeon_ttm_vram_read,
  704. .llseek = default_llseek
  705. };
  706. static int radeon_ttm_gtt_open(struct inode *inode, struct file *filep)
  707. {
  708. struct radeon_device *rdev = inode->i_private;
  709. i_size_write(inode, rdev->mc.gtt_size);
  710. filep->private_data = inode->i_private;
  711. return 0;
  712. }
  713. static ssize_t radeon_ttm_gtt_read(struct file *f, char __user *buf,
  714. size_t size, loff_t *pos)
  715. {
  716. struct radeon_device *rdev = f->private_data;
  717. ssize_t result = 0;
  718. int r;
  719. while (size) {
  720. loff_t p = *pos / PAGE_SIZE;
  721. unsigned off = *pos & ~PAGE_MASK;
  722. size_t cur_size = min_t(size_t, size, PAGE_SIZE - off);
  723. struct page *page;
  724. void *ptr;
  725. if (p >= rdev->gart.num_cpu_pages)
  726. return result;
  727. page = rdev->gart.pages[p];
  728. if (page) {
  729. ptr = kmap_local_page(page);
  730. ptr += off;
  731. r = copy_to_user(buf, ptr, cur_size);
  732. kunmap_local(ptr);
  733. } else
  734. r = clear_user(buf, cur_size);
  735. if (r)
  736. return -EFAULT;
  737. result += cur_size;
  738. buf += cur_size;
  739. *pos += cur_size;
  740. size -= cur_size;
  741. }
  742. return result;
  743. }
  744. static const struct file_operations radeon_ttm_gtt_fops = {
  745. .owner = THIS_MODULE,
  746. .open = radeon_ttm_gtt_open,
  747. .read = radeon_ttm_gtt_read,
  748. .llseek = default_llseek
  749. };
  750. #endif
  751. static void radeon_ttm_debugfs_init(struct radeon_device *rdev)
  752. {
  753. #if defined(CONFIG_DEBUG_FS)
  754. struct drm_minor *minor = rdev_to_drm(rdev)->primary;
  755. struct dentry *root = minor->debugfs_root;
  756. debugfs_create_file("radeon_vram", 0444, root, rdev,
  757. &radeon_ttm_vram_fops);
  758. debugfs_create_file("radeon_gtt", 0444, root, rdev,
  759. &radeon_ttm_gtt_fops);
  760. debugfs_create_file("ttm_page_pool", 0444, root, rdev,
  761. &radeon_ttm_page_pool_fops);
  762. ttm_resource_manager_create_debugfs(ttm_manager_type(&rdev->mman.bdev,
  763. TTM_PL_VRAM),
  764. root, "radeon_vram_mm");
  765. ttm_resource_manager_create_debugfs(ttm_manager_type(&rdev->mman.bdev,
  766. TTM_PL_TT),
  767. root, "radeon_gtt_mm");
  768. #endif
  769. }