vmwgfx_page_dirty.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494
  1. // SPDX-License-Identifier: GPL-2.0 OR MIT
  2. /**************************************************************************
  3. *
  4. * Copyright (c) 2019-2025 Broadcom. All Rights Reserved. The term
  5. * “Broadcom” refers to Broadcom Inc. and/or its subsidiaries.
  6. *
  7. **************************************************************************/
  8. #include "vmwgfx_bo.h"
  9. #include "vmwgfx_drv.h"
  10. /*
  11. * Methods for tracking which pages of a buffer object are dirty:
  12. * VMW_BO_DIRTY_PAGETABLE - Scan the pagetable for hardware dirty bits
  13. * VMW_BO_DIRTY_MKWRITE - Write-protect page table entries and record write-
  14. * accesses in the VM mkwrite() callback
  15. */
  16. enum vmw_bo_dirty_method {
  17. VMW_BO_DIRTY_PAGETABLE,
  18. VMW_BO_DIRTY_MKWRITE,
  19. };
  20. /*
  21. * A scan that finds no dirtied pages is a trigger towards the _MKWRITE
  22. * method; a scan where more than VMW_DIRTY_PERCENTAGE percent of the pages
  23. * were dirtied is a trigger towards the _PAGETABLE method. The method is
  24. * changed once the number of consecutive triggers exceeds this value.
  25. */
  26. #define VMW_DIRTY_NUM_CHANGE_TRIGGERS 2
  27. /* Percentage of pages that must be exceeded to count as a _PAGETABLE trigger */
  28. #define VMW_DIRTY_PERCENTAGE 10
  29. /**
  30. * struct vmw_bo_dirty - Dirty information for buffer objects
  31. * @ref_count: Reference count for this structure. Must be first member!
  32. * @start: First currently dirty bit. Nothing is dirty when @start >= @end.
  33. * @end: Last currently dirty bit + 1
  34. * @method: The currently used dirty method
  35. * @change_count: Number of consecutive method change triggers
  36. * @bitmap_size: The size of the bitmap in bits. Typically equal to the
  37. * number of pages in the bo.
  38. * @bitmap: A bitmap where each bit represents a page. A set bit means a
  39. * dirty page.
  40. */
  41. struct vmw_bo_dirty {
  42. struct kref ref_count;
  43. unsigned long start;
  44. unsigned long end;
  45. enum vmw_bo_dirty_method method;
  46. unsigned int change_count;
  47. unsigned long bitmap_size;
  48. unsigned long bitmap[];
  49. };
  50. bool vmw_bo_is_dirty(struct vmw_bo *vbo)
  51. {
  52. return vbo->dirty && (vbo->dirty->start < vbo->dirty->end);
  53. }
  54. /**
  55. * vmw_bo_dirty_scan_pagetable - Perform a pagetable scan for dirty bits
  56. * @vbo: The buffer object to scan
  57. *
  58. * Scans the pagetable for dirty bits. Clear those bits and modify the
  59. * dirty structure with the results. This function may change the
  60. * dirty-tracking method.
  61. */
  62. static void vmw_bo_dirty_scan_pagetable(struct vmw_bo *vbo)
  63. {
  64. struct vmw_bo_dirty *dirty = vbo->dirty;
  65. pgoff_t offset = drm_vma_node_start(&vbo->tbo.base.vma_node);
  66. struct address_space *mapping = vbo->tbo.bdev->dev_mapping;
  67. pgoff_t num_marked;
  68. num_marked = clean_record_shared_mapping_range
  69. (mapping,
  70. offset, dirty->bitmap_size,
  71. offset, &dirty->bitmap[0],
  72. &dirty->start, &dirty->end);
  73. if (num_marked == 0)
  74. dirty->change_count++;
  75. else
  76. dirty->change_count = 0;
  77. if (dirty->change_count > VMW_DIRTY_NUM_CHANGE_TRIGGERS) {
  78. dirty->change_count = 0;
  79. dirty->method = VMW_BO_DIRTY_MKWRITE;
  80. wp_shared_mapping_range(mapping,
  81. offset, dirty->bitmap_size);
  82. clean_record_shared_mapping_range(mapping,
  83. offset, dirty->bitmap_size,
  84. offset, &dirty->bitmap[0],
  85. &dirty->start, &dirty->end);
  86. }
  87. }
  88. /**
  89. * vmw_bo_dirty_scan_mkwrite - Reset the mkwrite dirty-tracking method
  90. * @vbo: The buffer object to scan
  91. *
  92. * Write-protect pages written to so that consecutive write accesses will
  93. * trigger a call to mkwrite.
  94. *
  95. * This function may change the dirty-tracking method.
  96. */
  97. static void vmw_bo_dirty_scan_mkwrite(struct vmw_bo *vbo)
  98. {
  99. struct vmw_bo_dirty *dirty = vbo->dirty;
  100. unsigned long offset = drm_vma_node_start(&vbo->tbo.base.vma_node);
  101. struct address_space *mapping = vbo->tbo.bdev->dev_mapping;
  102. pgoff_t num_marked;
  103. if (dirty->end <= dirty->start)
  104. return;
  105. num_marked = wp_shared_mapping_range(vbo->tbo.bdev->dev_mapping,
  106. dirty->start + offset,
  107. dirty->end - dirty->start);
  108. if (100UL * num_marked / dirty->bitmap_size >
  109. VMW_DIRTY_PERCENTAGE)
  110. dirty->change_count++;
  111. else
  112. dirty->change_count = 0;
  113. if (dirty->change_count > VMW_DIRTY_NUM_CHANGE_TRIGGERS) {
  114. pgoff_t start = 0;
  115. pgoff_t end = dirty->bitmap_size;
  116. dirty->method = VMW_BO_DIRTY_PAGETABLE;
  117. clean_record_shared_mapping_range(mapping, offset, end, offset,
  118. &dirty->bitmap[0],
  119. &start, &end);
  120. bitmap_clear(&dirty->bitmap[0], 0, dirty->bitmap_size);
  121. if (dirty->start < dirty->end)
  122. bitmap_set(&dirty->bitmap[0], dirty->start,
  123. dirty->end - dirty->start);
  124. dirty->change_count = 0;
  125. }
  126. }
  127. /**
  128. * vmw_bo_dirty_scan - Scan for dirty pages and add them to the dirty
  129. * tracking structure
  130. * @vbo: The buffer object to scan
  131. *
  132. * This function may change the dirty tracking method.
  133. */
  134. void vmw_bo_dirty_scan(struct vmw_bo *vbo)
  135. {
  136. struct vmw_bo_dirty *dirty = vbo->dirty;
  137. if (dirty->method == VMW_BO_DIRTY_PAGETABLE)
  138. vmw_bo_dirty_scan_pagetable(vbo);
  139. else
  140. vmw_bo_dirty_scan_mkwrite(vbo);
  141. }
  142. /**
  143. * vmw_bo_dirty_pre_unmap - write-protect and pick up dirty pages before
  144. * an unmap_mapping_range operation.
  145. * @vbo: The buffer object,
  146. * @start: First page of the range within the buffer object.
  147. * @end: Last page of the range within the buffer object + 1.
  148. *
  149. * If we're using the _PAGETABLE scan method, we may leak dirty pages
  150. * when calling unmap_mapping_range(). This function makes sure we pick
  151. * up all dirty pages.
  152. */
  153. static void vmw_bo_dirty_pre_unmap(struct vmw_bo *vbo,
  154. pgoff_t start, pgoff_t end)
  155. {
  156. struct vmw_bo_dirty *dirty = vbo->dirty;
  157. unsigned long offset = drm_vma_node_start(&vbo->tbo.base.vma_node);
  158. struct address_space *mapping = vbo->tbo.bdev->dev_mapping;
  159. if (dirty->method != VMW_BO_DIRTY_PAGETABLE || start >= end)
  160. return;
  161. wp_shared_mapping_range(mapping, start + offset, end - start);
  162. clean_record_shared_mapping_range(mapping, start + offset,
  163. end - start, offset,
  164. &dirty->bitmap[0], &dirty->start,
  165. &dirty->end);
  166. }
  167. /**
  168. * vmw_bo_dirty_unmap - Clear all ptes pointing to a range within a bo
  169. * @vbo: The buffer object,
  170. * @start: First page of the range within the buffer object.
  171. * @end: Last page of the range within the buffer object + 1.
  172. *
  173. * This is similar to ttm_bo_unmap_virtual() except it takes a subrange.
  174. */
  175. void vmw_bo_dirty_unmap(struct vmw_bo *vbo,
  176. pgoff_t start, pgoff_t end)
  177. {
  178. unsigned long offset = drm_vma_node_start(&vbo->tbo.base.vma_node);
  179. struct address_space *mapping = vbo->tbo.bdev->dev_mapping;
  180. vmw_bo_dirty_pre_unmap(vbo, start, end);
  181. unmap_shared_mapping_range(mapping, (offset + start) << PAGE_SHIFT,
  182. (loff_t) (end - start) << PAGE_SHIFT);
  183. }
  184. /**
  185. * vmw_bo_dirty_add - Add a dirty-tracking user to a buffer object
  186. * @vbo: The buffer object
  187. *
  188. * This function registers a dirty-tracking user to a buffer object.
  189. * A user can be for example a resource or a vma in a special user-space
  190. * mapping.
  191. *
  192. * Return: Zero on success, -ENOMEM on memory allocation failure.
  193. */
  194. int vmw_bo_dirty_add(struct vmw_bo *vbo)
  195. {
  196. struct vmw_bo_dirty *dirty = vbo->dirty;
  197. pgoff_t num_pages = PFN_UP(vbo->tbo.resource->size);
  198. size_t size;
  199. int ret;
  200. if (dirty) {
  201. kref_get(&dirty->ref_count);
  202. return 0;
  203. }
  204. size = sizeof(*dirty) + BITS_TO_LONGS(num_pages) * sizeof(long);
  205. dirty = kvzalloc(size, GFP_KERNEL);
  206. if (!dirty) {
  207. ret = -ENOMEM;
  208. goto out_no_dirty;
  209. }
  210. dirty->bitmap_size = num_pages;
  211. dirty->start = dirty->bitmap_size;
  212. dirty->end = 0;
  213. kref_init(&dirty->ref_count);
  214. if (num_pages < PAGE_SIZE / sizeof(pte_t)) {
  215. dirty->method = VMW_BO_DIRTY_PAGETABLE;
  216. } else {
  217. struct address_space *mapping = vbo->tbo.bdev->dev_mapping;
  218. pgoff_t offset = drm_vma_node_start(&vbo->tbo.base.vma_node);
  219. dirty->method = VMW_BO_DIRTY_MKWRITE;
  220. /* Write-protect and then pick up already dirty bits */
  221. wp_shared_mapping_range(mapping, offset, num_pages);
  222. clean_record_shared_mapping_range(mapping, offset, num_pages,
  223. offset,
  224. &dirty->bitmap[0],
  225. &dirty->start, &dirty->end);
  226. }
  227. vbo->dirty = dirty;
  228. return 0;
  229. out_no_dirty:
  230. return ret;
  231. }
  232. static void vmw_bo_dirty_free(struct kref *kref)
  233. {
  234. struct vmw_bo_dirty *dirty = container_of(kref, struct vmw_bo_dirty, ref_count);
  235. kvfree(dirty);
  236. }
  237. /**
  238. * vmw_bo_dirty_release - Release a dirty-tracking user from a buffer object
  239. * @vbo: The buffer object
  240. *
  241. * This function releases a dirty-tracking user from a buffer object.
  242. * If the reference count reaches zero, then the dirty-tracking object is
  243. * freed and the pointer to it cleared.
  244. *
  245. * Return: Zero on success, -ENOMEM on memory allocation failure.
  246. */
  247. void vmw_bo_dirty_release(struct vmw_bo *vbo)
  248. {
  249. struct vmw_bo_dirty *dirty = vbo->dirty;
  250. if (dirty && kref_put(&dirty->ref_count, vmw_bo_dirty_free))
  251. vbo->dirty = NULL;
  252. }
  253. /**
  254. * vmw_bo_dirty_transfer_to_res - Pick up a resource's dirty region from
  255. * its backing mob.
  256. * @res: The resource
  257. *
  258. * This function will pick up all dirty ranges affecting the resource from
  259. * it's backup mob, and call vmw_resource_dirty_update() once for each
  260. * range. The transferred ranges will be cleared from the backing mob's
  261. * dirty tracking.
  262. */
  263. void vmw_bo_dirty_transfer_to_res(struct vmw_resource *res)
  264. {
  265. struct vmw_bo *vbo = res->guest_memory_bo;
  266. struct vmw_bo_dirty *dirty = vbo->dirty;
  267. pgoff_t start, cur, end;
  268. unsigned long res_start = res->guest_memory_offset;
  269. unsigned long res_end = res->guest_memory_offset + res->guest_memory_size;
  270. WARN_ON_ONCE(res_start & ~PAGE_MASK);
  271. res_start >>= PAGE_SHIFT;
  272. res_end = DIV_ROUND_UP(res_end, PAGE_SIZE);
  273. if (res_start >= dirty->end || res_end <= dirty->start)
  274. return;
  275. cur = max(res_start, dirty->start);
  276. res_end = max(res_end, dirty->end);
  277. while (cur < res_end) {
  278. unsigned long num;
  279. start = find_next_bit(&dirty->bitmap[0], res_end, cur);
  280. if (start >= res_end)
  281. break;
  282. end = find_next_zero_bit(&dirty->bitmap[0], res_end, start + 1);
  283. cur = end + 1;
  284. num = end - start;
  285. bitmap_clear(&dirty->bitmap[0], start, num);
  286. vmw_resource_dirty_update(res, start, end);
  287. }
  288. if (res_start <= dirty->start && res_end > dirty->start)
  289. dirty->start = res_end;
  290. if (res_start < dirty->end && res_end >= dirty->end)
  291. dirty->end = res_start;
  292. }
  293. void vmw_bo_dirty_clear(struct vmw_bo *vbo)
  294. {
  295. struct vmw_bo_dirty *dirty = vbo->dirty;
  296. pgoff_t start, cur, end;
  297. unsigned long res_start = 0;
  298. unsigned long res_end = vbo->tbo.base.size;
  299. WARN_ON_ONCE(res_start & ~PAGE_MASK);
  300. res_start >>= PAGE_SHIFT;
  301. res_end = DIV_ROUND_UP(res_end, PAGE_SIZE);
  302. if (res_start >= dirty->end || res_end <= dirty->start)
  303. return;
  304. cur = max(res_start, dirty->start);
  305. res_end = max(res_end, dirty->end);
  306. while (cur < res_end) {
  307. unsigned long num;
  308. start = find_next_bit(&dirty->bitmap[0], res_end, cur);
  309. if (start >= res_end)
  310. break;
  311. end = find_next_zero_bit(&dirty->bitmap[0], res_end, start + 1);
  312. cur = end + 1;
  313. num = end - start;
  314. bitmap_clear(&dirty->bitmap[0], start, num);
  315. }
  316. if (res_start <= dirty->start && res_end > dirty->start)
  317. dirty->start = res_end;
  318. if (res_start < dirty->end && res_end >= dirty->end)
  319. dirty->end = res_start;
  320. }
  321. /**
  322. * vmw_bo_dirty_clear_res - Clear a resource's dirty region from
  323. * its backing mob.
  324. * @res: The resource
  325. *
  326. * This function will clear all dirty ranges affecting the resource from
  327. * it's backup mob's dirty tracking.
  328. */
  329. void vmw_bo_dirty_clear_res(struct vmw_resource *res)
  330. {
  331. unsigned long res_start = res->guest_memory_offset;
  332. unsigned long res_end = res->guest_memory_offset + res->guest_memory_size;
  333. struct vmw_bo *vbo = res->guest_memory_bo;
  334. struct vmw_bo_dirty *dirty = vbo->dirty;
  335. res_start >>= PAGE_SHIFT;
  336. res_end = DIV_ROUND_UP(res_end, PAGE_SIZE);
  337. if (res_start >= dirty->end || res_end <= dirty->start)
  338. return;
  339. res_start = max(res_start, dirty->start);
  340. res_end = min(res_end, dirty->end);
  341. bitmap_clear(&dirty->bitmap[0], res_start, res_end - res_start);
  342. if (res_start <= dirty->start && res_end > dirty->start)
  343. dirty->start = res_end;
  344. if (res_start < dirty->end && res_end >= dirty->end)
  345. dirty->end = res_start;
  346. }
  347. vm_fault_t vmw_bo_vm_mkwrite(struct vm_fault *vmf)
  348. {
  349. struct vm_area_struct *vma = vmf->vma;
  350. struct ttm_buffer_object *bo = (struct ttm_buffer_object *)
  351. vma->vm_private_data;
  352. vm_fault_t ret;
  353. unsigned long page_offset;
  354. unsigned int save_flags;
  355. struct vmw_bo *vbo = to_vmw_bo(&bo->base);
  356. /*
  357. * mkwrite() doesn't handle the VM_FAULT_RETRY return value correctly.
  358. * So make sure the TTM helpers are aware.
  359. */
  360. save_flags = vmf->flags;
  361. vmf->flags &= ~FAULT_FLAG_ALLOW_RETRY;
  362. ret = ttm_bo_vm_reserve(bo, vmf);
  363. vmf->flags = save_flags;
  364. if (ret)
  365. return ret;
  366. page_offset = vmf->pgoff - drm_vma_node_start(&bo->base.vma_node);
  367. if (unlikely(page_offset >= PFN_UP(bo->resource->size))) {
  368. ret = VM_FAULT_SIGBUS;
  369. goto out_unlock;
  370. }
  371. if (vbo->dirty && vbo->dirty->method == VMW_BO_DIRTY_MKWRITE &&
  372. !test_bit(page_offset, &vbo->dirty->bitmap[0])) {
  373. struct vmw_bo_dirty *dirty = vbo->dirty;
  374. __set_bit(page_offset, &dirty->bitmap[0]);
  375. dirty->start = min(dirty->start, page_offset);
  376. dirty->end = max(dirty->end, page_offset + 1);
  377. }
  378. out_unlock:
  379. dma_resv_unlock(bo->base.resv);
  380. return ret;
  381. }
  382. vm_fault_t vmw_bo_vm_fault(struct vm_fault *vmf)
  383. {
  384. struct vm_area_struct *vma = vmf->vma;
  385. struct ttm_buffer_object *bo = (struct ttm_buffer_object *)
  386. vma->vm_private_data;
  387. struct vmw_bo *vbo = to_vmw_bo(&bo->base);
  388. pgoff_t num_prefault;
  389. pgprot_t prot;
  390. vm_fault_t ret;
  391. ret = ttm_bo_vm_reserve(bo, vmf);
  392. if (ret)
  393. return ret;
  394. num_prefault = (vma->vm_flags & VM_RAND_READ) ? 1 :
  395. TTM_BO_VM_NUM_PREFAULT;
  396. if (vbo->dirty) {
  397. pgoff_t allowed_prefault;
  398. unsigned long page_offset;
  399. page_offset = vmf->pgoff -
  400. drm_vma_node_start(&bo->base.vma_node);
  401. if (page_offset >= PFN_UP(bo->resource->size) ||
  402. vmw_resources_clean(vbo, page_offset,
  403. page_offset + PAGE_SIZE,
  404. &allowed_prefault)) {
  405. ret = VM_FAULT_SIGBUS;
  406. goto out_unlock;
  407. }
  408. num_prefault = min(num_prefault, allowed_prefault);
  409. }
  410. /*
  411. * If we don't track dirty using the MKWRITE method, make sure
  412. * sure the page protection is write-enabled so we don't get
  413. * a lot of unnecessary write faults.
  414. */
  415. if (vbo->dirty && vbo->dirty->method == VMW_BO_DIRTY_MKWRITE)
  416. prot = vm_get_page_prot(vma->vm_flags & ~VM_SHARED);
  417. else
  418. prot = vm_get_page_prot(vma->vm_flags);
  419. ret = ttm_bo_vm_fault_reserved(vmf, prot, num_prefault);
  420. if (ret == VM_FAULT_RETRY && !(vmf->flags & FAULT_FLAG_RETRY_NOWAIT))
  421. return ret;
  422. out_unlock:
  423. dma_resv_unlock(bo->base.resv);
  424. return ret;
  425. }