iterator.c 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293
  1. // SPDX-License-Identifier: GPL-2.0-or-later
  2. /* Iterator helpers.
  3. *
  4. * Copyright (C) 2022 Red Hat, Inc. All Rights Reserved.
  5. * Written by David Howells (dhowells@redhat.com)
  6. */
  7. #include <linux/export.h>
  8. #include <linux/slab.h>
  9. #include <linux/mm.h>
  10. #include <linux/uio.h>
  11. #include <linux/scatterlist.h>
  12. #include <linux/netfs.h>
  13. #include "internal.h"
  14. /**
  15. * netfs_extract_user_iter - Extract the pages from a user iterator into a bvec
  16. * @orig: The original iterator
  17. * @orig_len: The amount of iterator to copy
  18. * @new: The iterator to be set up
  19. * @extraction_flags: Flags to qualify the request
  20. *
  21. * Extract the page fragments from the given amount of the source iterator and
  22. * build up a second iterator that refers to all of those bits. This allows
  23. * the original iterator to disposed of.
  24. *
  25. * @extraction_flags can have ITER_ALLOW_P2PDMA set to request peer-to-peer DMA be
  26. * allowed on the pages extracted.
  27. *
  28. * On success, the number of elements in the bvec is returned, the original
  29. * iterator will have been advanced by the amount extracted.
  30. *
  31. * The iov_iter_extract_mode() function should be used to query how cleanup
  32. * should be performed.
  33. */
  34. ssize_t netfs_extract_user_iter(struct iov_iter *orig, size_t orig_len,
  35. struct iov_iter *new,
  36. iov_iter_extraction_t extraction_flags)
  37. {
  38. struct bio_vec *bv = NULL;
  39. struct page **pages;
  40. unsigned int cur_npages;
  41. unsigned int max_pages;
  42. unsigned int npages = 0;
  43. unsigned int i;
  44. ssize_t ret;
  45. size_t count = orig_len, offset, len;
  46. size_t bv_size, pg_size;
  47. if (WARN_ON_ONCE(!iter_is_ubuf(orig) && !iter_is_iovec(orig)))
  48. return -EIO;
  49. max_pages = iov_iter_npages(orig, INT_MAX);
  50. bv_size = array_size(max_pages, sizeof(*bv));
  51. bv = kvmalloc(bv_size, GFP_KERNEL);
  52. if (!bv)
  53. return -ENOMEM;
  54. /* Put the page list at the end of the bvec list storage. bvec
  55. * elements are larger than page pointers, so as long as we work
  56. * 0->last, we should be fine.
  57. */
  58. pg_size = array_size(max_pages, sizeof(*pages));
  59. pages = (void *)bv + bv_size - pg_size;
  60. while (count && npages < max_pages) {
  61. ret = iov_iter_extract_pages(orig, &pages, count,
  62. max_pages - npages, extraction_flags,
  63. &offset);
  64. if (ret < 0) {
  65. pr_err("Couldn't get user pages (rc=%zd)\n", ret);
  66. break;
  67. }
  68. if (ret > count) {
  69. pr_err("get_pages rc=%zd more than %zu\n", ret, count);
  70. break;
  71. }
  72. count -= ret;
  73. ret += offset;
  74. cur_npages = DIV_ROUND_UP(ret, PAGE_SIZE);
  75. if (npages + cur_npages > max_pages) {
  76. pr_err("Out of bvec array capacity (%u vs %u)\n",
  77. npages + cur_npages, max_pages);
  78. break;
  79. }
  80. for (i = 0; i < cur_npages; i++) {
  81. len = ret > PAGE_SIZE ? PAGE_SIZE : ret;
  82. bvec_set_page(bv + npages + i, *pages++, len - offset, offset);
  83. ret -= len;
  84. offset = 0;
  85. }
  86. npages += cur_npages;
  87. }
  88. iov_iter_bvec(new, orig->data_source, bv, npages, orig_len - count);
  89. return npages;
  90. }
  91. EXPORT_SYMBOL_GPL(netfs_extract_user_iter);
  92. /*
  93. * Select the span of a bvec iterator we're going to use. Limit it by both maximum
  94. * size and maximum number of segments. Returns the size of the span in bytes.
  95. */
  96. static size_t netfs_limit_bvec(const struct iov_iter *iter, size_t start_offset,
  97. size_t max_size, size_t max_segs)
  98. {
  99. const struct bio_vec *bvecs = iter->bvec;
  100. unsigned int nbv = iter->nr_segs, ix = 0, nsegs = 0;
  101. size_t len, span = 0, n = iter->count;
  102. size_t skip = iter->iov_offset + start_offset;
  103. if (WARN_ON(!iov_iter_is_bvec(iter)) ||
  104. WARN_ON(start_offset > n) ||
  105. n == 0)
  106. return 0;
  107. while (n && ix < nbv && skip) {
  108. len = bvecs[ix].bv_len;
  109. if (skip < len)
  110. break;
  111. skip -= len;
  112. n -= len;
  113. ix++;
  114. }
  115. while (n && ix < nbv) {
  116. len = min3(n, bvecs[ix].bv_len - skip, max_size);
  117. span += len;
  118. nsegs++;
  119. ix++;
  120. if (span >= max_size || nsegs >= max_segs)
  121. break;
  122. skip = 0;
  123. n -= len;
  124. }
  125. return min(span, max_size);
  126. }
  127. /*
  128. * Select the span of a kvec iterator we're going to use. Limit it by both
  129. * maximum size and maximum number of segments. Returns the size of the span
  130. * in bytes.
  131. */
  132. static size_t netfs_limit_kvec(const struct iov_iter *iter, size_t start_offset,
  133. size_t max_size, size_t max_segs)
  134. {
  135. const struct kvec *kvecs = iter->kvec;
  136. unsigned int nkv = iter->nr_segs, ix = 0, nsegs = 0;
  137. size_t len, span = 0, n = iter->count;
  138. size_t skip = iter->iov_offset + start_offset;
  139. if (WARN_ON(!iov_iter_is_kvec(iter)) ||
  140. WARN_ON(start_offset > n) ||
  141. n == 0)
  142. return 0;
  143. while (n && ix < nkv && skip) {
  144. len = kvecs[ix].iov_len;
  145. if (skip < len)
  146. break;
  147. skip -= len;
  148. n -= len;
  149. ix++;
  150. }
  151. while (n && ix < nkv) {
  152. len = min3(n, kvecs[ix].iov_len - skip, max_size);
  153. span += len;
  154. nsegs++;
  155. ix++;
  156. if (span >= max_size || nsegs >= max_segs)
  157. break;
  158. skip = 0;
  159. n -= len;
  160. }
  161. return min(span, max_size);
  162. }
  163. /*
  164. * Select the span of an xarray iterator we're going to use. Limit it by both
  165. * maximum size and maximum number of segments. It is assumed that segments
  166. * can be larger than a page in size, provided they're physically contiguous.
  167. * Returns the size of the span in bytes.
  168. */
  169. static size_t netfs_limit_xarray(const struct iov_iter *iter, size_t start_offset,
  170. size_t max_size, size_t max_segs)
  171. {
  172. struct folio *folio;
  173. unsigned int nsegs = 0;
  174. loff_t pos = iter->xarray_start + iter->iov_offset;
  175. pgoff_t index = pos / PAGE_SIZE;
  176. size_t span = 0, n = iter->count;
  177. XA_STATE(xas, iter->xarray, index);
  178. if (WARN_ON(!iov_iter_is_xarray(iter)) ||
  179. WARN_ON(start_offset > n) ||
  180. n == 0)
  181. return 0;
  182. max_size = min(max_size, n - start_offset);
  183. rcu_read_lock();
  184. xas_for_each(&xas, folio, ULONG_MAX) {
  185. size_t offset, flen, len;
  186. if (xas_retry(&xas, folio))
  187. continue;
  188. if (WARN_ON(xa_is_value(folio)))
  189. break;
  190. if (WARN_ON(folio_test_hugetlb(folio)))
  191. break;
  192. flen = folio_size(folio);
  193. offset = offset_in_folio(folio, pos);
  194. len = min(max_size, flen - offset);
  195. span += len;
  196. nsegs++;
  197. if (span >= max_size || nsegs >= max_segs)
  198. break;
  199. }
  200. rcu_read_unlock();
  201. return min(span, max_size);
  202. }
  203. /*
  204. * Select the span of a folio queue iterator we're going to use. Limit it by
  205. * both maximum size and maximum number of segments. Returns the size of the
  206. * span in bytes.
  207. */
  208. static size_t netfs_limit_folioq(const struct iov_iter *iter, size_t start_offset,
  209. size_t max_size, size_t max_segs)
  210. {
  211. const struct folio_queue *folioq = iter->folioq;
  212. unsigned int nsegs = 0;
  213. unsigned int slot = iter->folioq_slot;
  214. size_t span = 0, n = iter->count;
  215. if (WARN_ON(!iov_iter_is_folioq(iter)) ||
  216. WARN_ON(start_offset > n) ||
  217. n == 0)
  218. return 0;
  219. max_size = umin(max_size, n - start_offset);
  220. if (slot >= folioq_nr_slots(folioq)) {
  221. folioq = folioq->next;
  222. slot = 0;
  223. }
  224. start_offset += iter->iov_offset;
  225. do {
  226. size_t flen = folioq_folio_size(folioq, slot);
  227. if (start_offset < flen) {
  228. span += flen - start_offset;
  229. nsegs++;
  230. start_offset = 0;
  231. } else {
  232. start_offset -= flen;
  233. }
  234. if (span >= max_size || nsegs >= max_segs)
  235. break;
  236. slot++;
  237. if (slot >= folioq_nr_slots(folioq)) {
  238. folioq = folioq->next;
  239. slot = 0;
  240. }
  241. } while (folioq);
  242. return umin(span, max_size);
  243. }
  244. size_t netfs_limit_iter(const struct iov_iter *iter, size_t start_offset,
  245. size_t max_size, size_t max_segs)
  246. {
  247. if (iov_iter_is_folioq(iter))
  248. return netfs_limit_folioq(iter, start_offset, max_size, max_segs);
  249. if (iov_iter_is_bvec(iter))
  250. return netfs_limit_bvec(iter, start_offset, max_size, max_segs);
  251. if (iov_iter_is_xarray(iter))
  252. return netfs_limit_xarray(iter, start_offset, max_size, max_segs);
  253. if (iov_iter_is_kvec(iter))
  254. return netfs_limit_kvec(iter, start_offset, max_size, max_segs);
  255. BUG();
  256. }
  257. EXPORT_SYMBOL(netfs_limit_iter);