scatterlist.c 37 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (C) 2007 Jens Axboe <jens.axboe@oracle.com>
  4. *
  5. * Scatterlist handling helpers.
  6. */
  7. #include <linux/export.h>
  8. #include <linux/slab.h>
  9. #include <linux/scatterlist.h>
  10. #include <linux/highmem.h>
  11. #include <linux/kmemleak.h>
  12. #include <linux/bvec.h>
  13. #include <linux/uio.h>
  14. #include <linux/folio_queue.h>
  15. /**
  16. * sg_nents - return total count of entries in scatterlist
  17. * @sg: The scatterlist
  18. *
  19. * Description:
  20. * Allows to know how many entries are in sg, taking into account
  21. * chaining as well
  22. *
  23. **/
  24. int sg_nents(struct scatterlist *sg)
  25. {
  26. int nents;
  27. for (nents = 0; sg; sg = sg_next(sg))
  28. nents++;
  29. return nents;
  30. }
  31. EXPORT_SYMBOL(sg_nents);
  32. /**
  33. * sg_nents_for_len - return total count of entries in scatterlist
  34. * needed to satisfy the supplied length
  35. * @sg: The scatterlist
  36. * @len: The total required length
  37. *
  38. * Description:
  39. * Determines the number of entries in sg that are required to meet
  40. * the supplied length, taking into account chaining as well
  41. *
  42. * Returns:
  43. * the number of sg entries needed, negative error on failure
  44. *
  45. **/
  46. int sg_nents_for_len(struct scatterlist *sg, u64 len)
  47. {
  48. int nents;
  49. u64 total;
  50. if (!len)
  51. return 0;
  52. for (nents = 0, total = 0; sg; sg = sg_next(sg)) {
  53. nents++;
  54. total += sg->length;
  55. if (total >= len)
  56. return nents;
  57. }
  58. return -EINVAL;
  59. }
  60. EXPORT_SYMBOL(sg_nents_for_len);
  61. /**
  62. * sg_nents_for_dma - return the count of DMA-capable entries in scatterlist
  63. * @sgl: The scatterlist
  64. * @sglen: The current number of entries
  65. * @len: The maximum length of DMA-capable block
  66. *
  67. * Description:
  68. * Determines the number of entries in @sgl which would be permitted in
  69. * DMA-capable transfer if list had been split accordingly, taking into
  70. * account chaining as well.
  71. *
  72. * Returns:
  73. * the number of sgl entries needed
  74. *
  75. **/
  76. int sg_nents_for_dma(struct scatterlist *sgl, unsigned int sglen, size_t len)
  77. {
  78. struct scatterlist *sg;
  79. int i, nents = 0;
  80. for_each_sg(sgl, sg, sglen, i)
  81. nents += DIV_ROUND_UP(sg_dma_len(sg), len);
  82. return nents;
  83. }
  84. EXPORT_SYMBOL(sg_nents_for_dma);
  85. /**
  86. * sg_last - return the last scatterlist entry in a list
  87. * @sgl: First entry in the scatterlist
  88. * @nents: Number of entries in the scatterlist
  89. *
  90. * Description:
  91. * Should only be used casually, it (currently) scans the entire list
  92. * to get the last entry.
  93. *
  94. * Note that the @sgl pointer passed in need not be the first one,
  95. * the important bit is that @nents denotes the number of entries that
  96. * exist from @sgl.
  97. *
  98. **/
  99. struct scatterlist *sg_last(struct scatterlist *sgl, unsigned int nents)
  100. {
  101. struct scatterlist *sg, *ret = NULL;
  102. unsigned int i;
  103. for_each_sg(sgl, sg, nents, i)
  104. ret = sg;
  105. BUG_ON(!sg_is_last(ret));
  106. return ret;
  107. }
  108. EXPORT_SYMBOL(sg_last);
  109. /**
  110. * sg_init_table - Initialize SG table
  111. * @sgl: The SG table
  112. * @nents: Number of entries in table
  113. *
  114. * Notes:
  115. * If this is part of a chained sg table, sg_mark_end() should be
  116. * used only on the last table part.
  117. *
  118. **/
  119. void sg_init_table(struct scatterlist *sgl, unsigned int nents)
  120. {
  121. memset(sgl, 0, sizeof(*sgl) * nents);
  122. sg_init_marker(sgl, nents);
  123. }
  124. EXPORT_SYMBOL(sg_init_table);
  125. /**
  126. * sg_init_one - Initialize a single entry sg list
  127. * @sg: SG entry
  128. * @buf: Virtual address for IO
  129. * @buflen: IO length
  130. *
  131. **/
  132. void sg_init_one(struct scatterlist *sg, const void *buf, unsigned int buflen)
  133. {
  134. sg_init_table(sg, 1);
  135. sg_set_buf(sg, buf, buflen);
  136. }
  137. EXPORT_SYMBOL(sg_init_one);
  138. /*
  139. * The default behaviour of sg_alloc_table() is to use these kmalloc/kfree
  140. * helpers.
  141. */
  142. static struct scatterlist *sg_kmalloc(unsigned int nents, gfp_t gfp_mask)
  143. {
  144. if (nents == SG_MAX_SINGLE_ALLOC) {
  145. /*
  146. * Kmemleak doesn't track page allocations as they are not
  147. * commonly used (in a raw form) for kernel data structures.
  148. * As we chain together a list of pages and then a normal
  149. * kmalloc (tracked by kmemleak), in order to for that last
  150. * allocation not to become decoupled (and thus a
  151. * false-positive) we need to inform kmemleak of all the
  152. * intermediate allocations.
  153. */
  154. void *ptr = (void *) __get_free_page(gfp_mask);
  155. kmemleak_alloc(ptr, PAGE_SIZE, 1, gfp_mask);
  156. return ptr;
  157. } else
  158. return kmalloc_objs(struct scatterlist, nents, gfp_mask);
  159. }
  160. static void sg_kfree(struct scatterlist *sg, unsigned int nents)
  161. {
  162. if (nents == SG_MAX_SINGLE_ALLOC) {
  163. kmemleak_free(sg);
  164. free_page((unsigned long) sg);
  165. } else
  166. kfree(sg);
  167. }
  168. /**
  169. * __sg_free_table - Free a previously mapped sg table
  170. * @table: The sg table header to use
  171. * @max_ents: The maximum number of entries per single scatterlist
  172. * @nents_first_chunk: Number of entries int the (preallocated) first
  173. * scatterlist chunk, 0 means no such preallocated first chunk
  174. * @free_fn: Free function
  175. * @num_ents: Number of entries in the table
  176. *
  177. * Description:
  178. * Free an sg table previously allocated and setup with
  179. * __sg_alloc_table(). The @max_ents value must be identical to
  180. * that previously used with __sg_alloc_table().
  181. *
  182. **/
  183. void __sg_free_table(struct sg_table *table, unsigned int max_ents,
  184. unsigned int nents_first_chunk, sg_free_fn *free_fn,
  185. unsigned int num_ents)
  186. {
  187. struct scatterlist *sgl, *next;
  188. unsigned curr_max_ents = nents_first_chunk ?: max_ents;
  189. if (unlikely(!table->sgl))
  190. return;
  191. sgl = table->sgl;
  192. while (num_ents) {
  193. unsigned int alloc_size = num_ents;
  194. unsigned int sg_size;
  195. /*
  196. * If we have more than max_ents segments left,
  197. * then assign 'next' to the sg table after the current one.
  198. * sg_size is then one less than alloc size, since the last
  199. * element is the chain pointer.
  200. */
  201. if (alloc_size > curr_max_ents) {
  202. next = sg_chain_ptr(&sgl[curr_max_ents - 1]);
  203. alloc_size = curr_max_ents;
  204. sg_size = alloc_size - 1;
  205. } else {
  206. sg_size = alloc_size;
  207. next = NULL;
  208. }
  209. num_ents -= sg_size;
  210. if (nents_first_chunk)
  211. nents_first_chunk = 0;
  212. else
  213. free_fn(sgl, alloc_size);
  214. sgl = next;
  215. curr_max_ents = max_ents;
  216. }
  217. table->sgl = NULL;
  218. }
  219. EXPORT_SYMBOL(__sg_free_table);
  220. /**
  221. * sg_free_append_table - Free a previously allocated append sg table.
  222. * @table: The mapped sg append table header
  223. *
  224. **/
  225. void sg_free_append_table(struct sg_append_table *table)
  226. {
  227. __sg_free_table(&table->sgt, SG_MAX_SINGLE_ALLOC, 0, sg_kfree,
  228. table->total_nents);
  229. }
  230. EXPORT_SYMBOL(sg_free_append_table);
  231. /**
  232. * sg_free_table - Free a previously allocated sg table
  233. * @table: The mapped sg table header
  234. *
  235. **/
  236. void sg_free_table(struct sg_table *table)
  237. {
  238. __sg_free_table(table, SG_MAX_SINGLE_ALLOC, 0, sg_kfree,
  239. table->orig_nents);
  240. }
  241. EXPORT_SYMBOL(sg_free_table);
  242. /**
  243. * __sg_alloc_table - Allocate and initialize an sg table with given allocator
  244. * @table: The sg table header to use
  245. * @nents: Number of entries in sg list
  246. * @max_ents: The maximum number of entries the allocator returns per call
  247. * @first_chunk: first SGL if preallocated (may be %NULL)
  248. * @nents_first_chunk: Number of entries in the (preallocated) first
  249. * scatterlist chunk, 0 means no such preallocated chunk provided by user
  250. * @gfp_mask: GFP allocation mask
  251. * @alloc_fn: Allocator to use
  252. *
  253. * Description:
  254. * This function returns a @table @nents long. The allocator is
  255. * defined to return scatterlist chunks of maximum size @max_ents.
  256. * Thus if @nents is bigger than @max_ents, the scatterlists will be
  257. * chained in units of @max_ents.
  258. *
  259. * Notes:
  260. * If this function returns non-0 (eg failure), the caller must call
  261. * __sg_free_table() to cleanup any leftover allocations.
  262. *
  263. **/
  264. int __sg_alloc_table(struct sg_table *table, unsigned int nents,
  265. unsigned int max_ents, struct scatterlist *first_chunk,
  266. unsigned int nents_first_chunk, gfp_t gfp_mask,
  267. sg_alloc_fn *alloc_fn)
  268. {
  269. struct scatterlist *sg, *prv;
  270. unsigned int left;
  271. unsigned curr_max_ents = nents_first_chunk ?: max_ents;
  272. unsigned prv_max_ents;
  273. memset(table, 0, sizeof(*table));
  274. if (nents == 0)
  275. return -EINVAL;
  276. #ifdef CONFIG_ARCH_NO_SG_CHAIN
  277. if (WARN_ON_ONCE(nents > max_ents))
  278. return -EINVAL;
  279. #endif
  280. left = nents;
  281. prv = NULL;
  282. do {
  283. unsigned int sg_size, alloc_size = left;
  284. if (alloc_size > curr_max_ents) {
  285. alloc_size = curr_max_ents;
  286. sg_size = alloc_size - 1;
  287. } else
  288. sg_size = alloc_size;
  289. left -= sg_size;
  290. if (first_chunk) {
  291. sg = first_chunk;
  292. first_chunk = NULL;
  293. } else {
  294. sg = alloc_fn(alloc_size, gfp_mask);
  295. }
  296. if (unlikely(!sg)) {
  297. /*
  298. * Adjust entry count to reflect that the last
  299. * entry of the previous table won't be used for
  300. * linkage. Without this, sg_kfree() may get
  301. * confused.
  302. */
  303. if (prv)
  304. table->nents = ++table->orig_nents;
  305. return -ENOMEM;
  306. }
  307. sg_init_table(sg, alloc_size);
  308. table->nents = table->orig_nents += sg_size;
  309. /*
  310. * If this is the first mapping, assign the sg table header.
  311. * If this is not the first mapping, chain previous part.
  312. */
  313. if (prv)
  314. sg_chain(prv, prv_max_ents, sg);
  315. else
  316. table->sgl = sg;
  317. /*
  318. * If no more entries after this one, mark the end
  319. */
  320. if (!left)
  321. sg_mark_end(&sg[sg_size - 1]);
  322. prv = sg;
  323. prv_max_ents = curr_max_ents;
  324. curr_max_ents = max_ents;
  325. } while (left);
  326. return 0;
  327. }
  328. EXPORT_SYMBOL(__sg_alloc_table);
  329. /**
  330. * sg_alloc_table - Allocate and initialize an sg table
  331. * @table: The sg table header to use
  332. * @nents: Number of entries in sg list
  333. * @gfp_mask: GFP allocation mask
  334. *
  335. * Description:
  336. * Allocate and initialize an sg table. If @nents is larger than
  337. * SG_MAX_SINGLE_ALLOC a chained sg table will be setup.
  338. *
  339. **/
  340. int sg_alloc_table(struct sg_table *table, unsigned int nents, gfp_t gfp_mask)
  341. {
  342. int ret;
  343. ret = __sg_alloc_table(table, nents, SG_MAX_SINGLE_ALLOC,
  344. NULL, 0, gfp_mask, sg_kmalloc);
  345. if (unlikely(ret))
  346. sg_free_table(table);
  347. return ret;
  348. }
  349. EXPORT_SYMBOL(sg_alloc_table);
  350. static struct scatterlist *get_next_sg(struct sg_append_table *table,
  351. struct scatterlist *cur,
  352. unsigned long needed_sges,
  353. gfp_t gfp_mask)
  354. {
  355. struct scatterlist *new_sg, *next_sg;
  356. unsigned int alloc_size;
  357. if (cur) {
  358. next_sg = sg_next(cur);
  359. /* Check if last entry should be keeped for chainning */
  360. if (!sg_is_last(next_sg) || needed_sges == 1)
  361. return next_sg;
  362. }
  363. alloc_size = min_t(unsigned long, needed_sges, SG_MAX_SINGLE_ALLOC);
  364. new_sg = sg_kmalloc(alloc_size, gfp_mask);
  365. if (!new_sg)
  366. return ERR_PTR(-ENOMEM);
  367. sg_init_table(new_sg, alloc_size);
  368. if (cur) {
  369. table->total_nents += alloc_size - 1;
  370. __sg_chain(next_sg, new_sg);
  371. } else {
  372. table->sgt.sgl = new_sg;
  373. table->total_nents = alloc_size;
  374. }
  375. return new_sg;
  376. }
  377. static bool pages_are_mergeable(struct page *a, struct page *b)
  378. {
  379. if (page_to_pfn(a) != page_to_pfn(b) + 1)
  380. return false;
  381. if (!zone_device_pages_have_same_pgmap(a, b))
  382. return false;
  383. return true;
  384. }
  385. /**
  386. * sg_alloc_append_table_from_pages - Allocate and initialize an append sg
  387. * table from an array of pages
  388. * @sgt_append: The sg append table to use
  389. * @pages: Pointer to an array of page pointers
  390. * @n_pages: Number of pages in the pages array
  391. * @offset: Offset from start of the first page to the start of a buffer
  392. * @size: Number of valid bytes in the buffer (after offset)
  393. * @max_segment: Maximum size of a scatterlist element in bytes
  394. * @left_pages: Left pages caller have to set after this call
  395. * @gfp_mask: GFP allocation mask
  396. *
  397. * Description:
  398. * In the first call it allocate and initialize an sg table from a list of
  399. * pages, else reuse the scatterlist from sgt_append. Contiguous ranges of
  400. * the pages are squashed into a single scatterlist entry up to the maximum
  401. * size specified in @max_segment. A user may provide an offset at a start
  402. * and a size of valid data in a buffer specified by the page array. The
  403. * returned sg table is released by sg_free_append_table
  404. *
  405. * Returns:
  406. * 0 on success, negative error on failure
  407. *
  408. * Notes:
  409. * If this function returns non-0 (eg failure), the caller must call
  410. * sg_free_append_table() to cleanup any leftover allocations.
  411. *
  412. * In the fist call, sgt_append must by initialized.
  413. */
  414. int sg_alloc_append_table_from_pages(struct sg_append_table *sgt_append,
  415. struct page **pages, unsigned int n_pages, unsigned int offset,
  416. unsigned long size, unsigned int max_segment,
  417. unsigned int left_pages, gfp_t gfp_mask)
  418. {
  419. unsigned int chunks, cur_page, seg_len, i, prv_len = 0;
  420. unsigned int added_nents = 0;
  421. struct scatterlist *s = sgt_append->prv;
  422. struct page *last_pg;
  423. /*
  424. * The algorithm below requires max_segment to be aligned to PAGE_SIZE
  425. * otherwise it can overshoot.
  426. */
  427. max_segment = ALIGN_DOWN(max_segment, PAGE_SIZE);
  428. if (WARN_ON(max_segment < PAGE_SIZE))
  429. return -EINVAL;
  430. if (IS_ENABLED(CONFIG_ARCH_NO_SG_CHAIN) && sgt_append->prv)
  431. return -EOPNOTSUPP;
  432. if (sgt_append->prv) {
  433. unsigned long next_pfn;
  434. if (WARN_ON(offset))
  435. return -EINVAL;
  436. /* Merge contiguous pages into the last SG */
  437. prv_len = sgt_append->prv->length;
  438. next_pfn = (sg_phys(sgt_append->prv) + prv_len) / PAGE_SIZE;
  439. if (page_to_pfn(pages[0]) == next_pfn) {
  440. last_pg = pfn_to_page(next_pfn - 1);
  441. while (n_pages && pages_are_mergeable(pages[0], last_pg)) {
  442. if (sgt_append->prv->length + PAGE_SIZE > max_segment)
  443. break;
  444. sgt_append->prv->length += PAGE_SIZE;
  445. last_pg = pages[0];
  446. pages++;
  447. n_pages--;
  448. }
  449. if (!n_pages)
  450. goto out;
  451. }
  452. }
  453. /* compute number of contiguous chunks */
  454. chunks = 1;
  455. seg_len = 0;
  456. for (i = 1; i < n_pages; i++) {
  457. seg_len += PAGE_SIZE;
  458. if (seg_len >= max_segment ||
  459. !pages_are_mergeable(pages[i], pages[i - 1])) {
  460. chunks++;
  461. seg_len = 0;
  462. }
  463. }
  464. /* merging chunks and putting them into the scatterlist */
  465. cur_page = 0;
  466. for (i = 0; i < chunks; i++) {
  467. unsigned int j, chunk_size;
  468. /* look for the end of the current chunk */
  469. seg_len = 0;
  470. for (j = cur_page + 1; j < n_pages; j++) {
  471. seg_len += PAGE_SIZE;
  472. if (seg_len >= max_segment ||
  473. !pages_are_mergeable(pages[j], pages[j - 1]))
  474. break;
  475. }
  476. /* Pass how many chunks might be left */
  477. s = get_next_sg(sgt_append, s, chunks - i + left_pages,
  478. gfp_mask);
  479. if (IS_ERR(s)) {
  480. /*
  481. * Adjust entry length to be as before function was
  482. * called.
  483. */
  484. if (sgt_append->prv)
  485. sgt_append->prv->length = prv_len;
  486. return PTR_ERR(s);
  487. }
  488. chunk_size = ((j - cur_page) << PAGE_SHIFT) - offset;
  489. sg_set_page(s, pages[cur_page],
  490. min_t(unsigned long, size, chunk_size), offset);
  491. added_nents++;
  492. size -= chunk_size;
  493. offset = 0;
  494. cur_page = j;
  495. }
  496. sgt_append->sgt.nents += added_nents;
  497. sgt_append->sgt.orig_nents = sgt_append->sgt.nents;
  498. sgt_append->prv = s;
  499. out:
  500. if (!left_pages)
  501. sg_mark_end(s);
  502. return 0;
  503. }
  504. EXPORT_SYMBOL(sg_alloc_append_table_from_pages);
  505. /**
  506. * sg_alloc_table_from_pages_segment - Allocate and initialize an sg table from
  507. * an array of pages and given maximum
  508. * segment.
  509. * @sgt: The sg table header to use
  510. * @pages: Pointer to an array of page pointers
  511. * @n_pages: Number of pages in the pages array
  512. * @offset: Offset from start of the first page to the start of a buffer
  513. * @size: Number of valid bytes in the buffer (after offset)
  514. * @max_segment: Maximum size of a scatterlist element in bytes
  515. * @gfp_mask: GFP allocation mask
  516. *
  517. * Description:
  518. * Allocate and initialize an sg table from a list of pages. Contiguous
  519. * ranges of the pages are squashed into a single scatterlist node up to the
  520. * maximum size specified in @max_segment. A user may provide an offset at a
  521. * start and a size of valid data in a buffer specified by the page array.
  522. *
  523. * The returned sg table is released by sg_free_table.
  524. *
  525. * Returns:
  526. * 0 on success, negative error on failure
  527. */
  528. int sg_alloc_table_from_pages_segment(struct sg_table *sgt, struct page **pages,
  529. unsigned int n_pages, unsigned int offset,
  530. unsigned long size, unsigned int max_segment,
  531. gfp_t gfp_mask)
  532. {
  533. struct sg_append_table append = {};
  534. int err;
  535. err = sg_alloc_append_table_from_pages(&append, pages, n_pages, offset,
  536. size, max_segment, 0, gfp_mask);
  537. if (err) {
  538. sg_free_append_table(&append);
  539. return err;
  540. }
  541. memcpy(sgt, &append.sgt, sizeof(*sgt));
  542. WARN_ON(append.total_nents != sgt->orig_nents);
  543. return 0;
  544. }
  545. EXPORT_SYMBOL(sg_alloc_table_from_pages_segment);
  546. #ifdef CONFIG_SGL_ALLOC
  547. /**
  548. * sgl_alloc_order - allocate a scatterlist and its pages
  549. * @length: Length in bytes of the scatterlist. Must be at least one
  550. * @order: Second argument for alloc_pages()
  551. * @chainable: Whether or not to allocate an extra element in the scatterlist
  552. * for scatterlist chaining purposes
  553. * @gfp: Memory allocation flags
  554. * @nent_p: [out] Number of entries in the scatterlist that have pages
  555. *
  556. * Returns: A pointer to an initialized scatterlist or %NULL upon failure.
  557. */
  558. struct scatterlist *sgl_alloc_order(unsigned long long length,
  559. unsigned int order, bool chainable,
  560. gfp_t gfp, unsigned int *nent_p)
  561. {
  562. struct scatterlist *sgl, *sg;
  563. struct page *page;
  564. unsigned int nent, nalloc;
  565. u32 elem_len;
  566. nent = round_up(length, PAGE_SIZE << order) >> (PAGE_SHIFT + order);
  567. /* Check for integer overflow */
  568. if (length > (nent << (PAGE_SHIFT + order)))
  569. return NULL;
  570. nalloc = nent;
  571. if (chainable) {
  572. /* Check for integer overflow */
  573. if (nalloc + 1 < nalloc)
  574. return NULL;
  575. nalloc++;
  576. }
  577. sgl = kmalloc_objs(struct scatterlist, nalloc, gfp & ~GFP_DMA);
  578. if (!sgl)
  579. return NULL;
  580. sg_init_table(sgl, nalloc);
  581. sg = sgl;
  582. while (length) {
  583. elem_len = min_t(u64, length, PAGE_SIZE << order);
  584. page = alloc_pages(gfp, order);
  585. if (!page) {
  586. sgl_free_order(sgl, order);
  587. return NULL;
  588. }
  589. sg_set_page(sg, page, elem_len, 0);
  590. length -= elem_len;
  591. sg = sg_next(sg);
  592. }
  593. WARN_ONCE(length, "length = %lld\n", length);
  594. if (nent_p)
  595. *nent_p = nent;
  596. return sgl;
  597. }
  598. EXPORT_SYMBOL(sgl_alloc_order);
  599. /**
  600. * sgl_alloc - allocate a scatterlist and its pages
  601. * @length: Length in bytes of the scatterlist
  602. * @gfp: Memory allocation flags
  603. * @nent_p: [out] Number of entries in the scatterlist
  604. *
  605. * Returns: A pointer to an initialized scatterlist or %NULL upon failure.
  606. */
  607. struct scatterlist *sgl_alloc(unsigned long long length, gfp_t gfp,
  608. unsigned int *nent_p)
  609. {
  610. return sgl_alloc_order(length, 0, false, gfp, nent_p);
  611. }
  612. EXPORT_SYMBOL(sgl_alloc);
  613. /**
  614. * sgl_free_n_order - free a scatterlist and its pages
  615. * @sgl: Scatterlist with one or more elements
  616. * @nents: Maximum number of elements to free
  617. * @order: Second argument for __free_pages()
  618. *
  619. * Notes:
  620. * - If several scatterlists have been chained and each chain element is
  621. * freed separately then it's essential to set nents correctly to avoid that a
  622. * page would get freed twice.
  623. * - All pages in a chained scatterlist can be freed at once by setting @nents
  624. * to a high number.
  625. */
  626. void sgl_free_n_order(struct scatterlist *sgl, int nents, int order)
  627. {
  628. struct scatterlist *sg;
  629. struct page *page;
  630. int i;
  631. for_each_sg(sgl, sg, nents, i) {
  632. if (!sg)
  633. break;
  634. page = sg_page(sg);
  635. if (page)
  636. __free_pages(page, order);
  637. }
  638. kfree(sgl);
  639. }
  640. EXPORT_SYMBOL(sgl_free_n_order);
  641. /**
  642. * sgl_free_order - free a scatterlist and its pages
  643. * @sgl: Scatterlist with one or more elements
  644. * @order: Second argument for __free_pages()
  645. */
  646. void sgl_free_order(struct scatterlist *sgl, int order)
  647. {
  648. sgl_free_n_order(sgl, INT_MAX, order);
  649. }
  650. EXPORT_SYMBOL(sgl_free_order);
  651. /**
  652. * sgl_free - free a scatterlist and its pages
  653. * @sgl: Scatterlist with one or more elements
  654. */
  655. void sgl_free(struct scatterlist *sgl)
  656. {
  657. sgl_free_order(sgl, 0);
  658. }
  659. EXPORT_SYMBOL(sgl_free);
  660. #endif /* CONFIG_SGL_ALLOC */
  661. void __sg_page_iter_start(struct sg_page_iter *piter,
  662. struct scatterlist *sglist, unsigned int nents,
  663. unsigned long pgoffset)
  664. {
  665. piter->__pg_advance = 0;
  666. piter->__nents = nents;
  667. piter->sg = sglist;
  668. piter->sg_pgoffset = pgoffset;
  669. }
  670. EXPORT_SYMBOL(__sg_page_iter_start);
  671. static int sg_page_count(struct scatterlist *sg)
  672. {
  673. return PAGE_ALIGN(sg->offset + sg->length) >> PAGE_SHIFT;
  674. }
  675. bool __sg_page_iter_next(struct sg_page_iter *piter)
  676. {
  677. if (!piter->__nents || !piter->sg)
  678. return false;
  679. piter->sg_pgoffset += piter->__pg_advance;
  680. piter->__pg_advance = 1;
  681. while (piter->sg_pgoffset >= sg_page_count(piter->sg)) {
  682. piter->sg_pgoffset -= sg_page_count(piter->sg);
  683. piter->sg = sg_next(piter->sg);
  684. if (!--piter->__nents || !piter->sg)
  685. return false;
  686. }
  687. return true;
  688. }
  689. EXPORT_SYMBOL(__sg_page_iter_next);
  690. static int sg_dma_page_count(struct scatterlist *sg)
  691. {
  692. return PAGE_ALIGN(sg->offset + sg_dma_len(sg)) >> PAGE_SHIFT;
  693. }
  694. bool __sg_page_iter_dma_next(struct sg_dma_page_iter *dma_iter)
  695. {
  696. struct sg_page_iter *piter = &dma_iter->base;
  697. if (!piter->__nents || !piter->sg)
  698. return false;
  699. piter->sg_pgoffset += piter->__pg_advance;
  700. piter->__pg_advance = 1;
  701. while (piter->sg_pgoffset >= sg_dma_page_count(piter->sg)) {
  702. piter->sg_pgoffset -= sg_dma_page_count(piter->sg);
  703. piter->sg = sg_next(piter->sg);
  704. if (!--piter->__nents || !piter->sg)
  705. return false;
  706. }
  707. return true;
  708. }
  709. EXPORT_SYMBOL(__sg_page_iter_dma_next);
  710. /**
  711. * sg_miter_start - start mapping iteration over a sg list
  712. * @miter: sg mapping iter to be started
  713. * @sgl: sg list to iterate over
  714. * @nents: number of sg entries
  715. * @flags: sg iterator flags
  716. *
  717. * Description:
  718. * Starts mapping iterator @miter.
  719. *
  720. * Context:
  721. * Don't care.
  722. */
  723. void sg_miter_start(struct sg_mapping_iter *miter, struct scatterlist *sgl,
  724. unsigned int nents, unsigned int flags)
  725. {
  726. memset(miter, 0, sizeof(struct sg_mapping_iter));
  727. __sg_page_iter_start(&miter->piter, sgl, nents, 0);
  728. WARN_ON(!(flags & (SG_MITER_TO_SG | SG_MITER_FROM_SG)));
  729. miter->__flags = flags;
  730. }
  731. EXPORT_SYMBOL(sg_miter_start);
  732. static bool sg_miter_get_next_page(struct sg_mapping_iter *miter)
  733. {
  734. if (!miter->__remaining) {
  735. struct scatterlist *sg;
  736. if (!__sg_page_iter_next(&miter->piter))
  737. return false;
  738. sg = miter->piter.sg;
  739. miter->__offset = miter->piter.sg_pgoffset ? 0 : sg->offset;
  740. miter->piter.sg_pgoffset += miter->__offset >> PAGE_SHIFT;
  741. miter->__offset &= PAGE_SIZE - 1;
  742. miter->__remaining = sg->offset + sg->length -
  743. (miter->piter.sg_pgoffset << PAGE_SHIFT) -
  744. miter->__offset;
  745. miter->__remaining = min_t(unsigned long, miter->__remaining,
  746. PAGE_SIZE - miter->__offset);
  747. }
  748. return true;
  749. }
  750. /**
  751. * sg_miter_skip - reposition mapping iterator
  752. * @miter: sg mapping iter to be skipped
  753. * @offset: number of bytes to plus the current location
  754. *
  755. * Description:
  756. * Sets the offset of @miter to its current location plus @offset bytes.
  757. * If mapping iterator @miter has been proceeded by sg_miter_next(), this
  758. * stops @miter.
  759. *
  760. * Context:
  761. * Don't care.
  762. *
  763. * Returns:
  764. * true if @miter contains the valid mapping. false if end of sg
  765. * list is reached.
  766. */
  767. bool sg_miter_skip(struct sg_mapping_iter *miter, off_t offset)
  768. {
  769. sg_miter_stop(miter);
  770. while (offset) {
  771. off_t consumed;
  772. if (!sg_miter_get_next_page(miter))
  773. return false;
  774. consumed = min_t(off_t, offset, miter->__remaining);
  775. miter->__offset += consumed;
  776. miter->__remaining -= consumed;
  777. offset -= consumed;
  778. }
  779. return true;
  780. }
  781. EXPORT_SYMBOL(sg_miter_skip);
  782. /**
  783. * sg_miter_next - proceed mapping iterator to the next mapping
  784. * @miter: sg mapping iter to proceed
  785. *
  786. * Description:
  787. * Proceeds @miter to the next mapping. @miter should have been started
  788. * using sg_miter_start(). On successful return, @miter->page,
  789. * @miter->addr and @miter->length point to the current mapping.
  790. *
  791. * Context:
  792. * May sleep if !SG_MITER_ATOMIC && !SG_MITER_LOCAL.
  793. *
  794. * Returns:
  795. * true if @miter contains the next mapping. false if end of sg
  796. * list is reached.
  797. */
  798. bool sg_miter_next(struct sg_mapping_iter *miter)
  799. {
  800. sg_miter_stop(miter);
  801. /*
  802. * Get to the next page if necessary.
  803. * __remaining, __offset is adjusted by sg_miter_stop
  804. */
  805. if (!sg_miter_get_next_page(miter))
  806. return false;
  807. miter->page = sg_page_iter_page(&miter->piter);
  808. miter->consumed = miter->length = miter->__remaining;
  809. if (miter->__flags & SG_MITER_ATOMIC)
  810. miter->addr = kmap_atomic(miter->page) + miter->__offset;
  811. else if (miter->__flags & SG_MITER_LOCAL)
  812. miter->addr = kmap_local_page(miter->page) + miter->__offset;
  813. else
  814. miter->addr = kmap(miter->page) + miter->__offset;
  815. return true;
  816. }
  817. EXPORT_SYMBOL(sg_miter_next);
  818. /**
  819. * sg_miter_stop - stop mapping iteration
  820. * @miter: sg mapping iter to be stopped
  821. *
  822. * Description:
  823. * Stops mapping iterator @miter. @miter should have been started
  824. * using sg_miter_start(). A stopped iteration can be resumed by
  825. * calling sg_miter_next() on it. This is useful when resources (kmap)
  826. * need to be released during iteration.
  827. *
  828. * Context:
  829. * Don't care otherwise.
  830. */
  831. void sg_miter_stop(struct sg_mapping_iter *miter)
  832. {
  833. WARN_ON(miter->consumed > miter->length);
  834. /* drop resources from the last iteration */
  835. if (miter->addr) {
  836. miter->__offset += miter->consumed;
  837. miter->__remaining -= miter->consumed;
  838. if (miter->__flags & SG_MITER_TO_SG)
  839. flush_dcache_page(miter->page);
  840. if (miter->__flags & SG_MITER_ATOMIC) {
  841. WARN_ON_ONCE(!pagefault_disabled());
  842. kunmap_atomic(miter->addr);
  843. } else if (miter->__flags & SG_MITER_LOCAL)
  844. kunmap_local(miter->addr);
  845. else
  846. kunmap(miter->page);
  847. miter->page = NULL;
  848. miter->addr = NULL;
  849. miter->length = 0;
  850. miter->consumed = 0;
  851. }
  852. }
  853. EXPORT_SYMBOL(sg_miter_stop);
  854. /**
  855. * sg_copy_buffer - Copy data between a linear buffer and an SG list
  856. * @sgl: The SG list
  857. * @nents: Number of SG entries
  858. * @buf: Where to copy from
  859. * @buflen: The number of bytes to copy
  860. * @skip: Number of bytes to skip before copying
  861. * @to_buffer: transfer direction (true == from an sg list to a
  862. * buffer, false == from a buffer to an sg list)
  863. *
  864. * Returns the number of copied bytes.
  865. *
  866. **/
  867. size_t sg_copy_buffer(struct scatterlist *sgl, unsigned int nents, void *buf,
  868. size_t buflen, off_t skip, bool to_buffer)
  869. {
  870. unsigned int offset = 0;
  871. struct sg_mapping_iter miter;
  872. unsigned int sg_flags = SG_MITER_LOCAL;
  873. if (to_buffer)
  874. sg_flags |= SG_MITER_FROM_SG;
  875. else
  876. sg_flags |= SG_MITER_TO_SG;
  877. sg_miter_start(&miter, sgl, nents, sg_flags);
  878. if (!sg_miter_skip(&miter, skip))
  879. return 0;
  880. while ((offset < buflen) && sg_miter_next(&miter)) {
  881. unsigned int len;
  882. len = min(miter.length, buflen - offset);
  883. if (to_buffer)
  884. memcpy(buf + offset, miter.addr, len);
  885. else
  886. memcpy(miter.addr, buf + offset, len);
  887. offset += len;
  888. }
  889. sg_miter_stop(&miter);
  890. return offset;
  891. }
  892. EXPORT_SYMBOL(sg_copy_buffer);
  893. /**
  894. * sg_copy_from_buffer - Copy from a linear buffer to an SG list
  895. * @sgl: The SG list
  896. * @nents: Number of SG entries
  897. * @buf: Where to copy from
  898. * @buflen: The number of bytes to copy
  899. *
  900. * Returns the number of copied bytes.
  901. *
  902. **/
  903. size_t sg_copy_from_buffer(struct scatterlist *sgl, unsigned int nents,
  904. const void *buf, size_t buflen)
  905. {
  906. return sg_copy_buffer(sgl, nents, (void *)buf, buflen, 0, false);
  907. }
  908. EXPORT_SYMBOL(sg_copy_from_buffer);
  909. /**
  910. * sg_copy_to_buffer - Copy from an SG list to a linear buffer
  911. * @sgl: The SG list
  912. * @nents: Number of SG entries
  913. * @buf: Where to copy to
  914. * @buflen: The number of bytes to copy
  915. *
  916. * Returns the number of copied bytes.
  917. *
  918. **/
  919. size_t sg_copy_to_buffer(struct scatterlist *sgl, unsigned int nents,
  920. void *buf, size_t buflen)
  921. {
  922. return sg_copy_buffer(sgl, nents, buf, buflen, 0, true);
  923. }
  924. EXPORT_SYMBOL(sg_copy_to_buffer);
  925. /**
  926. * sg_pcopy_from_buffer - Copy from a linear buffer to an SG list
  927. * @sgl: The SG list
  928. * @nents: Number of SG entries
  929. * @buf: Where to copy from
  930. * @buflen: The number of bytes to copy
  931. * @skip: Number of bytes to skip before copying
  932. *
  933. * Returns the number of copied bytes.
  934. *
  935. **/
  936. size_t sg_pcopy_from_buffer(struct scatterlist *sgl, unsigned int nents,
  937. const void *buf, size_t buflen, off_t skip)
  938. {
  939. return sg_copy_buffer(sgl, nents, (void *)buf, buflen, skip, false);
  940. }
  941. EXPORT_SYMBOL(sg_pcopy_from_buffer);
  942. /**
  943. * sg_pcopy_to_buffer - Copy from an SG list to a linear buffer
  944. * @sgl: The SG list
  945. * @nents: Number of SG entries
  946. * @buf: Where to copy to
  947. * @buflen: The number of bytes to copy
  948. * @skip: Number of bytes to skip before copying
  949. *
  950. * Returns the number of copied bytes.
  951. *
  952. **/
  953. size_t sg_pcopy_to_buffer(struct scatterlist *sgl, unsigned int nents,
  954. void *buf, size_t buflen, off_t skip)
  955. {
  956. return sg_copy_buffer(sgl, nents, buf, buflen, skip, true);
  957. }
  958. EXPORT_SYMBOL(sg_pcopy_to_buffer);
  959. /**
  960. * sg_zero_buffer - Zero-out a part of a SG list
  961. * @sgl: The SG list
  962. * @nents: Number of SG entries
  963. * @buflen: The number of bytes to zero out
  964. * @skip: Number of bytes to skip before zeroing
  965. *
  966. * Returns the number of bytes zeroed.
  967. **/
  968. size_t sg_zero_buffer(struct scatterlist *sgl, unsigned int nents,
  969. size_t buflen, off_t skip)
  970. {
  971. unsigned int offset = 0;
  972. struct sg_mapping_iter miter;
  973. unsigned int sg_flags = SG_MITER_LOCAL | SG_MITER_TO_SG;
  974. sg_miter_start(&miter, sgl, nents, sg_flags);
  975. if (!sg_miter_skip(&miter, skip))
  976. return false;
  977. while (offset < buflen && sg_miter_next(&miter)) {
  978. unsigned int len;
  979. len = min(miter.length, buflen - offset);
  980. memset(miter.addr, 0, len);
  981. offset += len;
  982. }
  983. sg_miter_stop(&miter);
  984. return offset;
  985. }
  986. EXPORT_SYMBOL(sg_zero_buffer);
  987. /*
  988. * Extract and pin a list of up to sg_max pages from UBUF- or IOVEC-class
  989. * iterators, and add them to the scatterlist.
  990. */
  991. static ssize_t extract_user_to_sg(struct iov_iter *iter,
  992. ssize_t maxsize,
  993. struct sg_table *sgtable,
  994. unsigned int sg_max,
  995. iov_iter_extraction_t extraction_flags)
  996. {
  997. struct scatterlist *sg = sgtable->sgl + sgtable->nents;
  998. struct page **pages;
  999. unsigned int npages;
  1000. ssize_t ret = 0, res;
  1001. size_t len, off;
  1002. /* We decant the page list into the tail of the scatterlist */
  1003. pages = (void *)sgtable->sgl +
  1004. array_size(sg_max, sizeof(struct scatterlist));
  1005. pages -= sg_max;
  1006. do {
  1007. res = iov_iter_extract_pages(iter, &pages, maxsize, sg_max,
  1008. extraction_flags, &off);
  1009. if (res <= 0)
  1010. goto failed;
  1011. len = res;
  1012. maxsize -= len;
  1013. ret += len;
  1014. npages = DIV_ROUND_UP(off + len, PAGE_SIZE);
  1015. sg_max -= npages;
  1016. for (; npages > 0; npages--) {
  1017. struct page *page = *pages;
  1018. size_t seg = min_t(size_t, PAGE_SIZE - off, len);
  1019. *pages++ = NULL;
  1020. sg_set_page(sg, page, seg, off);
  1021. sgtable->nents++;
  1022. sg++;
  1023. len -= seg;
  1024. off = 0;
  1025. }
  1026. } while (maxsize > 0 && sg_max > 0);
  1027. return ret;
  1028. failed:
  1029. while (sgtable->nents > sgtable->orig_nents)
  1030. unpin_user_page(sg_page(&sgtable->sgl[--sgtable->nents]));
  1031. return res;
  1032. }
  1033. /*
  1034. * Extract up to sg_max pages from a BVEC-type iterator and add them to the
  1035. * scatterlist. The pages are not pinned.
  1036. */
  1037. static ssize_t extract_bvec_to_sg(struct iov_iter *iter,
  1038. ssize_t maxsize,
  1039. struct sg_table *sgtable,
  1040. unsigned int sg_max,
  1041. iov_iter_extraction_t extraction_flags)
  1042. {
  1043. const struct bio_vec *bv = iter->bvec;
  1044. struct scatterlist *sg = sgtable->sgl + sgtable->nents;
  1045. unsigned long start = iter->iov_offset;
  1046. unsigned int i;
  1047. ssize_t ret = 0;
  1048. for (i = 0; i < iter->nr_segs; i++) {
  1049. size_t off, len;
  1050. len = bv[i].bv_len;
  1051. if (start >= len) {
  1052. start -= len;
  1053. continue;
  1054. }
  1055. len = min_t(size_t, maxsize, len - start);
  1056. off = bv[i].bv_offset + start;
  1057. sg_set_page(sg, bv[i].bv_page, len, off);
  1058. sgtable->nents++;
  1059. sg++;
  1060. sg_max--;
  1061. ret += len;
  1062. maxsize -= len;
  1063. if (maxsize <= 0 || sg_max == 0)
  1064. break;
  1065. start = 0;
  1066. }
  1067. if (ret > 0)
  1068. iov_iter_advance(iter, ret);
  1069. return ret;
  1070. }
  1071. /*
  1072. * Extract up to sg_max pages from a KVEC-type iterator and add them to the
  1073. * scatterlist. This can deal with vmalloc'd buffers as well as kmalloc'd or
  1074. * static buffers. The pages are not pinned.
  1075. */
  1076. static ssize_t extract_kvec_to_sg(struct iov_iter *iter,
  1077. ssize_t maxsize,
  1078. struct sg_table *sgtable,
  1079. unsigned int sg_max,
  1080. iov_iter_extraction_t extraction_flags)
  1081. {
  1082. const struct kvec *kv = iter->kvec;
  1083. struct scatterlist *sg = sgtable->sgl + sgtable->nents;
  1084. unsigned long start = iter->iov_offset;
  1085. unsigned int i;
  1086. ssize_t ret = 0;
  1087. for (i = 0; i < iter->nr_segs; i++) {
  1088. struct page *page;
  1089. unsigned long kaddr;
  1090. size_t off, len, seg;
  1091. len = kv[i].iov_len;
  1092. if (start >= len) {
  1093. start -= len;
  1094. continue;
  1095. }
  1096. kaddr = (unsigned long)kv[i].iov_base + start;
  1097. off = kaddr & ~PAGE_MASK;
  1098. len = min_t(size_t, maxsize, len - start);
  1099. kaddr &= PAGE_MASK;
  1100. maxsize -= len;
  1101. ret += len;
  1102. do {
  1103. seg = min_t(size_t, len, PAGE_SIZE - off);
  1104. if (is_vmalloc_or_module_addr((void *)kaddr))
  1105. page = vmalloc_to_page((void *)kaddr);
  1106. else
  1107. page = virt_to_page((void *)kaddr);
  1108. sg_set_page(sg, page, len, off);
  1109. sgtable->nents++;
  1110. sg++;
  1111. sg_max--;
  1112. len -= seg;
  1113. kaddr += PAGE_SIZE;
  1114. off = 0;
  1115. } while (len > 0 && sg_max > 0);
  1116. if (maxsize <= 0 || sg_max == 0)
  1117. break;
  1118. start = 0;
  1119. }
  1120. if (ret > 0)
  1121. iov_iter_advance(iter, ret);
  1122. return ret;
  1123. }
  1124. /*
  1125. * Extract up to sg_max folios from an FOLIOQ-type iterator and add them to
  1126. * the scatterlist. The pages are not pinned.
  1127. */
  1128. static ssize_t extract_folioq_to_sg(struct iov_iter *iter,
  1129. ssize_t maxsize,
  1130. struct sg_table *sgtable,
  1131. unsigned int sg_max,
  1132. iov_iter_extraction_t extraction_flags)
  1133. {
  1134. const struct folio_queue *folioq = iter->folioq;
  1135. struct scatterlist *sg = sgtable->sgl + sgtable->nents;
  1136. unsigned int slot = iter->folioq_slot;
  1137. ssize_t ret = 0;
  1138. size_t offset = iter->iov_offset;
  1139. BUG_ON(!folioq);
  1140. if (slot >= folioq_nr_slots(folioq)) {
  1141. folioq = folioq->next;
  1142. if (WARN_ON_ONCE(!folioq))
  1143. return 0;
  1144. slot = 0;
  1145. }
  1146. do {
  1147. struct folio *folio = folioq_folio(folioq, slot);
  1148. size_t fsize = folioq_folio_size(folioq, slot);
  1149. if (offset < fsize) {
  1150. size_t part = umin(maxsize - ret, fsize - offset);
  1151. sg_set_page(sg, folio_page(folio, 0), part, offset);
  1152. sgtable->nents++;
  1153. sg++;
  1154. sg_max--;
  1155. offset += part;
  1156. ret += part;
  1157. }
  1158. if (offset >= fsize) {
  1159. offset = 0;
  1160. slot++;
  1161. if (slot >= folioq_nr_slots(folioq)) {
  1162. if (!folioq->next) {
  1163. WARN_ON_ONCE(ret < iter->count);
  1164. break;
  1165. }
  1166. folioq = folioq->next;
  1167. slot = 0;
  1168. }
  1169. }
  1170. } while (sg_max > 0 && ret < maxsize);
  1171. iter->folioq = folioq;
  1172. iter->folioq_slot = slot;
  1173. iter->iov_offset = offset;
  1174. iter->count -= ret;
  1175. return ret;
  1176. }
  1177. /*
  1178. * Extract up to sg_max folios from an XARRAY-type iterator and add them to
  1179. * the scatterlist. The pages are not pinned.
  1180. */
  1181. static ssize_t extract_xarray_to_sg(struct iov_iter *iter,
  1182. ssize_t maxsize,
  1183. struct sg_table *sgtable,
  1184. unsigned int sg_max,
  1185. iov_iter_extraction_t extraction_flags)
  1186. {
  1187. struct scatterlist *sg = sgtable->sgl + sgtable->nents;
  1188. struct xarray *xa = iter->xarray;
  1189. struct folio *folio;
  1190. loff_t start = iter->xarray_start + iter->iov_offset;
  1191. pgoff_t index = start / PAGE_SIZE;
  1192. ssize_t ret = 0;
  1193. size_t offset, len;
  1194. XA_STATE(xas, xa, index);
  1195. rcu_read_lock();
  1196. xas_for_each(&xas, folio, ULONG_MAX) {
  1197. if (xas_retry(&xas, folio))
  1198. continue;
  1199. if (WARN_ON(xa_is_value(folio)))
  1200. break;
  1201. if (WARN_ON(folio_test_hugetlb(folio)))
  1202. break;
  1203. offset = offset_in_folio(folio, start);
  1204. len = min_t(size_t, maxsize, folio_size(folio) - offset);
  1205. sg_set_page(sg, folio_page(folio, 0), len, offset);
  1206. sgtable->nents++;
  1207. sg++;
  1208. sg_max--;
  1209. maxsize -= len;
  1210. ret += len;
  1211. if (maxsize <= 0 || sg_max == 0)
  1212. break;
  1213. }
  1214. rcu_read_unlock();
  1215. if (ret > 0)
  1216. iov_iter_advance(iter, ret);
  1217. return ret;
  1218. }
  1219. /**
  1220. * extract_iter_to_sg - Extract pages from an iterator and add to an sglist
  1221. * @iter: The iterator to extract from
  1222. * @maxsize: The amount of iterator to copy
  1223. * @sgtable: The scatterlist table to fill in
  1224. * @sg_max: Maximum number of elements in @sgtable that may be filled
  1225. * @extraction_flags: Flags to qualify the request
  1226. *
  1227. * Extract the page fragments from the given amount of the source iterator and
  1228. * add them to a scatterlist that refers to all of those bits, to a maximum
  1229. * addition of @sg_max elements.
  1230. *
  1231. * The pages referred to by UBUF- and IOVEC-type iterators are extracted and
  1232. * pinned; BVEC-, KVEC-, FOLIOQ- and XARRAY-type are extracted but aren't
  1233. * pinned; DISCARD-type is not supported.
  1234. *
  1235. * No end mark is placed on the scatterlist; that's left to the caller.
  1236. *
  1237. * @extraction_flags can have ITER_ALLOW_P2PDMA set to request peer-to-peer DMA
  1238. * be allowed on the pages extracted.
  1239. *
  1240. * If successful, @sgtable->nents is updated to include the number of elements
  1241. * added and the number of bytes added is returned. @sgtable->orig_nents is
  1242. * left unaltered.
  1243. *
  1244. * The iov_iter_extract_mode() function should be used to query how cleanup
  1245. * should be performed.
  1246. */
  1247. ssize_t extract_iter_to_sg(struct iov_iter *iter, size_t maxsize,
  1248. struct sg_table *sgtable, unsigned int sg_max,
  1249. iov_iter_extraction_t extraction_flags)
  1250. {
  1251. if (maxsize == 0)
  1252. return 0;
  1253. switch (iov_iter_type(iter)) {
  1254. case ITER_UBUF:
  1255. case ITER_IOVEC:
  1256. return extract_user_to_sg(iter, maxsize, sgtable, sg_max,
  1257. extraction_flags);
  1258. case ITER_BVEC:
  1259. return extract_bvec_to_sg(iter, maxsize, sgtable, sg_max,
  1260. extraction_flags);
  1261. case ITER_KVEC:
  1262. return extract_kvec_to_sg(iter, maxsize, sgtable, sg_max,
  1263. extraction_flags);
  1264. case ITER_FOLIOQ:
  1265. return extract_folioq_to_sg(iter, maxsize, sgtable, sg_max,
  1266. extraction_flags);
  1267. case ITER_XARRAY:
  1268. return extract_xarray_to_sg(iter, maxsize, sgtable, sg_max,
  1269. extraction_flags);
  1270. default:
  1271. pr_err("%s(%u) unsupported\n", __func__, iov_iter_type(iter));
  1272. WARN_ON_ONCE(1);
  1273. return -EIO;
  1274. }
  1275. }
  1276. EXPORT_SYMBOL_GPL(extract_iter_to_sg);