blk-lib.c 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Generic block device helper functions (discard, zeroout, secure erase)
  4. */
  5. #include <linux/kernel.h>
  6. #include <linux/module.h>
  7. #include <linux/bio.h>
  8. #include <linux/blkdev.h>
  9. #include <linux/scatterlist.h>
  10. #include "blk.h"
  11. static sector_t bio_discard_limit(struct block_device *bdev, sector_t sector)
  12. {
  13. unsigned int discard_granularity = bdev_discard_granularity(bdev);
  14. sector_t granularity_aligned_sector;
  15. if (bdev_is_partition(bdev))
  16. sector += bdev->bd_start_sect;
  17. granularity_aligned_sector =
  18. round_up(sector, discard_granularity >> SECTOR_SHIFT);
  19. /*
  20. * Make sure subsequent bios start aligned to the discard granularity if
  21. * it needs to be split.
  22. */
  23. if (granularity_aligned_sector != sector)
  24. return granularity_aligned_sector - sector;
  25. /*
  26. * Align the bio size to the discard granularity to make splitting the bio
  27. * at discard granularity boundaries easier in the driver if needed.
  28. */
  29. return round_down(BIO_MAX_SIZE, discard_granularity) >> SECTOR_SHIFT;
  30. }
  31. struct bio *blk_alloc_discard_bio(struct block_device *bdev,
  32. sector_t *sector, sector_t *nr_sects, gfp_t gfp_mask)
  33. {
  34. sector_t bio_sects = min(*nr_sects, bio_discard_limit(bdev, *sector));
  35. struct bio *bio;
  36. if (!bio_sects)
  37. return NULL;
  38. bio = bio_alloc(bdev, 0, REQ_OP_DISCARD, gfp_mask);
  39. if (!bio)
  40. return NULL;
  41. bio->bi_iter.bi_sector = *sector;
  42. bio->bi_iter.bi_size = bio_sects << SECTOR_SHIFT;
  43. *sector += bio_sects;
  44. *nr_sects -= bio_sects;
  45. /*
  46. * We can loop for a long time in here if someone does full device
  47. * discards (like mkfs). Be nice and allow us to schedule out to avoid
  48. * softlocking if preempt is disabled.
  49. */
  50. cond_resched();
  51. return bio;
  52. }
  53. void __blkdev_issue_discard(struct block_device *bdev, sector_t sector,
  54. sector_t nr_sects, gfp_t gfp_mask, struct bio **biop)
  55. {
  56. struct bio *bio;
  57. while ((bio = blk_alloc_discard_bio(bdev, &sector, &nr_sects,
  58. gfp_mask)))
  59. *biop = bio_chain_and_submit(*biop, bio);
  60. }
  61. EXPORT_SYMBOL(__blkdev_issue_discard);
  62. /**
  63. * blkdev_issue_discard - queue a discard
  64. * @bdev: blockdev to issue discard for
  65. * @sector: start sector
  66. * @nr_sects: number of sectors to discard
  67. * @gfp_mask: memory allocation flags (for bio_alloc)
  68. *
  69. * Description:
  70. * Issue a discard request for the sectors in question.
  71. */
  72. int blkdev_issue_discard(struct block_device *bdev, sector_t sector,
  73. sector_t nr_sects, gfp_t gfp_mask)
  74. {
  75. struct bio *bio = NULL;
  76. struct blk_plug plug;
  77. int ret = 0;
  78. blk_start_plug(&plug);
  79. __blkdev_issue_discard(bdev, sector, nr_sects, gfp_mask, &bio);
  80. if (bio) {
  81. ret = submit_bio_wait(bio);
  82. if (ret == -EOPNOTSUPP)
  83. ret = 0;
  84. bio_put(bio);
  85. }
  86. blk_finish_plug(&plug);
  87. return ret;
  88. }
  89. EXPORT_SYMBOL(blkdev_issue_discard);
  90. static sector_t bio_write_zeroes_limit(struct block_device *bdev)
  91. {
  92. sector_t bs_mask = (bdev_logical_block_size(bdev) >> 9) - 1;
  93. return min(bdev_write_zeroes_sectors(bdev), BIO_MAX_SECTORS & ~bs_mask);
  94. }
  95. /*
  96. * There is no reliable way for the SCSI subsystem to determine whether a
  97. * device supports a WRITE SAME operation without actually performing a write
  98. * to media. As a result, write_zeroes is enabled by default and will be
  99. * disabled if a zeroing operation subsequently fails. This means that this
  100. * queue limit is likely to change at runtime.
  101. */
  102. static void __blkdev_issue_write_zeroes(struct block_device *bdev,
  103. sector_t sector, sector_t nr_sects, gfp_t gfp_mask,
  104. struct bio **biop, unsigned flags, sector_t limit)
  105. {
  106. while (nr_sects) {
  107. unsigned int len = min(nr_sects, limit);
  108. struct bio *bio;
  109. if ((flags & BLKDEV_ZERO_KILLABLE) &&
  110. fatal_signal_pending(current))
  111. break;
  112. bio = bio_alloc(bdev, 0, REQ_OP_WRITE_ZEROES, gfp_mask);
  113. bio->bi_iter.bi_sector = sector;
  114. if (flags & BLKDEV_ZERO_NOUNMAP)
  115. bio->bi_opf |= REQ_NOUNMAP;
  116. bio->bi_iter.bi_size = len << SECTOR_SHIFT;
  117. *biop = bio_chain_and_submit(*biop, bio);
  118. nr_sects -= len;
  119. sector += len;
  120. cond_resched();
  121. }
  122. }
  123. static int blkdev_issue_write_zeroes(struct block_device *bdev, sector_t sector,
  124. sector_t nr_sects, gfp_t gfp, unsigned flags)
  125. {
  126. sector_t limit = bio_write_zeroes_limit(bdev);
  127. struct bio *bio = NULL;
  128. struct blk_plug plug;
  129. int ret = 0;
  130. blk_start_plug(&plug);
  131. __blkdev_issue_write_zeroes(bdev, sector, nr_sects, gfp, &bio,
  132. flags, limit);
  133. if (bio) {
  134. if ((flags & BLKDEV_ZERO_KILLABLE) &&
  135. fatal_signal_pending(current)) {
  136. bio_await_chain(bio);
  137. blk_finish_plug(&plug);
  138. return -EINTR;
  139. }
  140. ret = submit_bio_wait(bio);
  141. bio_put(bio);
  142. }
  143. blk_finish_plug(&plug);
  144. /*
  145. * For some devices there is no non-destructive way to verify whether
  146. * WRITE ZEROES is actually supported. These will clear the capability
  147. * on an I/O error, in which case we'll turn any error into
  148. * "not supported" here.
  149. */
  150. if (ret && !bdev_write_zeroes_sectors(bdev))
  151. return -EOPNOTSUPP;
  152. return ret;
  153. }
  154. /*
  155. * Convert a number of 512B sectors to a number of pages.
  156. * The result is limited to a number of pages that can fit into a BIO.
  157. * Also make sure that the result is always at least 1 (page) for the cases
  158. * where nr_sects is lower than the number of sectors in a page.
  159. */
  160. static unsigned int __blkdev_sectors_to_bio_pages(sector_t nr_sects)
  161. {
  162. sector_t pages = DIV_ROUND_UP_SECTOR_T(nr_sects, PAGE_SIZE / 512);
  163. return min(pages, (sector_t)BIO_MAX_VECS);
  164. }
  165. static void __blkdev_issue_zero_pages(struct block_device *bdev,
  166. sector_t sector, sector_t nr_sects, gfp_t gfp_mask,
  167. struct bio **biop, unsigned int flags)
  168. {
  169. struct folio *zero_folio = largest_zero_folio();
  170. while (nr_sects) {
  171. unsigned int nr_vecs = __blkdev_sectors_to_bio_pages(nr_sects);
  172. struct bio *bio;
  173. if ((flags & BLKDEV_ZERO_KILLABLE) &&
  174. fatal_signal_pending(current))
  175. break;
  176. bio = bio_alloc(bdev, nr_vecs, REQ_OP_WRITE, gfp_mask);
  177. bio->bi_iter.bi_sector = sector;
  178. do {
  179. unsigned int len;
  180. len = min_t(sector_t, folio_size(zero_folio),
  181. nr_sects << SECTOR_SHIFT);
  182. if (!bio_add_folio(bio, zero_folio, len, 0))
  183. break;
  184. nr_sects -= len >> SECTOR_SHIFT;
  185. sector += len >> SECTOR_SHIFT;
  186. } while (nr_sects);
  187. *biop = bio_chain_and_submit(*biop, bio);
  188. cond_resched();
  189. }
  190. }
  191. static int blkdev_issue_zero_pages(struct block_device *bdev, sector_t sector,
  192. sector_t nr_sects, gfp_t gfp, unsigned flags)
  193. {
  194. struct bio *bio = NULL;
  195. struct blk_plug plug;
  196. int ret = 0;
  197. if (flags & BLKDEV_ZERO_NOFALLBACK)
  198. return -EOPNOTSUPP;
  199. blk_start_plug(&plug);
  200. __blkdev_issue_zero_pages(bdev, sector, nr_sects, gfp, &bio, flags);
  201. if (bio) {
  202. if ((flags & BLKDEV_ZERO_KILLABLE) &&
  203. fatal_signal_pending(current)) {
  204. bio_await_chain(bio);
  205. blk_finish_plug(&plug);
  206. return -EINTR;
  207. }
  208. ret = submit_bio_wait(bio);
  209. bio_put(bio);
  210. }
  211. blk_finish_plug(&plug);
  212. return ret;
  213. }
  214. /**
  215. * __blkdev_issue_zeroout - generate number of zero filed write bios
  216. * @bdev: blockdev to issue
  217. * @sector: start sector
  218. * @nr_sects: number of sectors to write
  219. * @gfp_mask: memory allocation flags (for bio_alloc)
  220. * @biop: pointer to anchor bio
  221. * @flags: controls detailed behavior
  222. *
  223. * Description:
  224. * Zero-fill a block range, either using hardware offload or by explicitly
  225. * writing zeroes to the device.
  226. *
  227. * If a device is using logical block provisioning, the underlying space will
  228. * not be released if %flags contains BLKDEV_ZERO_NOUNMAP.
  229. *
  230. * If %flags contains BLKDEV_ZERO_NOFALLBACK, the function will return
  231. * -EOPNOTSUPP if no explicit hardware offload for zeroing is provided.
  232. */
  233. int __blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
  234. sector_t nr_sects, gfp_t gfp_mask, struct bio **biop,
  235. unsigned flags)
  236. {
  237. sector_t limit = bio_write_zeroes_limit(bdev);
  238. if (bdev_read_only(bdev))
  239. return -EPERM;
  240. if (limit) {
  241. __blkdev_issue_write_zeroes(bdev, sector, nr_sects,
  242. gfp_mask, biop, flags, limit);
  243. } else {
  244. if (flags & BLKDEV_ZERO_NOFALLBACK)
  245. return -EOPNOTSUPP;
  246. __blkdev_issue_zero_pages(bdev, sector, nr_sects, gfp_mask,
  247. biop, flags);
  248. }
  249. return 0;
  250. }
  251. EXPORT_SYMBOL(__blkdev_issue_zeroout);
  252. /**
  253. * blkdev_issue_zeroout - zero-fill a block range
  254. * @bdev: blockdev to write
  255. * @sector: start sector
  256. * @nr_sects: number of sectors to write
  257. * @gfp_mask: memory allocation flags (for bio_alloc)
  258. * @flags: controls detailed behavior
  259. *
  260. * Description:
  261. * Zero-fill a block range, either using hardware offload or by explicitly
  262. * writing zeroes to the device. See __blkdev_issue_zeroout() for the
  263. * valid values for %flags.
  264. */
  265. int blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
  266. sector_t nr_sects, gfp_t gfp_mask, unsigned flags)
  267. {
  268. int ret;
  269. if ((sector | nr_sects) & ((bdev_logical_block_size(bdev) >> 9) - 1))
  270. return -EINVAL;
  271. if (bdev_read_only(bdev))
  272. return -EPERM;
  273. if (bdev_write_zeroes_sectors(bdev)) {
  274. ret = blkdev_issue_write_zeroes(bdev, sector, nr_sects,
  275. gfp_mask, flags);
  276. if (ret != -EOPNOTSUPP)
  277. return ret;
  278. }
  279. return blkdev_issue_zero_pages(bdev, sector, nr_sects, gfp_mask, flags);
  280. }
  281. EXPORT_SYMBOL(blkdev_issue_zeroout);
  282. int blkdev_issue_secure_erase(struct block_device *bdev, sector_t sector,
  283. sector_t nr_sects, gfp_t gfp)
  284. {
  285. sector_t bs_mask = (bdev_logical_block_size(bdev) >> 9) - 1;
  286. unsigned int max_sectors = bdev_max_secure_erase_sectors(bdev);
  287. struct bio *bio = NULL;
  288. struct blk_plug plug;
  289. int ret = 0;
  290. /* make sure that "len << SECTOR_SHIFT" doesn't overflow */
  291. if (max_sectors > BIO_MAX_SECTORS)
  292. max_sectors = BIO_MAX_SECTORS;
  293. max_sectors &= ~bs_mask;
  294. if (max_sectors == 0)
  295. return -EOPNOTSUPP;
  296. if ((sector | nr_sects) & bs_mask)
  297. return -EINVAL;
  298. if (bdev_read_only(bdev))
  299. return -EPERM;
  300. blk_start_plug(&plug);
  301. while (nr_sects) {
  302. unsigned int len = min_t(sector_t, nr_sects, max_sectors);
  303. bio = blk_next_bio(bio, bdev, 0, REQ_OP_SECURE_ERASE, gfp);
  304. bio->bi_iter.bi_sector = sector;
  305. bio->bi_iter.bi_size = len << SECTOR_SHIFT;
  306. sector += len;
  307. nr_sects -= len;
  308. cond_resched();
  309. }
  310. if (bio) {
  311. ret = submit_bio_wait(bio);
  312. bio_put(bio);
  313. }
  314. blk_finish_plug(&plug);
  315. return ret;
  316. }
  317. EXPORT_SYMBOL(blkdev_issue_secure_erase);