read_retry.c 8.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /* Network filesystem read subrequest retrying.
  3. *
  4. * Copyright (C) 2024 Red Hat, Inc. All Rights Reserved.
  5. * Written by David Howells (dhowells@redhat.com)
  6. */
  7. #include <linux/fs.h>
  8. #include <linux/slab.h>
  9. #include "internal.h"
  10. static void netfs_reissue_read(struct netfs_io_request *rreq,
  11. struct netfs_io_subrequest *subreq)
  12. {
  13. subreq->error = 0;
  14. __clear_bit(NETFS_SREQ_MADE_PROGRESS, &subreq->flags);
  15. __set_bit(NETFS_SREQ_IN_PROGRESS, &subreq->flags);
  16. netfs_stat(&netfs_n_rh_retry_read_subreq);
  17. subreq->rreq->netfs_ops->issue_read(subreq);
  18. }
  19. /*
  20. * Go through the list of failed/short reads, retrying all retryable ones. We
  21. * need to switch failed cache reads to network downloads.
  22. */
  23. static void netfs_retry_read_subrequests(struct netfs_io_request *rreq)
  24. {
  25. struct netfs_io_subrequest *subreq;
  26. struct netfs_io_stream *stream = &rreq->io_streams[0];
  27. struct list_head *next;
  28. _enter("R=%x", rreq->debug_id);
  29. if (list_empty(&stream->subrequests))
  30. return;
  31. if (rreq->netfs_ops->retry_request)
  32. rreq->netfs_ops->retry_request(rreq, NULL);
  33. /* If there's no renegotiation to do, just resend each retryable subreq
  34. * up to the first permanently failed one.
  35. */
  36. if (!rreq->netfs_ops->prepare_read &&
  37. !rreq->cache_resources.ops) {
  38. list_for_each_entry(subreq, &stream->subrequests, rreq_link) {
  39. if (test_bit(NETFS_SREQ_FAILED, &subreq->flags))
  40. break;
  41. if (__test_and_clear_bit(NETFS_SREQ_NEED_RETRY, &subreq->flags)) {
  42. __clear_bit(NETFS_SREQ_MADE_PROGRESS, &subreq->flags);
  43. subreq->retry_count++;
  44. netfs_reset_iter(subreq);
  45. netfs_get_subrequest(subreq, netfs_sreq_trace_get_resubmit);
  46. netfs_reissue_read(rreq, subreq);
  47. }
  48. }
  49. return;
  50. }
  51. /* Okay, we need to renegotiate all the download requests and flip any
  52. * failed cache reads over to being download requests and negotiate
  53. * those also. All fully successful subreqs have been removed from the
  54. * list and any spare data from those has been donated.
  55. *
  56. * What we do is decant the list and rebuild it one subreq at a time so
  57. * that we don't end up with donations jumping over a gap we're busy
  58. * populating with smaller subrequests. In the event that the subreq
  59. * we just launched finishes before we insert the next subreq, it'll
  60. * fill in rreq->prev_donated instead.
  61. *
  62. * Note: Alternatively, we could split the tail subrequest right before
  63. * we reissue it and fix up the donations under lock.
  64. */
  65. next = stream->subrequests.next;
  66. do {
  67. struct netfs_io_subrequest *from, *to, *tmp;
  68. struct iov_iter source;
  69. unsigned long long start, len;
  70. size_t part;
  71. bool boundary = false, subreq_superfluous = false;
  72. /* Go through the subreqs and find the next span of contiguous
  73. * buffer that we then rejig (cifs, for example, needs the
  74. * rsize renegotiating) and reissue.
  75. */
  76. from = list_entry(next, struct netfs_io_subrequest, rreq_link);
  77. to = from;
  78. start = from->start + from->transferred;
  79. len = from->len - from->transferred;
  80. _debug("from R=%08x[%x] s=%llx ctl=%zx/%zx",
  81. rreq->debug_id, from->debug_index,
  82. from->start, from->transferred, from->len);
  83. if (test_bit(NETFS_SREQ_FAILED, &from->flags) ||
  84. !test_bit(NETFS_SREQ_NEED_RETRY, &from->flags)) {
  85. subreq = from;
  86. goto abandon;
  87. }
  88. list_for_each_continue(next, &stream->subrequests) {
  89. subreq = list_entry(next, struct netfs_io_subrequest, rreq_link);
  90. if (subreq->start + subreq->transferred != start + len ||
  91. test_bit(NETFS_SREQ_BOUNDARY, &subreq->flags) ||
  92. !test_bit(NETFS_SREQ_NEED_RETRY, &subreq->flags))
  93. break;
  94. to = subreq;
  95. len += to->len;
  96. }
  97. _debug(" - range: %llx-%llx %llx", start, start + len - 1, len);
  98. /* Determine the set of buffers we're going to use. Each
  99. * subreq gets a subset of a single overall contiguous buffer.
  100. */
  101. netfs_reset_iter(from);
  102. source = from->io_iter;
  103. source.count = len;
  104. /* Work through the sublist. */
  105. subreq = from;
  106. list_for_each_entry_from(subreq, &stream->subrequests, rreq_link) {
  107. if (!len) {
  108. subreq_superfluous = true;
  109. break;
  110. }
  111. subreq->source = NETFS_DOWNLOAD_FROM_SERVER;
  112. subreq->start = start - subreq->transferred;
  113. subreq->len = len + subreq->transferred;
  114. __clear_bit(NETFS_SREQ_NEED_RETRY, &subreq->flags);
  115. __clear_bit(NETFS_SREQ_MADE_PROGRESS, &subreq->flags);
  116. subreq->retry_count++;
  117. trace_netfs_sreq(subreq, netfs_sreq_trace_retry);
  118. /* Renegotiate max_len (rsize) */
  119. stream->sreq_max_len = subreq->len;
  120. if (rreq->netfs_ops->prepare_read &&
  121. rreq->netfs_ops->prepare_read(subreq) < 0) {
  122. trace_netfs_sreq(subreq, netfs_sreq_trace_reprep_failed);
  123. __set_bit(NETFS_SREQ_FAILED, &subreq->flags);
  124. goto abandon;
  125. }
  126. part = umin(len, stream->sreq_max_len);
  127. if (unlikely(stream->sreq_max_segs))
  128. part = netfs_limit_iter(&source, 0, part, stream->sreq_max_segs);
  129. subreq->len = subreq->transferred + part;
  130. subreq->io_iter = source;
  131. iov_iter_truncate(&subreq->io_iter, part);
  132. iov_iter_advance(&source, part);
  133. len -= part;
  134. start += part;
  135. if (!len) {
  136. if (boundary)
  137. __set_bit(NETFS_SREQ_BOUNDARY, &subreq->flags);
  138. } else {
  139. __clear_bit(NETFS_SREQ_BOUNDARY, &subreq->flags);
  140. }
  141. netfs_get_subrequest(subreq, netfs_sreq_trace_get_resubmit);
  142. netfs_reissue_read(rreq, subreq);
  143. if (subreq == to) {
  144. subreq_superfluous = false;
  145. break;
  146. }
  147. }
  148. /* If we managed to use fewer subreqs, we can discard the
  149. * excess; if we used the same number, then we're done.
  150. */
  151. if (!len) {
  152. if (!subreq_superfluous)
  153. continue;
  154. list_for_each_entry_safe_from(subreq, tmp,
  155. &stream->subrequests, rreq_link) {
  156. trace_netfs_sreq(subreq, netfs_sreq_trace_superfluous);
  157. list_del(&subreq->rreq_link);
  158. netfs_put_subrequest(subreq, netfs_sreq_trace_put_done);
  159. if (subreq == to)
  160. break;
  161. }
  162. subreq = NULL;
  163. continue;
  164. }
  165. /* We ran out of subrequests, so we need to allocate some more
  166. * and insert them after.
  167. */
  168. do {
  169. subreq = netfs_alloc_subrequest(rreq);
  170. if (!subreq) {
  171. subreq = to;
  172. goto abandon_after;
  173. }
  174. subreq->source = NETFS_DOWNLOAD_FROM_SERVER;
  175. subreq->start = start;
  176. subreq->len = len;
  177. subreq->stream_nr = stream->stream_nr;
  178. subreq->retry_count = 1;
  179. trace_netfs_sreq_ref(rreq->debug_id, subreq->debug_index,
  180. refcount_read(&subreq->ref),
  181. netfs_sreq_trace_new);
  182. list_add(&subreq->rreq_link, &to->rreq_link);
  183. to = list_next_entry(to, rreq_link);
  184. trace_netfs_sreq(subreq, netfs_sreq_trace_retry);
  185. stream->sreq_max_len = umin(len, rreq->rsize);
  186. stream->sreq_max_segs = 0;
  187. if (unlikely(stream->sreq_max_segs))
  188. part = netfs_limit_iter(&source, 0, part, stream->sreq_max_segs);
  189. netfs_stat(&netfs_n_rh_download);
  190. if (rreq->netfs_ops->prepare_read(subreq) < 0) {
  191. trace_netfs_sreq(subreq, netfs_sreq_trace_reprep_failed);
  192. __set_bit(NETFS_SREQ_FAILED, &subreq->flags);
  193. goto abandon;
  194. }
  195. part = umin(len, stream->sreq_max_len);
  196. subreq->len = subreq->transferred + part;
  197. subreq->io_iter = source;
  198. iov_iter_truncate(&subreq->io_iter, part);
  199. iov_iter_advance(&source, part);
  200. len -= part;
  201. start += part;
  202. if (!len && boundary) {
  203. __set_bit(NETFS_SREQ_BOUNDARY, &to->flags);
  204. boundary = false;
  205. }
  206. netfs_reissue_read(rreq, subreq);
  207. } while (len);
  208. } while (!list_is_head(next, &stream->subrequests));
  209. return;
  210. /* If we hit an error, fail all remaining incomplete subrequests */
  211. abandon_after:
  212. if (list_is_last(&subreq->rreq_link, &stream->subrequests))
  213. return;
  214. subreq = list_next_entry(subreq, rreq_link);
  215. abandon:
  216. list_for_each_entry_from(subreq, &stream->subrequests, rreq_link) {
  217. if (!test_bit(NETFS_SREQ_FAILED, &subreq->flags) &&
  218. !test_bit(NETFS_SREQ_NEED_RETRY, &subreq->flags))
  219. continue;
  220. subreq->error = -ENOMEM;
  221. __set_bit(NETFS_SREQ_FAILED, &subreq->flags);
  222. __clear_bit(NETFS_SREQ_NEED_RETRY, &subreq->flags);
  223. }
  224. }
  225. /*
  226. * Retry reads.
  227. */
  228. void netfs_retry_reads(struct netfs_io_request *rreq)
  229. {
  230. struct netfs_io_stream *stream = &rreq->io_streams[0];
  231. netfs_stat(&netfs_n_rh_retry_read_req);
  232. /* Wait for all outstanding I/O to quiesce before performing retries as
  233. * we may need to renegotiate the I/O sizes.
  234. */
  235. set_bit(NETFS_RREQ_RETRYING, &rreq->flags);
  236. netfs_wait_for_in_progress_stream(rreq, stream);
  237. clear_bit(NETFS_RREQ_RETRYING, &rreq->flags);
  238. trace_netfs_rreq(rreq, netfs_rreq_trace_resubmit);
  239. netfs_retry_read_subrequests(rreq);
  240. }
  241. /*
  242. * Unlock any the pages that haven't been unlocked yet due to abandoned
  243. * subrequests.
  244. */
  245. void netfs_unlock_abandoned_read_pages(struct netfs_io_request *rreq)
  246. {
  247. struct folio_queue *p;
  248. for (p = rreq->buffer.tail; p; p = p->next) {
  249. for (int slot = 0; slot < folioq_count(p); slot++) {
  250. struct folio *folio = folioq_folio(p, slot);
  251. if (folio && !folioq_is_marked2(p, slot)) {
  252. trace_netfs_folio(folio, netfs_folio_trace_abandon);
  253. folio_unlock(folio);
  254. }
  255. }
  256. }
  257. }