backing-file.c 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Common helpers for stackable filesystems and backing files.
  4. *
  5. * Forked from fs/overlayfs/file.c.
  6. *
  7. * Copyright (C) 2017 Red Hat, Inc.
  8. * Copyright (C) 2023 CTERA Networks.
  9. */
  10. #include <linux/fs.h>
  11. #include <linux/backing-file.h>
  12. #include <linux/splice.h>
  13. #include <linux/mm.h>
  14. #include "internal.h"
  15. /**
  16. * backing_file_open - open a backing file for kernel internal use
  17. * @user_path: path that the user reuqested to open
  18. * @flags: open flags
  19. * @real_path: path of the backing file
  20. * @cred: credentials for open
  21. *
  22. * Open a backing file for a stackable filesystem (e.g., overlayfs).
  23. * @user_path may be on the stackable filesystem and @real_path on the
  24. * underlying filesystem. In this case, we want to be able to return the
  25. * @user_path of the stackable filesystem. This is done by embedding the
  26. * returned file into a container structure that also stores the stacked
  27. * file's path, which can be retrieved using backing_file_user_path().
  28. */
  29. struct file *backing_file_open(const struct path *user_path, int flags,
  30. const struct path *real_path,
  31. const struct cred *cred)
  32. {
  33. struct file *f;
  34. int error;
  35. f = alloc_empty_backing_file(flags, cred);
  36. if (IS_ERR(f))
  37. return f;
  38. path_get(user_path);
  39. backing_file_set_user_path(f, user_path);
  40. error = vfs_open(real_path, f);
  41. if (error) {
  42. fput(f);
  43. f = ERR_PTR(error);
  44. }
  45. return f;
  46. }
  47. EXPORT_SYMBOL_GPL(backing_file_open);
  48. struct file *backing_tmpfile_open(const struct path *user_path, int flags,
  49. const struct path *real_parentpath,
  50. umode_t mode, const struct cred *cred)
  51. {
  52. struct mnt_idmap *real_idmap = mnt_idmap(real_parentpath->mnt);
  53. struct file *f;
  54. int error;
  55. f = alloc_empty_backing_file(flags, cred);
  56. if (IS_ERR(f))
  57. return f;
  58. path_get(user_path);
  59. backing_file_set_user_path(f, user_path);
  60. error = vfs_tmpfile(real_idmap, real_parentpath, f, mode);
  61. if (error) {
  62. fput(f);
  63. f = ERR_PTR(error);
  64. }
  65. return f;
  66. }
  67. EXPORT_SYMBOL(backing_tmpfile_open);
  68. struct backing_aio {
  69. struct kiocb iocb;
  70. refcount_t ref;
  71. struct kiocb *orig_iocb;
  72. /* used for aio completion */
  73. void (*end_write)(struct kiocb *iocb, ssize_t);
  74. struct work_struct work;
  75. long res;
  76. };
  77. static struct kmem_cache *backing_aio_cachep;
  78. #define BACKING_IOCB_MASK \
  79. (IOCB_NOWAIT | IOCB_HIPRI | IOCB_DSYNC | IOCB_SYNC | IOCB_APPEND)
  80. static rwf_t iocb_to_rw_flags(int flags)
  81. {
  82. return (__force rwf_t)(flags & BACKING_IOCB_MASK);
  83. }
  84. static void backing_aio_put(struct backing_aio *aio)
  85. {
  86. if (refcount_dec_and_test(&aio->ref)) {
  87. fput(aio->iocb.ki_filp);
  88. kmem_cache_free(backing_aio_cachep, aio);
  89. }
  90. }
  91. static void backing_aio_cleanup(struct backing_aio *aio, long res)
  92. {
  93. struct kiocb *iocb = &aio->iocb;
  94. struct kiocb *orig_iocb = aio->orig_iocb;
  95. orig_iocb->ki_pos = iocb->ki_pos;
  96. if (aio->end_write)
  97. aio->end_write(orig_iocb, res);
  98. backing_aio_put(aio);
  99. }
  100. static void backing_aio_rw_complete(struct kiocb *iocb, long res)
  101. {
  102. struct backing_aio *aio = container_of(iocb, struct backing_aio, iocb);
  103. struct kiocb *orig_iocb = aio->orig_iocb;
  104. if (iocb->ki_flags & IOCB_WRITE)
  105. kiocb_end_write(iocb);
  106. backing_aio_cleanup(aio, res);
  107. orig_iocb->ki_complete(orig_iocb, res);
  108. }
  109. static void backing_aio_complete_work(struct work_struct *work)
  110. {
  111. struct backing_aio *aio = container_of(work, struct backing_aio, work);
  112. backing_aio_rw_complete(&aio->iocb, aio->res);
  113. }
  114. static void backing_aio_queue_completion(struct kiocb *iocb, long res)
  115. {
  116. struct backing_aio *aio = container_of(iocb, struct backing_aio, iocb);
  117. /*
  118. * Punt to a work queue to serialize updates of mtime/size.
  119. */
  120. aio->res = res;
  121. INIT_WORK(&aio->work, backing_aio_complete_work);
  122. queue_work(file_inode(aio->orig_iocb->ki_filp)->i_sb->s_dio_done_wq,
  123. &aio->work);
  124. }
  125. static int backing_aio_init_wq(struct kiocb *iocb)
  126. {
  127. struct super_block *sb = file_inode(iocb->ki_filp)->i_sb;
  128. if (sb->s_dio_done_wq)
  129. return 0;
  130. return sb_init_dio_done_wq(sb);
  131. }
  132. static int do_backing_file_read_iter(struct file *file, struct iov_iter *iter,
  133. struct kiocb *iocb, int flags)
  134. {
  135. struct backing_aio *aio = NULL;
  136. int ret;
  137. if (is_sync_kiocb(iocb)) {
  138. rwf_t rwf = iocb_to_rw_flags(flags);
  139. return vfs_iter_read(file, iter, &iocb->ki_pos, rwf);
  140. }
  141. aio = kmem_cache_zalloc(backing_aio_cachep, GFP_KERNEL);
  142. if (!aio)
  143. return -ENOMEM;
  144. aio->orig_iocb = iocb;
  145. kiocb_clone(&aio->iocb, iocb, get_file(file));
  146. aio->iocb.ki_complete = backing_aio_rw_complete;
  147. refcount_set(&aio->ref, 2);
  148. ret = vfs_iocb_iter_read(file, &aio->iocb, iter);
  149. backing_aio_put(aio);
  150. if (ret != -EIOCBQUEUED)
  151. backing_aio_cleanup(aio, ret);
  152. return ret;
  153. }
  154. ssize_t backing_file_read_iter(struct file *file, struct iov_iter *iter,
  155. struct kiocb *iocb, int flags,
  156. struct backing_file_ctx *ctx)
  157. {
  158. ssize_t ret;
  159. if (WARN_ON_ONCE(!(file->f_mode & FMODE_BACKING)))
  160. return -EIO;
  161. if (!iov_iter_count(iter))
  162. return 0;
  163. if (iocb->ki_flags & IOCB_DIRECT &&
  164. !(file->f_mode & FMODE_CAN_ODIRECT))
  165. return -EINVAL;
  166. scoped_with_creds(ctx->cred)
  167. ret = do_backing_file_read_iter(file, iter, iocb, flags);
  168. if (ctx->accessed)
  169. ctx->accessed(iocb->ki_filp);
  170. return ret;
  171. }
  172. EXPORT_SYMBOL_GPL(backing_file_read_iter);
  173. static int do_backing_file_write_iter(struct file *file, struct iov_iter *iter,
  174. struct kiocb *iocb, int flags,
  175. void (*end_write)(struct kiocb *, ssize_t))
  176. {
  177. struct backing_aio *aio;
  178. int ret;
  179. if (is_sync_kiocb(iocb)) {
  180. rwf_t rwf = iocb_to_rw_flags(flags);
  181. ret = vfs_iter_write(file, iter, &iocb->ki_pos, rwf);
  182. if (end_write)
  183. end_write(iocb, ret);
  184. return ret;
  185. }
  186. ret = backing_aio_init_wq(iocb);
  187. if (ret)
  188. return ret;
  189. aio = kmem_cache_zalloc(backing_aio_cachep, GFP_KERNEL);
  190. if (!aio)
  191. return -ENOMEM;
  192. aio->orig_iocb = iocb;
  193. aio->end_write = end_write;
  194. kiocb_clone(&aio->iocb, iocb, get_file(file));
  195. aio->iocb.ki_flags = flags;
  196. aio->iocb.ki_complete = backing_aio_queue_completion;
  197. refcount_set(&aio->ref, 2);
  198. ret = vfs_iocb_iter_write(file, &aio->iocb, iter);
  199. backing_aio_put(aio);
  200. if (ret != -EIOCBQUEUED)
  201. backing_aio_cleanup(aio, ret);
  202. return ret;
  203. }
  204. ssize_t backing_file_write_iter(struct file *file, struct iov_iter *iter,
  205. struct kiocb *iocb, int flags,
  206. struct backing_file_ctx *ctx)
  207. {
  208. ssize_t ret;
  209. if (WARN_ON_ONCE(!(file->f_mode & FMODE_BACKING)))
  210. return -EIO;
  211. if (!iov_iter_count(iter))
  212. return 0;
  213. ret = file_remove_privs(iocb->ki_filp);
  214. if (ret)
  215. return ret;
  216. if (iocb->ki_flags & IOCB_DIRECT &&
  217. !(file->f_mode & FMODE_CAN_ODIRECT))
  218. return -EINVAL;
  219. scoped_with_creds(ctx->cred)
  220. return do_backing_file_write_iter(file, iter, iocb, flags, ctx->end_write);
  221. }
  222. EXPORT_SYMBOL_GPL(backing_file_write_iter);
  223. ssize_t backing_file_splice_read(struct file *in, struct kiocb *iocb,
  224. struct pipe_inode_info *pipe, size_t len,
  225. unsigned int flags,
  226. struct backing_file_ctx *ctx)
  227. {
  228. ssize_t ret;
  229. if (WARN_ON_ONCE(!(in->f_mode & FMODE_BACKING)))
  230. return -EIO;
  231. scoped_with_creds(ctx->cred)
  232. ret = vfs_splice_read(in, &iocb->ki_pos, pipe, len, flags);
  233. if (ctx->accessed)
  234. ctx->accessed(iocb->ki_filp);
  235. return ret;
  236. }
  237. EXPORT_SYMBOL_GPL(backing_file_splice_read);
  238. ssize_t backing_file_splice_write(struct pipe_inode_info *pipe,
  239. struct file *out, struct kiocb *iocb,
  240. size_t len, unsigned int flags,
  241. struct backing_file_ctx *ctx)
  242. {
  243. ssize_t ret;
  244. if (WARN_ON_ONCE(!(out->f_mode & FMODE_BACKING)))
  245. return -EIO;
  246. if (!out->f_op->splice_write)
  247. return -EINVAL;
  248. ret = file_remove_privs(iocb->ki_filp);
  249. if (ret)
  250. return ret;
  251. scoped_with_creds(ctx->cred) {
  252. file_start_write(out);
  253. ret = out->f_op->splice_write(pipe, out, &iocb->ki_pos, len, flags);
  254. file_end_write(out);
  255. }
  256. if (ctx->end_write)
  257. ctx->end_write(iocb, ret);
  258. return ret;
  259. }
  260. EXPORT_SYMBOL_GPL(backing_file_splice_write);
  261. int backing_file_mmap(struct file *file, struct vm_area_struct *vma,
  262. struct backing_file_ctx *ctx)
  263. {
  264. struct file *user_file = vma->vm_file;
  265. int ret;
  266. if (WARN_ON_ONCE(!(file->f_mode & FMODE_BACKING)))
  267. return -EIO;
  268. if (!can_mmap_file(file))
  269. return -ENODEV;
  270. vma_set_file(vma, file);
  271. scoped_with_creds(ctx->cred)
  272. ret = vfs_mmap(vma->vm_file, vma);
  273. if (ctx->accessed)
  274. ctx->accessed(user_file);
  275. return ret;
  276. }
  277. EXPORT_SYMBOL_GPL(backing_file_mmap);
  278. static int __init backing_aio_init(void)
  279. {
  280. backing_aio_cachep = KMEM_CACHE(backing_aio, SLAB_HWCACHE_ALIGN);
  281. if (!backing_aio_cachep)
  282. return -ENOMEM;
  283. return 0;
  284. }
  285. fs_initcall(backing_aio_init);