extents_status.h 7.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * fs/ext4/extents_status.h
  4. *
  5. * Written by Yongqiang Yang <xiaoqiangnk@gmail.com>
  6. * Modified by
  7. * Allison Henderson <achender@linux.vnet.ibm.com>
  8. * Zheng Liu <wenqing.lz@taobao.com>
  9. *
  10. */
  11. #ifndef _EXT4_EXTENTS_STATUS_H
  12. #define _EXT4_EXTENTS_STATUS_H
  /*
   * Extent status debugging output.  es_debug() forwards its arguments to
   * printk() when ES_DEBUG__ is defined; otherwise it expands to
   * no_printk() with the same arguments.
   */
  #ifndef ES_DEBUG__
  #define es_debug(fmt, ...)      no_printk(fmt, ##__VA_ARGS__)
  #else
  #define es_debug(fmt, ...)      printk(fmt, ##__VA_ARGS__)
  #endif

  /*
   * With ES_AGGRESSIVE_TEST defined, the result of es caching will be
   * checked with old map_block's result.
   *
   * NOTE(review): the name defined below ends in "__", so it is not the
   * same identifier as ES_AGGRESSIVE_TEST; presumably that keeps the
   * checks switched off by default -- confirm against the macro's users.
   */
  #define ES_AGGRESSIVE_TEST__
  /*
   * Bit positions of the status flags that live in the high bits of
   * extent_status.es_pblk.  ES_FLAGS comes last, so it equals the number
   * of flag bits.
   */
  enum {
          ES_WRITTEN_B = 0,       /* bit for EXTENT_STATUS_WRITTEN */
          ES_UNWRITTEN_B,         /* bit for EXTENT_STATUS_UNWRITTEN */
          ES_DELAYED_B,           /* bit for EXTENT_STATUS_DELAYED */
          ES_HOLE_B,              /* bit for EXTENT_STATUS_HOLE */
          ES_REFERENCED_B,        /* bit for EXTENT_STATUS_REFERENCED */
          ES_FLAGS                /* count of the flag bits above */
  };
  /*
   * ES_SHIFT is the bit offset at which the status flags start inside an
   * ext4_fsblk_t; ES_MASK selects those top ES_FLAGS bits.
   */
  #define ES_SHIFT        (8 * sizeof(ext4_fsblk_t) - ES_FLAGS)
  #define ES_MASK         ((~(ext4_fsblk_t)0) << ES_SHIFT)
  /*
   * Status masks, one bit each, derived from the ES_*_B bit positions.
   * Besides EXTENT_STATUS_REFERENCED, all these extent type masks are
   * exclusive: only one type can be set at a time.
   */
  #define EXTENT_STATUS_WRITTEN           (1 << ES_WRITTEN_B)
  #define EXTENT_STATUS_UNWRITTEN         (1 << ES_UNWRITTEN_B)
  #define EXTENT_STATUS_DELAYED           (1 << ES_DELAYED_B)
  #define EXTENT_STATUS_HOLE              (1 << ES_HOLE_B)
  #define EXTENT_STATUS_REFERENCED        (1 << ES_REFERENCED_B)
  /* All four extent type bits; EXTENT_STATUS_REFERENCED is not included. */
  #define ES_TYPE_MASK \
          ((ext4_fsblk_t)(EXTENT_STATUS_WRITTEN | EXTENT_STATUS_UNWRITTEN | \
                          EXTENT_STATUS_DELAYED | EXTENT_STATUS_HOLE))

  /*
   * Non-zero when exactly one bit is set in @type.  @type is evaluated
   * more than once, so it must not have side effects.
   */
  #define ES_TYPE_VALID(type) \
          ((type) != 0 && ((type) & ((type) - 1)) == 0)
  /* Forward declarations; these types are not defined in this header. */
  struct ext4_extent;
  struct ext4_sb_info;
  55. struct extent_status {
  56. struct rb_node rb_node;
  57. ext4_lblk_t es_lblk; /* first logical block extent covers */
  58. ext4_lblk_t es_len; /* length of extent in block */
  59. ext4_fsblk_t es_pblk; /* first physical block */
  60. };
  61. struct ext4_es_tree {
  62. struct rb_root root;
  63. struct extent_status *cache_es; /* recently accessed extent */
  64. };
  65. struct ext4_es_stats {
  66. unsigned long es_stats_shrunk;
  67. struct percpu_counter es_stats_cache_hits;
  68. struct percpu_counter es_stats_cache_misses;
  69. u64 es_stats_scan_time;
  70. u64 es_stats_max_scan_time;
  71. struct percpu_counter es_stats_all_cnt;
  72. struct percpu_counter es_stats_shk_cnt;
  73. };
  /*
   * Pending cluster reservations for bigalloc file systems
   *
   * A cluster with a pending reservation is a logical cluster shared by at
   * least one extent in the extents status tree with delayed and unwritten
   * status and at least one other written or unwritten extent.  The
   * reservation is said to be pending because a cluster reservation would
   * have to be taken in the event all blocks in the cluster shared with
   * written or unwritten extents were deleted while the delayed and
   * unwritten blocks remained.
   *
   * The set of pending cluster reservations is an auxiliary data structure
   * used with the extents status tree to implement reserved cluster/block
   * accounting for bigalloc file systems.  The set is kept in memory and
   * records all pending cluster reservations.
   *
   * Its primary function is to avoid the need to read extents from the
   * disk when invalidating pages as a result of a truncate, punch hole, or
   * collapse range operation.  Page invalidation requires a decrease in the
   * reserved cluster count if it results in the removal of all delayed
   * and unwritten extents (blocks) from a cluster that is not shared with a
   * written or unwritten extent, and no decrease otherwise.  Determining
   * whether the cluster is shared can be done by searching for a pending
   * reservation on it.
   *
   * Secondarily, it provides a potentially faster method for determining
   * whether the reserved cluster count should be increased when a physical
   * cluster is deallocated as a result of a truncate, punch hole, or
   * collapse range operation.  The necessary information is also present
   * in the extents status tree, but might be more rapidly accessed in
   * the pending reservation set in many cases due to smaller size.
   *
   * The pending cluster reservation set is implemented as a red-black tree
   * with the goal of minimizing per-page search time overhead.
   */
  109. struct pending_reservation {
  110. struct rb_node rb_node;
  111. ext4_lblk_t lclu;
  112. };
  113. struct ext4_pending_tree {
  114. struct rb_root root;
  115. };
  116. extern int __init ext4_init_es(void);
  117. extern void ext4_exit_es(void);
  118. extern void ext4_es_init_tree(struct ext4_es_tree *tree);
  119. extern void ext4_es_insert_extent(struct inode *inode, ext4_lblk_t lblk,
  120. ext4_lblk_t len, ext4_fsblk_t pblk,
  121. unsigned int status,
  122. bool delalloc_reserve_used);
  123. extern void ext4_es_cache_extent(struct inode *inode, ext4_lblk_t lblk,
  124. ext4_lblk_t len, ext4_fsblk_t pblk,
  125. unsigned int status);
  126. extern void ext4_es_remove_extent(struct inode *inode, ext4_lblk_t lblk,
  127. ext4_lblk_t len);
  128. extern void ext4_es_find_extent_range(struct inode *inode,
  129. int (*match_fn)(struct extent_status *es),
  130. ext4_lblk_t lblk, ext4_lblk_t end,
  131. struct extent_status *es);
  132. extern int ext4_es_lookup_extent(struct inode *inode, ext4_lblk_t lblk,
  133. ext4_lblk_t *next_lblk,
  134. struct extent_status *es, u64 *pseq);
  135. extern bool ext4_es_scan_range(struct inode *inode,
  136. int (*matching_fn)(struct extent_status *es),
  137. ext4_lblk_t lblk, ext4_lblk_t end);
  138. extern bool ext4_es_scan_clu(struct inode *inode,
  139. int (*matching_fn)(struct extent_status *es),
  140. ext4_lblk_t lblk);
  141. static inline unsigned int ext4_es_status(struct extent_status *es)
  142. {
  143. return es->es_pblk >> ES_SHIFT;
  144. }
  145. static inline unsigned int ext4_es_type(struct extent_status *es)
  146. {
  147. return (es->es_pblk >> ES_SHIFT) & ES_TYPE_MASK;
  148. }
  149. static inline int ext4_es_is_written(struct extent_status *es)
  150. {
  151. return (ext4_es_type(es) & EXTENT_STATUS_WRITTEN) != 0;
  152. }
  153. static inline int ext4_es_is_unwritten(struct extent_status *es)
  154. {
  155. return (ext4_es_type(es) & EXTENT_STATUS_UNWRITTEN) != 0;
  156. }
  157. static inline int ext4_es_is_delayed(struct extent_status *es)
  158. {
  159. return (ext4_es_type(es) & EXTENT_STATUS_DELAYED) != 0;
  160. }
  161. static inline int ext4_es_is_hole(struct extent_status *es)
  162. {
  163. return (ext4_es_type(es) & EXTENT_STATUS_HOLE) != 0;
  164. }
  /* Return 1 if @es is either written or unwritten, else 0. */
  static inline int ext4_es_is_mapped(struct extent_status *es)
  {
          if (ext4_es_is_written(es))
                  return 1;

          return ext4_es_is_unwritten(es);
  }
  169. static inline void ext4_es_set_referenced(struct extent_status *es)
  170. {
  171. es->es_pblk |= ((ext4_fsblk_t)EXTENT_STATUS_REFERENCED) << ES_SHIFT;
  172. }
  173. static inline void ext4_es_clear_referenced(struct extent_status *es)
  174. {
  175. es->es_pblk &= ~(((ext4_fsblk_t)EXTENT_STATUS_REFERENCED) << ES_SHIFT);
  176. }
  177. static inline int ext4_es_is_referenced(struct extent_status *es)
  178. {
  179. return (ext4_es_status(es) & EXTENT_STATUS_REFERENCED) != 0;
  180. }
  181. static inline ext4_fsblk_t ext4_es_pblock(struct extent_status *es)
  182. {
  183. return es->es_pblk & ~ES_MASK;
  184. }
  185. static inline ext4_fsblk_t ext4_es_show_pblock(struct extent_status *es)
  186. {
  187. ext4_fsblk_t pblock = ext4_es_pblock(es);
  188. return pblock == ~ES_MASK ? 0 : pblock;
  189. }
  190. static inline void ext4_es_store_pblock(struct extent_status *es,
  191. ext4_fsblk_t pb)
  192. {
  193. ext4_fsblk_t block;
  194. block = (pb & ~ES_MASK) | (es->es_pblk & ES_MASK);
  195. es->es_pblk = block;
  196. }
  197. static inline void ext4_es_store_pblock_status(struct extent_status *es,
  198. ext4_fsblk_t pb,
  199. unsigned int status)
  200. {
  201. WARN_ON_ONCE(!ES_TYPE_VALID(status & ES_TYPE_MASK));
  202. es->es_pblk = (((ext4_fsblk_t)status << ES_SHIFT) & ES_MASK) |
  203. (pb & ~ES_MASK);
  204. }
  /* Shrinker hooks; declarations only, defined outside this header. */
  int ext4_es_register_shrinker(struct ext4_sb_info *sbi);
  void ext4_es_unregister_shrinker(struct ext4_sb_info *sbi);
  int ext4_seq_es_shrinker_info_show(struct seq_file *seq, void *v);
  208. extern int __init ext4_init_pending(void);
  209. extern void ext4_exit_pending(void);
  210. extern void ext4_init_pending_tree(struct ext4_pending_tree *tree);
  211. extern void ext4_remove_pending(struct inode *inode, ext4_lblk_t lblk);
  212. extern bool ext4_is_pending(struct inode *inode, ext4_lblk_t lblk);
  213. extern void ext4_es_insert_delayed_extent(struct inode *inode, ext4_lblk_t lblk,
  214. ext4_lblk_t len, bool lclu_allocated,
  215. bool end_allocated);
  216. extern void ext4_clear_inode_es(struct inode *inode);
  217. #endif /* _EXT4_EXTENTS_STATUS_H */