1  // SPDX-License-Identifier: GPL-2.0
2  /*
3   *  fs/ext4/extents_status.h
4   *
5   * Written by Yongqiang Yang <xiaoqiangnk@gmail.com>
6   * Modified by
7   *	Allison Henderson <achender@linux.vnet.ibm.com>
8   *	Zheng Liu <wenqing.lz@taobao.com>
9   *
10   */
11  
12  #ifndef _EXT4_EXTENTS_STATUS_H
13  #define _EXT4_EXTENTS_STATUS_H
14  
/*
 * es_debug() - trace extent status operations.
 *
 * Define ES_DEBUG__ to route these messages to printk(); without it they
 * are handed to no_printk() instead.
 */
#ifndef ES_DEBUG__
#define es_debug(fmt, ...)	no_printk(fmt, ##__VA_ARGS__)
#else
#define es_debug(fmt, ...)	printk(fmt, ##__VA_ARGS__)
#endif
23  
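/*
 * With ES_AGGRESSIVE_TEST defined, the result of es caching will be
 * checked against the old map_block's result.
 *
 * Note that the macro defined below is ES_AGGRESSIVE_TEST__ (with two
 * trailing underscores), which does not define ES_AGGRESSIVE_TEST.
 * NOTE(review): presumably the underscores are the "off" switch and must
 * be removed to enable the checks - confirm against the #ifdef users.
 */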
28  #define ES_AGGRESSIVE_TEST__
29  
/*
 * Bit numbers of the status flags that live in the high bits of
 * extent_status.es_pblk.
 */
enum {
	ES_WRITTEN_B = 0,
	ES_UNWRITTEN_B,
	ES_DELAYED_B,
	ES_HOLE_B,
	ES_REFERENCED_B,
	ES_FLAGS	/* number of flag bits, not a flag; keep last */
};
41  
/*
 * The ES_FLAGS status bits sit at the very top of an ext4_fsblk_t:
 * ES_SHIFT is the position of the lowest status bit, ES_MASK selects
 * all of the status bits (and ~ES_MASK everything below them).
 */
#define ES_SHIFT	(8 * sizeof(ext4_fsblk_t) - ES_FLAGS)
#define ES_MASK		((~(ext4_fsblk_t)0) << ES_SHIFT)
44  
/*
 * Status masks, expressed relative to bit 0 (i.e. not yet shifted up by
 * ES_SHIFT).
 *
 * WRITTEN, UNWRITTEN, DELAYED and HOLE are extent types and are mutually
 * exclusive: only one of them can be set at a time.  REFERENCED is the
 * exception and may accompany any type.
 */
#define EXTENT_STATUS_WRITTEN		(1 << ES_WRITTEN_B)
#define EXTENT_STATUS_UNWRITTEN		(1 << ES_UNWRITTEN_B)
#define EXTENT_STATUS_DELAYED		(1 << ES_DELAYED_B)
#define EXTENT_STATUS_HOLE		(1 << ES_HOLE_B)
#define EXTENT_STATUS_REFERENCED	(1 << ES_REFERENCED_B)

/* All extent type bits; deliberately leaves out EXTENT_STATUS_REFERENCED. */
#define ES_TYPE_MASK \
	((ext4_fsblk_t)(EXTENT_STATUS_WRITTEN | \
			EXTENT_STATUS_UNWRITTEN | \
			EXTENT_STATUS_DELAYED | \
			EXTENT_STATUS_HOLE))
59  
/*
 * True when exactly one bit of @type is set.  @type is evaluated more
 * than once, so do not pass an expression with side effects.
 */
#define ES_TYPE_VALID(type) \
	(((type) != 0) && (((type) & ((type) - 1)) == 0))
61  
62  struct ext4_sb_info;
63  struct ext4_extent;
64  
65  struct extent_status {
66  	struct rb_node rb_node;
67  	ext4_lblk_t es_lblk;	/* first logical block extent covers */
68  	ext4_lblk_t es_len;	/* length of extent in block */
69  	ext4_fsblk_t es_pblk;	/* first physical block */
70  };
71  
72  struct ext4_es_tree {
73  	struct rb_root root;
74  	struct extent_status *cache_es;	/* recently accessed extent */
75  };
76  
77  struct ext4_es_stats {
78  	unsigned long es_stats_shrunk;
79  	struct percpu_counter es_stats_cache_hits;
80  	struct percpu_counter es_stats_cache_misses;
81  	u64 es_stats_scan_time;
82  	u64 es_stats_max_scan_time;
83  	struct percpu_counter es_stats_all_cnt;
84  	struct percpu_counter es_stats_shk_cnt;
85  };
86  
87  /*
88   * Pending cluster reservations for bigalloc file systems
89   *
90   * A cluster with a pending reservation is a logical cluster shared by at
91   * least one extent in the extents status tree with delayed and unwritten
92   * status and at least one other written or unwritten extent.  The
93   * reservation is said to be pending because a cluster reservation would
94   * have to be taken in the event all blocks in the cluster shared with
95   * written or unwritten extents were deleted while the delayed and
96   * unwritten blocks remained.
97   *
98   * The set of pending cluster reservations is an auxiliary data structure
99   * used with the extents status tree to implement reserved cluster/block
100   * accounting for bigalloc file systems.  The set is kept in memory and
101   * records all pending cluster reservations.
102   *
103   * Its primary function is to avoid the need to read extents from the
104   * disk when invalidating pages as a result of a truncate, punch hole, or
105   * collapse range operation.  Page invalidation requires a decrease in the
106   * reserved cluster count if it results in the removal of all delayed
107   * and unwritten extents (blocks) from a cluster that is not shared with a
108   * written or unwritten extent, and no decrease otherwise.  Determining
109   * whether the cluster is shared can be done by searching for a pending
110   * reservation on it.
111   *
112   * Secondarily, it provides a potentially faster method for determining
113   * whether the reserved cluster count should be increased when a physical
114   * cluster is deallocated as a result of a truncate, punch hole, or
115   * collapse range operation.  The necessary information is also present
116   * in the extents status tree, but might be more rapidly accessed in
117   * the pending reservation set in many cases due to smaller size.
118   *
119   * The pending cluster reservation set is implemented as a red-black tree
120   * with the goal of minimizing per page search time overhead.
121   */
122  
123  struct pending_reservation {
124  	struct rb_node rb_node;
125  	ext4_lblk_t lclu;
126  };
127  
128  struct ext4_pending_tree {
129  	struct rb_root root;
130  };
131  
132  extern int __init ext4_init_es(void);
133  extern void ext4_exit_es(void);
134  extern void ext4_es_init_tree(struct ext4_es_tree *tree);
135  
136  extern void ext4_es_insert_extent(struct inode *inode, ext4_lblk_t lblk,
137  				  ext4_lblk_t len, ext4_fsblk_t pblk,
138  				  unsigned int status, int flags);
139  extern void ext4_es_cache_extent(struct inode *inode, ext4_lblk_t lblk,
140  				 ext4_lblk_t len, ext4_fsblk_t pblk,
141  				 unsigned int status);
142  extern void ext4_es_remove_extent(struct inode *inode, ext4_lblk_t lblk,
143  				  ext4_lblk_t len);
144  extern void ext4_es_find_extent_range(struct inode *inode,
145  				      int (*match_fn)(struct extent_status *es),
146  				      ext4_lblk_t lblk, ext4_lblk_t end,
147  				      struct extent_status *es);
148  extern int ext4_es_lookup_extent(struct inode *inode, ext4_lblk_t lblk,
149  				 ext4_lblk_t *next_lblk,
150  				 struct extent_status *es);
151  extern bool ext4_es_scan_range(struct inode *inode,
152  			       int (*matching_fn)(struct extent_status *es),
153  			       ext4_lblk_t lblk, ext4_lblk_t end);
154  extern bool ext4_es_scan_clu(struct inode *inode,
155  			     int (*matching_fn)(struct extent_status *es),
156  			     ext4_lblk_t lblk);
157  
ext4_es_status(struct extent_status * es)158  static inline unsigned int ext4_es_status(struct extent_status *es)
159  {
160  	return es->es_pblk >> ES_SHIFT;
161  }
162  
ext4_es_type(struct extent_status * es)163  static inline unsigned int ext4_es_type(struct extent_status *es)
164  {
165  	return (es->es_pblk >> ES_SHIFT) & ES_TYPE_MASK;
166  }
167  
ext4_es_is_written(struct extent_status * es)168  static inline int ext4_es_is_written(struct extent_status *es)
169  {
170  	return (ext4_es_type(es) & EXTENT_STATUS_WRITTEN) != 0;
171  }
172  
ext4_es_is_unwritten(struct extent_status * es)173  static inline int ext4_es_is_unwritten(struct extent_status *es)
174  {
175  	return (ext4_es_type(es) & EXTENT_STATUS_UNWRITTEN) != 0;
176  }
177  
ext4_es_is_delayed(struct extent_status * es)178  static inline int ext4_es_is_delayed(struct extent_status *es)
179  {
180  	return (ext4_es_type(es) & EXTENT_STATUS_DELAYED) != 0;
181  }
182  
ext4_es_is_hole(struct extent_status * es)183  static inline int ext4_es_is_hole(struct extent_status *es)
184  {
185  	return (ext4_es_type(es) & EXTENT_STATUS_HOLE) != 0;
186  }
187  
/* Return 1 if @es is either written or unwritten, 0 otherwise. */
static inline int ext4_es_is_mapped(struct extent_status *es)
{
	if (ext4_es_is_written(es))
		return 1;

	return ext4_es_is_unwritten(es);
}
192  
ext4_es_set_referenced(struct extent_status * es)193  static inline void ext4_es_set_referenced(struct extent_status *es)
194  {
195  	es->es_pblk |= ((ext4_fsblk_t)EXTENT_STATUS_REFERENCED) << ES_SHIFT;
196  }
197  
ext4_es_clear_referenced(struct extent_status * es)198  static inline void ext4_es_clear_referenced(struct extent_status *es)
199  {
200  	es->es_pblk &= ~(((ext4_fsblk_t)EXTENT_STATUS_REFERENCED) << ES_SHIFT);
201  }
202  
ext4_es_is_referenced(struct extent_status * es)203  static inline int ext4_es_is_referenced(struct extent_status *es)
204  {
205  	return (ext4_es_status(es) & EXTENT_STATUS_REFERENCED) != 0;
206  }
207  
ext4_es_pblock(struct extent_status * es)208  static inline ext4_fsblk_t ext4_es_pblock(struct extent_status *es)
209  {
210  	return es->es_pblk & ~ES_MASK;
211  }
212  
ext4_es_show_pblock(struct extent_status * es)213  static inline ext4_fsblk_t ext4_es_show_pblock(struct extent_status *es)
214  {
215  	ext4_fsblk_t pblock = ext4_es_pblock(es);
216  	return pblock == ~ES_MASK ? 0 : pblock;
217  }
218  
/*
 * Replace the physical block of @es with @pb while leaving the status
 * bits currently stored in es_pblk untouched.  Bits of @pb that fall
 * inside ES_MASK are discarded.
 */
static inline void ext4_es_store_pblock(struct extent_status *es,
					ext4_fsblk_t pb)
{
	ext4_fsblk_t status_bits = es->es_pblk & ES_MASK;

	es->es_pblk = status_bits | (pb & ~ES_MASK);
}
227  
/*
 * Overwrite es_pblk of @es with physical block @pb and status @status.
 *
 * @status is given unshifted (EXTENT_STATUS_* values) and is moved up
 * into the bits covered by ES_MASK; bits of @pb inside ES_MASK are
 * discarded.  A one-time warning is raised when the type part of
 * @status does not have exactly one bit set; the value is stored either
 * way.
 */
static inline void ext4_es_store_pblock_status(struct extent_status *es,
					       ext4_fsblk_t pb,
					       unsigned int status)
{
	ext4_fsblk_t status_bits = ((ext4_fsblk_t)status << ES_SHIFT) & ES_MASK;
	ext4_fsblk_t pblk_bits = pb & ~ES_MASK;

	WARN_ON_ONCE(!ES_TYPE_VALID(status & ES_TYPE_MASK));

	es->es_pblk = status_bits | pblk_bits;
}
237  
238  extern int ext4_es_register_shrinker(struct ext4_sb_info *sbi);
239  extern void ext4_es_unregister_shrinker(struct ext4_sb_info *sbi);
240  
241  extern int ext4_seq_es_shrinker_info_show(struct seq_file *seq, void *v);
242  
243  extern int __init ext4_init_pending(void);
244  extern void ext4_exit_pending(void);
245  extern void ext4_init_pending_tree(struct ext4_pending_tree *tree);
246  extern void ext4_remove_pending(struct inode *inode, ext4_lblk_t lblk);
247  extern bool ext4_is_pending(struct inode *inode, ext4_lblk_t lblk);
248  extern void ext4_es_insert_delayed_extent(struct inode *inode, ext4_lblk_t lblk,
249  					  ext4_lblk_t len, bool lclu_allocated,
250  					  bool end_allocated);
251  extern void ext4_clear_inode_es(struct inode *inode);
252  
253  #endif /* _EXT4_EXTENTS_STATUS_H */
254