Commit | Line | Data |
---|---|---|
d1310b2e CM |
1 | #ifndef __EXTENTIO__ |
2 | #define __EXTENTIO__ | |
3 | ||
4 | #include <linux/rbtree.h> | |
5 | ||
/*
 * Bits for the extent state. Every flag below is a distinct single bit,
 * so any combination of them can be OR-ed into one mask.
 */
#define EXTENT_DIRTY		(1 << 0)
#define EXTENT_WRITEBACK	(1 << 1)
#define EXTENT_UPTODATE		(1 << 2)
#define EXTENT_LOCKED		(1 << 3)
#define EXTENT_NEW		(1 << 4)
#define EXTENT_DELALLOC		(1 << 5)
#define EXTENT_DEFRAG		(1 << 6)
#define EXTENT_DEFRAG_DONE	(1 << 7)
#define EXTENT_BUFFER_FILLED	(1 << 8)
#define EXTENT_BOUNDARY		(1 << 9)
#define EXTENT_NODATASUM	(1 << 10)
#define EXTENT_DO_ACCOUNTING	(1 << 11)
#define EXTENT_FIRST_DELALLOC	(1 << 12)
#define EXTENT_NEED_WAIT	(1 << 13)
#define EXTENT_DAMAGED		(1 << 14)
#define EXTENT_NORESERVE	(1 << 15)

/* Composite masks assembled from the single-bit flags above. */
#define EXTENT_IOBITS		(EXTENT_LOCKED | EXTENT_WRITEBACK)
#define EXTENT_CTLBITS		(EXTENT_DO_ACCOUNTING | EXTENT_FIRST_DELALLOC)
d1310b2e | 25 | |
261507a0 LZ |
/*
 * Flags for bio submission. The low bits are individual flags; the
 * compression type for the bio lives in the high bits, starting at
 * bit EXTENT_BIO_FLAG_SHIFT.
 */
#define EXTENT_BIO_COMPRESSED		(1 << 0)
#define EXTENT_BIO_TREE_LOG		(1 << 1)
#define EXTENT_BIO_PARENT_LOCKED	(1 << 2)
#define EXTENT_BIO_FLAG_SHIFT		16
c8b97818 | 34 | |
b4ce94de CM |
/*
 * Bit numbers (not masks) intended for the test/set bit helpers.
 * NOTE(review): presumably applied to extent_buffer::bflags - confirm
 * against the users in the .c files.
 */
#define EXTENT_BUFFER_UPTODATE		0
#define EXTENT_BUFFER_BLOCKING		1
#define EXTENT_BUFFER_DIRTY		2
#define EXTENT_BUFFER_CORRUPT		3
#define EXTENT_BUFFER_READAHEAD		4	/* this got triggered by readahead */
#define EXTENT_BUFFER_TREE_REF		5
#define EXTENT_BUFFER_STALE		6
#define EXTENT_BUFFER_WRITEBACK		7
#define EXTENT_BUFFER_READ_ERR		8	/* read IO error */
#define EXTENT_BUFFER_DUMMY		9
#define EXTENT_BUFFER_IN_TREE		10
#define EXTENT_BUFFER_WRITE_ERR		11	/* write IO error */
b4ce94de | 48 | |
a791e35e | 49 | /* these are flags for extent_clear_unlock_delalloc */ |
c2790a2e JB |
/* Page operation flags; each one is a single bit so they can be OR-ed. */
#define PAGE_UNLOCK		0x01
#define PAGE_CLEAR_DIRTY	0x02
#define PAGE_SET_WRITEBACK	0x04
#define PAGE_END_WRITEBACK	0x08
#define PAGE_SET_PRIVATE2	0x10
a791e35e | 55 | |
d1310b2e CM |
/*
 * Values stored in page->private. Every page that is controlled by the
 * extent map has page->private set to one.
 */
#define EXTENT_PAGE_PRIVATE		1
#define EXTENT_PAGE_PRIVATE_FIRST_PAGE	3
62 | ||
70dec807 | 63 | struct extent_state; |
ea466794 | 64 | struct btrfs_root; |
facc8a22 | 65 | struct btrfs_io_bio; |
70dec807 | 66 | |
44b8bd7e | 67 | typedef int (extent_submit_bio_hook_t)(struct inode *inode, int rw, |
c8b97818 | 68 | struct bio *bio, int mirror_num, |
eaf25d93 | 69 | unsigned long bio_flags, u64 bio_offset); |
d1310b2e | 70 | struct extent_io_ops { |
c8b97818 | 71 | int (*fill_delalloc)(struct inode *inode, struct page *locked_page, |
771ed689 CM |
72 | u64 start, u64 end, int *page_started, |
73 | unsigned long *nr_written); | |
247e743c | 74 | int (*writepage_start_hook)(struct page *page, u64 start, u64 end); |
d1310b2e | 75 | int (*writepage_io_hook)(struct page *page, u64 start, u64 end); |
44b8bd7e | 76 | extent_submit_bio_hook_t *submit_bio_hook; |
64a16701 | 77 | int (*merge_bio_hook)(int rw, struct page *page, unsigned long offset, |
c8b97818 CM |
78 | size_t size, struct bio *bio, |
79 | unsigned long bio_flags); | |
ea466794 | 80 | int (*readpage_io_failed_hook)(struct page *page, int failed_mirror); |
facc8a22 MX |
81 | int (*readpage_end_io_hook)(struct btrfs_io_bio *io_bio, u64 phy_offset, |
82 | struct page *page, u64 start, u64 end, | |
83 | int mirror); | |
1259ab75 | 84 | int (*writepage_end_io_hook)(struct page *page, u64 start, u64 end, |
e6dcd2dc | 85 | struct extent_state *state, int uptodate); |
1bf85046 | 86 | void (*set_bit_hook)(struct inode *inode, struct extent_state *state, |
41074888 | 87 | unsigned long *bits); |
1bf85046 | 88 | void (*clear_bit_hook)(struct inode *inode, struct extent_state *state, |
41074888 | 89 | unsigned long *bits); |
1bf85046 JM |
90 | void (*merge_extent_hook)(struct inode *inode, |
91 | struct extent_state *new, | |
92 | struct extent_state *other); | |
93 | void (*split_extent_hook)(struct inode *inode, | |
94 | struct extent_state *orig, u64 split); | |
d1310b2e CM |
95 | }; |
96 | ||
97 | struct extent_io_tree { | |
98 | struct rb_root state; | |
99 | struct address_space *mapping; | |
100 | u64 dirty_bytes; | |
0b32f4bb | 101 | int track_uptodate; |
70dec807 | 102 | spinlock_t lock; |
d1310b2e | 103 | struct extent_io_ops *ops; |
d1310b2e CM |
104 | }; |
105 | ||
106 | struct extent_state { | |
107 | u64 start; | |
108 | u64 end; /* inclusive */ | |
d1310b2e | 109 | struct rb_node rb_node; |
9ed74f2d JB |
110 | |
111 | /* ADD NEW ELEMENTS AFTER THIS */ | |
d1310b2e CM |
112 | wait_queue_head_t wq; |
113 | atomic_t refs; | |
114 | unsigned long state; | |
115 | ||
116 | /* for use by the FS */ | |
117 | u64 private; | |
118 | ||
6d49ba1b | 119 | #ifdef CONFIG_BTRFS_DEBUG |
2d2ae547 | 120 | struct list_head leak_list; |
6d49ba1b | 121 | #endif |
d1310b2e CM |
122 | }; |
123 | ||
727011e0 CM |
/* Number of page pointers stored inline in struct extent_buffer (pages[]). */
#define INLINE_EXTENT_BUFFER_PAGES 16
/* Byte size covered by that many pages. */
#define MAX_INLINE_EXTENT_BUFFER_SIZE \
	(INLINE_EXTENT_BUFFER_PAGES * PAGE_CACHE_SIZE)
d1310b2e CM |
126 | struct extent_buffer { |
127 | u64 start; | |
128 | unsigned long len; | |
b4ce94de | 129 | unsigned long bflags; |
f28491e0 | 130 | struct btrfs_fs_info *fs_info; |
3083ee2e | 131 | spinlock_t refs_lock; |
727011e0 | 132 | atomic_t refs; |
0b32f4bb | 133 | atomic_t io_pages; |
5cf1ab56 | 134 | int read_mirror; |
19fe0a8b | 135 | struct rcu_head rcu_head; |
5b25f70f | 136 | pid_t lock_owner; |
b4ce94de | 137 | |
bd681513 CM |
138 | /* count of read lock holders on the extent buffer */ |
139 | atomic_t write_locks; | |
140 | atomic_t read_locks; | |
141 | atomic_t blocking_writers; | |
142 | atomic_t blocking_readers; | |
143 | atomic_t spinning_readers; | |
144 | atomic_t spinning_writers; | |
656f30db FM |
145 | short lock_nested; |
146 | /* >= 0 if eb belongs to a log tree, -1 otherwise */ | |
147 | short log_index; | |
bd681513 CM |
148 | |
149 | /* protects write locks */ | |
150 | rwlock_t lock; | |
151 | ||
152 | /* readers use lock_wq while they wait for the write | |
153 | * lock holders to unlock | |
154 | */ | |
155 | wait_queue_head_t write_lock_wq; | |
b4ce94de | 156 | |
bd681513 CM |
157 | /* writers use read_lock_wq while they wait for readers |
158 | * to unlock | |
b4ce94de | 159 | */ |
bd681513 | 160 | wait_queue_head_t read_lock_wq; |
b8dae313 | 161 | struct page *pages[INLINE_EXTENT_BUFFER_PAGES]; |
6d49ba1b ES |
162 | #ifdef CONFIG_BTRFS_DEBUG |
163 | struct list_head leak_list; | |
164 | #endif | |
d1310b2e CM |
165 | }; |
166 | ||
261507a0 LZ |
167 | static inline void extent_set_compress_type(unsigned long *bio_flags, |
168 | int compress_type) | |
169 | { | |
170 | *bio_flags |= compress_type << EXTENT_BIO_FLAG_SHIFT; | |
171 | } | |
172 | ||
173 | static inline int extent_compress_type(unsigned long bio_flags) | |
174 | { | |
175 | return bio_flags >> EXTENT_BIO_FLAG_SHIFT; | |
176 | } | |
177 | ||
d1310b2e CM |
178 | struct extent_map_tree; |
179 | ||
180 | typedef struct extent_map *(get_extent_t)(struct inode *inode, | |
181 | struct page *page, | |
306e16ce | 182 | size_t pg_offset, |
d1310b2e CM |
183 | u64 start, u64 len, |
184 | int create); | |
185 | ||
186 | void extent_io_tree_init(struct extent_io_tree *tree, | |
f993c883 | 187 | struct address_space *mapping); |
d1310b2e | 188 | int try_release_extent_mapping(struct extent_map_tree *map, |
70dec807 CM |
189 | struct extent_io_tree *tree, struct page *page, |
190 | gfp_t mask); | |
f7a52a40 | 191 | int try_release_extent_buffer(struct page *page); |
d0082371 | 192 | int lock_extent(struct extent_io_tree *tree, u64 start, u64 end); |
1edbb734 | 193 | int lock_extent_bits(struct extent_io_tree *tree, u64 start, u64 end, |
41074888 | 194 | unsigned long bits, struct extent_state **cached); |
d0082371 | 195 | int unlock_extent(struct extent_io_tree *tree, u64 start, u64 end); |
2ac55d41 JB |
196 | int unlock_extent_cached(struct extent_io_tree *tree, u64 start, u64 end, |
197 | struct extent_state **cached, gfp_t mask); | |
d0082371 | 198 | int try_lock_extent(struct extent_io_tree *tree, u64 start, u64 end); |
d1310b2e | 199 | int extent_read_full_page(struct extent_io_tree *tree, struct page *page, |
8ddc7d9c | 200 | get_extent_t *get_extent, int mirror_num); |
4b384318 MF |
201 | int extent_read_full_page_nolock(struct extent_io_tree *tree, struct page *page, |
202 | get_extent_t *get_extent, int mirror_num); | |
d1310b2e CM |
203 | int __init extent_io_init(void); |
204 | void extent_io_exit(void); | |
205 | ||
206 | u64 count_range_bits(struct extent_io_tree *tree, | |
207 | u64 *start, u64 search_end, | |
ec29ed5b | 208 | u64 max_bytes, unsigned long bits, int contig); |
d1310b2e | 209 | |
4845e44f | 210 | void free_extent_state(struct extent_state *state); |
d1310b2e | 211 | int test_range_bit(struct extent_io_tree *tree, u64 start, u64 end, |
41074888 DS |
212 | unsigned long bits, int filled, |
213 | struct extent_state *cached_state); | |
d1310b2e | 214 | int clear_extent_bits(struct extent_io_tree *tree, u64 start, u64 end, |
41074888 | 215 | unsigned long bits, gfp_t mask); |
e6dcd2dc | 216 | int clear_extent_bit(struct extent_io_tree *tree, u64 start, u64 end, |
41074888 DS |
217 | unsigned long bits, int wake, int delete, |
218 | struct extent_state **cached, gfp_t mask); | |
d1310b2e | 219 | int set_extent_bits(struct extent_io_tree *tree, u64 start, u64 end, |
41074888 | 220 | unsigned long bits, gfp_t mask); |
4845e44f | 221 | int set_extent_bit(struct extent_io_tree *tree, u64 start, u64 end, |
41074888 | 222 | unsigned long bits, u64 *failed_start, |
4845e44f | 223 | struct extent_state **cached_state, gfp_t mask); |
d1310b2e | 224 | int set_extent_uptodate(struct extent_io_tree *tree, u64 start, u64 end, |
507903b8 | 225 | struct extent_state **cached_state, gfp_t mask); |
5fd02043 JB |
226 | int clear_extent_uptodate(struct extent_io_tree *tree, u64 start, u64 end, |
227 | struct extent_state **cached_state, gfp_t mask); | |
d1310b2e CM |
228 | int set_extent_new(struct extent_io_tree *tree, u64 start, u64 end, |
229 | gfp_t mask); | |
230 | int set_extent_dirty(struct extent_io_tree *tree, u64 start, u64 end, | |
231 | gfp_t mask); | |
232 | int clear_extent_dirty(struct extent_io_tree *tree, u64 start, u64 end, | |
233 | gfp_t mask); | |
462d6fac | 234 | int convert_extent_bit(struct extent_io_tree *tree, u64 start, u64 end, |
41074888 | 235 | unsigned long bits, unsigned long clear_bits, |
e6138876 | 236 | struct extent_state **cached_state, gfp_t mask); |
d1310b2e | 237 | int set_extent_delalloc(struct extent_io_tree *tree, u64 start, u64 end, |
2ac55d41 | 238 | struct extent_state **cached_state, gfp_t mask); |
9e8a4a8b LB |
239 | int set_extent_defrag(struct extent_io_tree *tree, u64 start, u64 end, |
240 | struct extent_state **cached_state, gfp_t mask); | |
d1310b2e | 241 | int find_first_extent_bit(struct extent_io_tree *tree, u64 start, |
41074888 | 242 | u64 *start_ret, u64 *end_ret, unsigned long bits, |
e6138876 | 243 | struct extent_state **cached_state); |
d1310b2e CM |
244 | int extent_invalidatepage(struct extent_io_tree *tree, |
245 | struct page *page, unsigned long offset); | |
246 | int extent_write_full_page(struct extent_io_tree *tree, struct page *page, | |
247 | get_extent_t *get_extent, | |
248 | struct writeback_control *wbc); | |
771ed689 CM |
249 | int extent_write_locked_range(struct extent_io_tree *tree, struct inode *inode, |
250 | u64 start, u64 end, get_extent_t *get_extent, | |
251 | int mode); | |
d1310b2e CM |
252 | int extent_writepages(struct extent_io_tree *tree, |
253 | struct address_space *mapping, | |
254 | get_extent_t *get_extent, | |
255 | struct writeback_control *wbc); | |
0b32f4bb JB |
256 | int btree_write_cache_pages(struct address_space *mapping, |
257 | struct writeback_control *wbc); | |
d1310b2e CM |
258 | int extent_readpages(struct extent_io_tree *tree, |
259 | struct address_space *mapping, | |
260 | struct list_head *pages, unsigned nr_pages, | |
261 | get_extent_t get_extent); | |
1506fcc8 YS |
262 | int extent_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo, |
263 | __u64 start, __u64 len, get_extent_t *get_extent); | |
d1310b2e CM |
264 | int get_state_private(struct extent_io_tree *tree, u64 start, u64 *private); |
265 | void set_page_extent_mapped(struct page *page); | |
266 | ||
f28491e0 | 267 | struct extent_buffer *alloc_extent_buffer(struct btrfs_fs_info *fs_info, |
727011e0 | 268 | u64 start, unsigned long len); |
815a51c7 JS |
269 | struct extent_buffer *alloc_dummy_extent_buffer(u64 start, unsigned long len); |
270 | struct extent_buffer *btrfs_clone_extent_buffer(struct extent_buffer *src); | |
f28491e0 | 271 | struct extent_buffer *find_extent_buffer(struct btrfs_fs_info *fs_info, |
452c75c3 | 272 | u64 start); |
d1310b2e | 273 | void free_extent_buffer(struct extent_buffer *eb); |
3083ee2e | 274 | void free_extent_buffer_stale(struct extent_buffer *eb); |
bb82ab88 AJ |
/*
 * Wait modes.
 * NOTE(review): presumably the values of the 'wait' argument of
 * read_extent_buffer_pages() declared right below - confirm.
 */
#define WAIT_NONE	0
#define WAIT_COMPLETE	1
#define WAIT_PAGE_LOCK	2
d1310b2e | 278 | int read_extent_buffer_pages(struct extent_io_tree *tree, |
a86c12c7 | 279 | struct extent_buffer *eb, u64 start, int wait, |
f188591e | 280 | get_extent_t *get_extent, int mirror_num); |
fd8b2b61 | 281 | void wait_on_extent_buffer_writeback(struct extent_buffer *eb); |
479ed9ab RD |
282 | |
283 | static inline unsigned long num_extent_pages(u64 start, u64 len) | |
284 | { | |
285 | return ((start + len + PAGE_CACHE_SIZE - 1) >> PAGE_CACHE_SHIFT) - | |
286 | (start >> PAGE_CACHE_SHIFT); | |
287 | } | |
288 | ||
289 | static inline struct page *extent_buffer_page(struct extent_buffer *eb, | |
290 | unsigned long i) | |
291 | { | |
292 | return eb->pages[i]; | |
293 | } | |
d1310b2e CM |
294 | |
295 | static inline void extent_buffer_get(struct extent_buffer *eb) | |
296 | { | |
297 | atomic_inc(&eb->refs); | |
298 | } | |
299 | ||
300 | int memcmp_extent_buffer(struct extent_buffer *eb, const void *ptrv, | |
301 | unsigned long start, | |
302 | unsigned long len); | |
303 | void read_extent_buffer(struct extent_buffer *eb, void *dst, | |
304 | unsigned long start, | |
305 | unsigned long len); | |
550ac1d8 GH |
306 | int read_extent_buffer_to_user(struct extent_buffer *eb, void __user *dst, |
307 | unsigned long start, | |
308 | unsigned long len); | |
d1310b2e CM |
309 | void write_extent_buffer(struct extent_buffer *eb, const void *src, |
310 | unsigned long start, unsigned long len); | |
311 | void copy_extent_buffer(struct extent_buffer *dst, struct extent_buffer *src, | |
312 | unsigned long dst_offset, unsigned long src_offset, | |
313 | unsigned long len); | |
314 | void memcpy_extent_buffer(struct extent_buffer *dst, unsigned long dst_offset, | |
315 | unsigned long src_offset, unsigned long len); | |
316 | void memmove_extent_buffer(struct extent_buffer *dst, unsigned long dst_offset, | |
317 | unsigned long src_offset, unsigned long len); | |
318 | void memset_extent_buffer(struct extent_buffer *eb, char c, | |
319 | unsigned long start, unsigned long len); | |
1d4284bd | 320 | void clear_extent_buffer_dirty(struct extent_buffer *eb); |
0b32f4bb JB |
321 | int set_extent_buffer_dirty(struct extent_buffer *eb); |
322 | int set_extent_buffer_uptodate(struct extent_buffer *eb); | |
323 | int clear_extent_buffer_uptodate(struct extent_buffer *eb); | |
324 | int extent_buffer_uptodate(struct extent_buffer *eb); | |
a26e8c9f | 325 | int extent_buffer_under_io(struct extent_buffer *eb); |
d1310b2e | 326 | int map_private_extent_buffer(struct extent_buffer *eb, unsigned long offset, |
a6591715 | 327 | unsigned long min_len, char **map, |
d1310b2e | 328 | unsigned long *map_start, |
a6591715 | 329 | unsigned long *map_len); |
4adaa611 CM |
330 | int extent_range_clear_dirty_for_io(struct inode *inode, u64 start, u64 end); |
331 | int extent_range_redirty_for_io(struct inode *inode, u64 start, u64 end); | |
c2790a2e JB |
332 | int extent_clear_unlock_delalloc(struct inode *inode, u64 start, u64 end, |
333 | struct page *locked_page, | |
334 | unsigned long bits_to_clear, | |
335 | unsigned long page_ops); | |
88f794ed MX |
336 | struct bio * |
337 | btrfs_bio_alloc(struct block_device *bdev, u64 first_sector, int nr_vecs, | |
338 | gfp_t gfp_flags); | |
9be3395b CM |
339 | struct bio *btrfs_io_bio_alloc(gfp_t gfp_mask, unsigned int nr_iovecs); |
340 | struct bio *btrfs_bio_clone(struct bio *bio, gfp_t gfp_mask); | |
4a54c8c1 | 341 | |
3ec706c8 | 342 | struct btrfs_fs_info; |
4a54c8c1 | 343 | |
1203b681 MX |
344 | int repair_io_failure(struct inode *inode, u64 start, u64 length, u64 logical, |
345 | struct page *page, unsigned int pg_offset, | |
346 | int mirror_num); | |
8b110e39 MX |
347 | int clean_io_failure(struct inode *inode, u64 start, struct page *page, |
348 | unsigned int pg_offset); | |
87826df0 | 349 | int end_extent_writepage(struct page *page, int err, u64 start, u64 end); |
ea466794 JB |
350 | int repair_eb_io_failure(struct btrfs_root *root, struct extent_buffer *eb, |
351 | int mirror_num); | |
2fe6303e MX |
352 | |
353 | /* | |
354 | * When IO fails, either with EIO or csum verification fails, we | |
355 | * try other mirrors that might have a good copy of the data. This | |
356 | * io_failure_record is used to record state as we go through all the | |
357 | * mirrors. If another mirror has good data, the page is set up to date | |
358 | * and things continue. If a good mirror can't be found, the original | |
359 | * bio end_io callback is called to indicate things have failed. | |
360 | */ | |
361 | struct io_failure_record { | |
362 | struct page *page; | |
363 | u64 start; | |
364 | u64 len; | |
365 | u64 logical; | |
366 | unsigned long bio_flags; | |
367 | int this_mirror; | |
368 | int failed_mirror; | |
369 | int in_validation; | |
370 | }; | |
371 | ||
f612496b | 372 | void btrfs_free_io_failure_record(struct inode *inode, u64 start, u64 end); |
2fe6303e MX |
373 | int btrfs_get_io_failure_record(struct inode *inode, u64 start, u64 end, |
374 | struct io_failure_record **failrec_ret); | |
375 | int btrfs_check_repairable(struct inode *inode, struct bio *failed_bio, | |
376 | struct io_failure_record *failrec, int fail_mirror); | |
377 | struct bio *btrfs_create_repair_bio(struct inode *inode, struct bio *failed_bio, | |
378 | struct io_failure_record *failrec, | |
379 | struct page *page, int pg_offset, int icsum, | |
8b110e39 MX |
380 | bio_end_io_t *endio_func, void *data); |
381 | int free_io_failure(struct inode *inode, struct io_failure_record *rec); | |
294e30fe JB |
382 | #ifdef CONFIG_BTRFS_FS_RUN_SANITY_TESTS |
383 | noinline u64 find_lock_delalloc_range(struct inode *inode, | |
384 | struct extent_io_tree *tree, | |
385 | struct page *locked_page, u64 *start, | |
386 | u64 *end, u64 max_bytes); | |
faa2dbf0 JB |
387 | struct extent_buffer *alloc_test_extent_buffer(struct btrfs_fs_info *fs_info, |
388 | u64 start, unsigned long len); | |
294e30fe | 389 | #endif |
d1310b2e | 390 | #endif |