/* extent_io.h */
#ifndef __EXTENTIO__
#define __EXTENTIO__

#include <linux/rbtree.h>

/*
 * Bits for the extent state.
 *
 * Every flag below is a distinct single-bit mask.  The two composite
 * masks at the end (EXTENT_IOBITS, EXTENT_CTLBITS) are OR-combinations
 * of individual flags.
 *
 * NOTE(review): presumably these are the values kept in
 * struct extent_state.state and passed as the "bits" arguments of the
 * set/clear/test helpers declared in this header -- confirm.
 */
#define EXTENT_DIRTY 1
#define EXTENT_WRITEBACK (1 << 1)
#define EXTENT_UPTODATE (1 << 2)
#define EXTENT_LOCKED (1 << 3)
#define EXTENT_NEW (1 << 4)
#define EXTENT_DELALLOC (1 << 5)
#define EXTENT_DEFRAG (1 << 6)
#define EXTENT_DEFRAG_DONE (1 << 7)
#define EXTENT_BUFFER_FILLED (1 << 8)
#define EXTENT_BOUNDARY (1 << 9)
#define EXTENT_NODATASUM (1 << 10)
#define EXTENT_DO_ACCOUNTING (1 << 11)
#define EXTENT_FIRST_DELALLOC (1 << 12)
#define EXTENT_NEED_WAIT (1 << 13)
#define EXTENT_DAMAGED (1 << 14)
/* composite: the lock and writeback bits together */
#define EXTENT_IOBITS (EXTENT_LOCKED | EXTENT_WRITEBACK)
/* composite: the accounting and first-delalloc bits together */
#define EXTENT_CTLBITS (EXTENT_DO_ACCOUNTING | EXTENT_FIRST_DELALLOC)

/*
 * Flags for bio submission.  The high bits indicate the compression
 * type for this bio.
 *
 * EXTENT_BIO_FLAG_SHIFT is the bit position used by
 * extent_set_compress_type() and extent_compress_type() to store and
 * read back the compression type inside a bio_flags word.
 */
#define EXTENT_BIO_COMPRESSED 1
#define EXTENT_BIO_FLAG_SHIFT 16

/*
 * These are bit numbers for test/set bit, i.e. bit indices rather than
 * masks.
 *
 * NOTE(review): presumably applied to struct extent_buffer.bflags --
 * confirm against the users.
 */
#define EXTENT_BUFFER_UPTODATE 0
#define EXTENT_BUFFER_BLOCKING 1
#define EXTENT_BUFFER_DIRTY 2
#define EXTENT_BUFFER_CORRUPT 3
#define EXTENT_BUFFER_READAHEAD 4	/* this got triggered by readahead */
#define EXTENT_BUFFER_TREE_REF 5
#define EXTENT_BUFFER_STALE 6
#define EXTENT_BUFFER_WRITEBACK 7
#define EXTENT_BUFFER_IOERR 8
#define EXTENT_BUFFER_DUMMY 9

/*
 * These are flags for extent_clear_unlock_delalloc.  Each one is a
 * distinct single-bit mask.
 *
 * NOTE(review): presumably OR-ed together into that function's "op"
 * argument -- confirm.
 */
#define EXTENT_CLEAR_UNLOCK_PAGE 0x1
#define EXTENT_CLEAR_UNLOCK	 0x2
#define EXTENT_CLEAR_DELALLOC	 0x4
#define EXTENT_CLEAR_DIRTY	 0x8
#define EXTENT_SET_WRITEBACK	 0x10
#define EXTENT_END_WRITEBACK	 0x20
#define EXTENT_SET_PRIVATE2	 0x40
#define EXTENT_CLEAR_ACCOUNTING  0x80

/*
 * page->private values.  Every page that is controlled by the extent
 * map has page->private set to one.
 *
 * NOTE(review): the sentence above only mentions the value one, yet a
 * second value (3) is defined for EXTENT_PAGE_PRIVATE_FIRST_PAGE; when
 * that one is used is not visible in this header -- confirm.
 */
#define EXTENT_PAGE_PRIVATE 1
#define EXTENT_PAGE_PRIVATE_FIRST_PAGE 3

/*
 * Forward declarations so the prototypes and hook types below can take
 * pointers to these structures.
 */
struct extent_state;
struct btrfs_root;

64
typedef	int (extent_submit_bio_hook_t)(struct inode *inode, int rw,
C
Chris Mason 已提交
65
				       struct bio *bio, int mirror_num,
66
				       unsigned long bio_flags, u64 bio_offset);
67
struct extent_io_ops {
C
Chris Mason 已提交
68
	int (*fill_delalloc)(struct inode *inode, struct page *locked_page,
69 70
			     u64 start, u64 end, int *page_started,
			     unsigned long *nr_written);
71
	int (*writepage_start_hook)(struct page *page, u64 start, u64 end);
72
	int (*writepage_io_hook)(struct page *page, u64 start, u64 end);
73
	extent_submit_bio_hook_t *submit_bio_hook;
74
	int (*merge_bio_hook)(struct page *page, unsigned long offset,
C
Chris Mason 已提交
75 76
			      size_t size, struct bio *bio,
			      unsigned long bio_flags);
77
	int (*readpage_io_hook)(struct page *page, u64 start, u64 end);
78
	int (*readpage_io_failed_hook)(struct page *page, int failed_mirror);
79
	int (*readpage_end_io_hook)(struct page *page, u64 start, u64 end,
80
				    struct extent_state *state, int mirror);
81
	int (*writepage_end_io_hook)(struct page *page, u64 start, u64 end,
82
				      struct extent_state *state, int uptodate);
83 84 85 86 87 88 89 90 91
	void (*set_bit_hook)(struct inode *inode, struct extent_state *state,
			     int *bits);
	void (*clear_bit_hook)(struct inode *inode, struct extent_state *state,
			       int *bits);
	void (*merge_extent_hook)(struct inode *inode,
				  struct extent_state *new,
				  struct extent_state *other);
	void (*split_extent_hook)(struct inode *inode,
				  struct extent_state *orig, u64 split);
92 93
	int (*write_cache_pages_lock_hook)(struct page *page, void *data,
					   void (*flush_fn)(void *));
94 95 96 97
};

struct extent_io_tree {
	struct rb_root state;
98
	struct radix_tree_root buffer;
99 100
	struct address_space *mapping;
	u64 dirty_bytes;
101
	int track_uptodate;
102
	spinlock_t lock;
103
	spinlock_t buffer_lock;
104 105 106 107 108 109 110
	struct extent_io_ops *ops;
};

struct extent_state {
	u64 start;
	u64 end; /* inclusive */
	struct rb_node rb_node;
J
Josef Bacik 已提交
111 112

	/* ADD NEW ELEMENTS AFTER THIS */
113
	struct extent_io_tree *tree;
114 115 116 117 118 119 120
	wait_queue_head_t wq;
	atomic_t refs;
	unsigned long state;

	/* for use by the FS */
	u64 private;

121
	struct list_head leak_list;
122 123
};

/*
 * INLINE_EXTENT_BUFFER_PAGES sizes the inline_pages[] array embedded in
 * struct extent_buffer; MAX_INLINE_EXTENT_BUFFER_SIZE is the same count
 * multiplied by PAGE_CACHE_SIZE.
 */
#define INLINE_EXTENT_BUFFER_PAGES 16
#define MAX_INLINE_EXTENT_BUFFER_SIZE (INLINE_EXTENT_BUFFER_PAGES * PAGE_CACHE_SIZE)
126 127 128 129 130
struct extent_buffer {
	u64 start;
	unsigned long len;
	unsigned long map_start;
	unsigned long map_len;
131
	unsigned long bflags;
J
Josef Bacik 已提交
132
	struct extent_io_tree *tree;
133
	spinlock_t refs_lock;
134
	atomic_t refs;
135
	atomic_t io_pages;
136
	int read_mirror;
137
	struct list_head leak_list;
138
	struct rcu_head rcu_head;
139
	pid_t lock_owner;
140

141 142 143 144 145 146 147
	/* count of read lock holders on the extent buffer */
	atomic_t write_locks;
	atomic_t read_locks;
	atomic_t blocking_writers;
	atomic_t blocking_readers;
	atomic_t spinning_readers;
	atomic_t spinning_writers;
148
	int lock_nested;
149 150 151 152 153 154 155 156

	/* protects write locks */
	rwlock_t lock;

	/* readers use lock_wq while they wait for the write
	 * lock holders to unlock
	 */
	wait_queue_head_t write_lock_wq;
157

158 159
	/* writers use read_lock_wq while they wait for readers
	 * to unlock
160
	 */
161
	wait_queue_head_t read_lock_wq;
162 163 164
	wait_queue_head_t lock_wq;
	struct page *inline_pages[INLINE_EXTENT_BUFFER_PAGES];
	struct page **pages;
165 166
};

167 168 169 170 171 172 173 174 175 176 177
static inline void extent_set_compress_type(unsigned long *bio_flags,
					    int compress_type)
{
	*bio_flags |= compress_type << EXTENT_BIO_FLAG_SHIFT;
}

/*
 * Read back the compression type from a bio flags word: everything at
 * bit EXTENT_BIO_FLAG_SHIFT and above, shifted down and returned as int.
 */
static inline int extent_compress_type(unsigned long bio_flags)
{
	unsigned long type_bits = bio_flags >> EXTENT_BIO_FLAG_SHIFT;

	return type_bits;
}

178 179 180 181
struct extent_map_tree;

typedef struct extent_map *(get_extent_t)(struct inode *inode,
					  struct page *page,
182
					  size_t pg_offset,
183 184 185 186
					  u64 start, u64 len,
					  int create);

void extent_io_tree_init(struct extent_io_tree *tree,
187
			 struct address_space *mapping);
188
int try_release_extent_mapping(struct extent_map_tree *map,
189 190
			       struct extent_io_tree *tree, struct page *page,
			       gfp_t mask);
191
int try_release_extent_buffer(struct page *page, gfp_t mask);
192 193 194
int try_release_extent_state(struct extent_map_tree *map,
			     struct extent_io_tree *tree, struct page *page,
			     gfp_t mask);
195
int lock_extent(struct extent_io_tree *tree, u64 start, u64 end);
196
int lock_extent_bits(struct extent_io_tree *tree, u64 start, u64 end,
197 198
		     int bits, struct extent_state **cached);
int unlock_extent(struct extent_io_tree *tree, u64 start, u64 end);
199 200
int unlock_extent_cached(struct extent_io_tree *tree, u64 start, u64 end,
			 struct extent_state **cached, gfp_t mask);
201
int try_lock_extent(struct extent_io_tree *tree, u64 start, u64 end);
202
int extent_read_full_page(struct extent_io_tree *tree, struct page *page,
203
			  get_extent_t *get_extent, int mirror_num);
204 205 206 207 208
int __init extent_io_init(void);
void extent_io_exit(void);

/*
 * NOTE(review): judging by the name and signature this counts bytes in
 * the tree that carry the given bits, starting at *start and bounded by
 * search_end and max_bytes -- confirm against the implementation.
 */
u64 count_range_bits(struct extent_io_tree *tree,
		     u64 *start, u64 search_end,
		     u64 max_bytes, unsigned long bits, int contig);

/*
 * Helpers that test, set, clear, convert and search state bits on ranges
 * of an extent_io_tree.
 *
 * NOTE(review): the "bits" arguments presumably take the EXTENT_* state
 * masks defined at the top of this header; return-value conventions are
 * not visible here.
 */
void free_extent_state(struct extent_state *state);
int test_range_bit(struct extent_io_tree *tree, u64 start, u64 end,
		   int bits, int filled, struct extent_state *cached_state);
int clear_extent_bits(struct extent_io_tree *tree, u64 start, u64 end,
		      int bits, gfp_t mask);
int clear_extent_bit(struct extent_io_tree *tree, u64 start, u64 end,
		     int bits, int wake, int delete, struct extent_state **cached,
		     gfp_t mask);
int set_extent_bits(struct extent_io_tree *tree, u64 start, u64 end,
		    int bits, gfp_t mask);
int set_extent_bit(struct extent_io_tree *tree, u64 start, u64 end,
		   int bits, u64 *failed_start,
		   struct extent_state **cached_state, gfp_t mask);
int set_extent_uptodate(struct extent_io_tree *tree, u64 start, u64 end,
			struct extent_state **cached_state, gfp_t mask);
int clear_extent_uptodate(struct extent_io_tree *tree, u64 start, u64 end,
			  struct extent_state **cached_state, gfp_t mask);
int set_extent_new(struct extent_io_tree *tree, u64 start, u64 end,
		   gfp_t mask);
int set_extent_dirty(struct extent_io_tree *tree, u64 start, u64 end,
		     gfp_t mask);
int clear_extent_dirty(struct extent_io_tree *tree, u64 start, u64 end,
		       gfp_t mask);
int convert_extent_bit(struct extent_io_tree *tree, u64 start, u64 end,
		       int bits, int clear_bits, gfp_t mask);
int set_extent_delalloc(struct extent_io_tree *tree, u64 start, u64 end,
			struct extent_state **cached_state, gfp_t mask);
int find_first_extent_bit(struct extent_io_tree *tree, u64 start,
			  u64 *start_ret, u64 *end_ret, int bits);
struct extent_state *find_first_extent_bit_state(struct extent_io_tree *tree,
						 u64 start, int bits);
242 243 244 245 246
int extent_invalidatepage(struct extent_io_tree *tree,
			  struct page *page, unsigned long offset);
int extent_write_full_page(struct extent_io_tree *tree, struct page *page,
			  get_extent_t *get_extent,
			  struct writeback_control *wbc);
247 248 249
int extent_write_locked_range(struct extent_io_tree *tree, struct inode *inode,
			      u64 start, u64 end, get_extent_t *get_extent,
			      int mode);
250 251 252 253
int extent_writepages(struct extent_io_tree *tree,
		      struct address_space *mapping,
		      get_extent_t *get_extent,
		      struct writeback_control *wbc);
254 255
int btree_write_cache_pages(struct address_space *mapping,
			    struct writeback_control *wbc);
256 257 258 259
int extent_readpages(struct extent_io_tree *tree,
		     struct address_space *mapping,
		     struct list_head *pages, unsigned nr_pages,
		     get_extent_t get_extent);
Y
Yehuda Sadeh 已提交
260 261
int extent_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
		__u64 start, __u64 len, get_extent_t *get_extent);
262 263 264 265 266
int set_state_private(struct extent_io_tree *tree, u64 start, u64 private);
int get_state_private(struct extent_io_tree *tree, u64 start, u64 *private);
void set_page_extent_mapped(struct page *page);

struct extent_buffer *alloc_extent_buffer(struct extent_io_tree *tree,
267
					  u64 start, unsigned long len);
268 269
struct extent_buffer *alloc_dummy_extent_buffer(u64 start, unsigned long len);
struct extent_buffer *btrfs_clone_extent_buffer(struct extent_buffer *src);
270
struct extent_buffer *find_extent_buffer(struct extent_io_tree *tree,
271
					 u64 start, unsigned long len);
272
void free_extent_buffer(struct extent_buffer *eb);
273
void free_extent_buffer_stale(struct extent_buffer *eb);
274 275 276
#define WAIT_NONE	0
#define WAIT_COMPLETE	1
#define WAIT_PAGE_LOCK	2
277
int read_extent_buffer_pages(struct extent_io_tree *tree,
278
			     struct extent_buffer *eb, u64 start, int wait,
279
			     get_extent_t *get_extent, int mirror_num);
280 281
unsigned long num_extent_pages(u64 start, u64 len);
struct page *extent_buffer_page(struct extent_buffer *eb, unsigned long i);
282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304

static inline void extent_buffer_get(struct extent_buffer *eb)
{
	atomic_inc(&eb->refs);
}

int memcmp_extent_buffer(struct extent_buffer *eb, const void *ptrv,
			  unsigned long start,
			  unsigned long len);
void read_extent_buffer(struct extent_buffer *eb, void *dst,
			unsigned long start,
			unsigned long len);
void write_extent_buffer(struct extent_buffer *eb, const void *src,
			 unsigned long start, unsigned long len);
void copy_extent_buffer(struct extent_buffer *dst, struct extent_buffer *src,
			unsigned long dst_offset, unsigned long src_offset,
			unsigned long len);
void memcpy_extent_buffer(struct extent_buffer *dst, unsigned long dst_offset,
			   unsigned long src_offset, unsigned long len);
void memmove_extent_buffer(struct extent_buffer *dst, unsigned long dst_offset,
			   unsigned long src_offset, unsigned long len);
void memset_extent_buffer(struct extent_buffer *eb, char c,
			  unsigned long start, unsigned long len);
305
void wait_extent_bit(struct extent_io_tree *tree, u64 start, u64 end, int bits);
306
void clear_extent_buffer_dirty(struct extent_buffer *eb);
307 308 309 310
int set_extent_buffer_dirty(struct extent_buffer *eb);
int set_extent_buffer_uptodate(struct extent_buffer *eb);
int clear_extent_buffer_uptodate(struct extent_buffer *eb);
int extent_buffer_uptodate(struct extent_buffer *eb);
311
int map_private_extent_buffer(struct extent_buffer *eb, unsigned long offset,
312
		      unsigned long min_len, char **map,
313
		      unsigned long *map_start,
314
		      unsigned long *map_len);
315 316
int extent_range_uptodate(struct extent_io_tree *tree,
			  u64 start, u64 end);
C
Chris Mason 已提交
317 318 319
int extent_clear_unlock_delalloc(struct inode *inode,
				struct extent_io_tree *tree,
				u64 start, u64 end, struct page *locked_page,
320
				unsigned long op);
321 322 323
struct bio *
btrfs_bio_alloc(struct block_device *bdev, u64 first_sector, int nr_vecs,
		gfp_t gfp_flags);
324 325 326 327 328 329

struct btrfs_mapping_tree;

/*
 * I/O failure repair and end-of-writepage entry points.
 *
 * NOTE(review): argument semantics and return-value conventions are not
 * visible in this header -- confirm against the implementation.
 */
int repair_io_failure(struct btrfs_mapping_tree *map_tree, u64 start,
			u64 length, u64 logical, struct page *page,
			int mirror_num);
int end_extent_writepage(struct page *page, int err, u64 start, u64 end);
int repair_eb_io_failure(struct btrfs_root *root, struct extent_buffer *eb,
			 int mirror_num);
#endif