/* SPDX-License-Identifier: GPL-2.0 */

#ifndef BTRFS_EXTENT_IO_H
#define BTRFS_EXTENT_IO_H

#include <linux/rbtree.h>
#include <linux/refcount.h>
#include <linux/fiemap.h>
#include <linux/btrfs_tree.h>
#include "compression.h"
#include "ulist.h"

/*
 * Extent buffer state flags.
 *
 * Each enumerator is a bit number (not a mask), assigned sequentially from 0.
 * extent_buffer_uptodate() tests EXTENT_BUFFER_UPTODATE with test_bit() on
 * extent_buffer::bflags; the other values are presumably used the same way.
 */
enum {
	EXTENT_BUFFER_UPTODATE,
	EXTENT_BUFFER_DIRTY,
	EXTENT_BUFFER_CORRUPT,
	/* this got triggered by readahead */
	EXTENT_BUFFER_READAHEAD,
	EXTENT_BUFFER_TREE_REF,
	EXTENT_BUFFER_STALE,
	EXTENT_BUFFER_WRITEBACK,
	/* read IO error */
	EXTENT_BUFFER_READ_ERR,
	EXTENT_BUFFER_UNMAPPED,
	EXTENT_BUFFER_IN_TREE,
	/* write IO error */
	EXTENT_BUFFER_WRITE_ERR,
	EXTENT_BUFFER_NO_CHECK,
	EXTENT_BUFFER_ZONE_FINISH,
};

/*
 * these are flags for __process_pages_contig
 *
 * Every flag is a distinct single-bit mask, so several of them can be OR-ed
 * together into one value.
 */
#define PAGE_UNLOCK		(1 << 0)
/* Page starts writeback, clear dirty bit and set writeback bit */
#define PAGE_START_WRITEBACK	(1 << 1)
#define PAGE_END_WRITEBACK	(1 << 2)
#define PAGE_SET_ORDERED	(1 << 3)
#define PAGE_SET_ERROR		(1 << 4)
#define PAGE_LOCK		(1 << 5)

/*
 * page->private values.  Every page that is controlled by the extent
 * map has page->private set to one.
 */
#define EXTENT_PAGE_PRIVATE 1

/*
 * The extent buffer bitmap operations are done with byte granularity instead of
 * word granularity for two reasons:
 * 1. The bitmaps must be little-endian on disk.
 * 2. Bitmap items are not guaranteed to be aligned to a word and therefore a
 *    single word in a bitmap may straddle two pages in the extent buffer.
 */

/* Index of the byte that holds bit number @nr. */
#define BIT_BYTE(nr) ((nr) / BITS_PER_BYTE)
/* Mask with every bit of a single byte set. */
#define BYTE_MASK ((1 << BITS_PER_BYTE) - 1)
/* Byte mask with the bits from (@start modulo byte width) upwards set. */
#define BITMAP_FIRST_BYTE_MASK(start) \
	((BYTE_MASK << ((start) & (BITS_PER_BYTE - 1))) & BYTE_MASK)
/*
 * Byte mask with the low (@nbits modulo byte width) bits set; a full byte
 * when @nbits is a multiple of the byte width.
 */
#define BITMAP_LAST_BYTE_MASK(nbits) \
	(BYTE_MASK >> (-(nbits) & (BITS_PER_BYTE - 1)))

/*
 * Forward declarations: only pointers to these types are needed by the
 * declarations in this header.
 */
struct btrfs_root;
struct btrfs_inode;
struct btrfs_io_bio;
struct btrfs_fs_info;
struct io_failure_record;
struct extent_io_tree;

/*
 * Function type (not a pointer type) of a bio submission hook; users declare
 * a pointer to it, as btrfs_repair_one_sector() does for its last argument.
 */
typedef void (submit_bio_hook_t)(struct inode *inode, struct bio *bio,
					 int mirror_num,
					 unsigned long bio_flags);

72
typedef blk_status_t (extent_submit_bio_start_t)(struct inode *inode,
73
		struct bio *bio, u64 dio_file_offset);
74

/*
 * Number of pages needed to hold the largest metadata block; sizes the
 * pages[] array embedded in struct extent_buffer.
 */
#define INLINE_EXTENT_BUFFER_PAGES     (BTRFS_MAX_METADATA_BLOCKSIZE / PAGE_SIZE)
76 77 78
struct extent_buffer {
	u64 start;
	unsigned long len;
79
	unsigned long bflags;
80
	struct btrfs_fs_info *fs_info;
81
	spinlock_t refs_lock;
82
	atomic_t refs;
83
	atomic_t io_pages;
84
	int read_mirror;
85
	struct rcu_head rcu_head;
86
	pid_t lock_owner;
87
	/* >= 0 if eb belongs to a log tree, -1 otherwise */
88 89 90
	s8 log_index;

	struct rw_semaphore lock;
91

92
	struct page *pages[INLINE_EXTENT_BUFFER_PAGES];
93
	struct list_head release_list;
94 95 96
#ifdef CONFIG_BTRFS_DEBUG
	struct list_head leak_list;
#endif
97 98
};

99 100 101 102 103
/*
 * Structure to record how many bytes and which ranges are set/cleared
 */
struct extent_changeset {
	/* How many bytes are set/cleared in this operation */
104
	u64 bytes_changed;
105 106

	/* Changed ranges */
107
	struct ulist range_changed;
108 109
};

110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143
static inline void extent_changeset_init(struct extent_changeset *changeset)
{
	changeset->bytes_changed = 0;
	ulist_init(&changeset->range_changed);
}

/*
 * Allocate a changeset with kmalloc(GFP_KERNEL) and initialise it.
 *
 * Returns the new changeset, or NULL if the allocation failed.  The result
 * is meant to be disposed of with extent_changeset_free().
 */
static inline struct extent_changeset *extent_changeset_alloc(void)
{
	struct extent_changeset *changeset;

	changeset = kmalloc(sizeof(*changeset), GFP_KERNEL);
	if (changeset)
		extent_changeset_init(changeset);

	return changeset;
}

/*
 * Drop the contents of @changeset without freeing the structure itself:
 * the byte counter is zeroed and the range list is handed to
 * ulist_release().  A NULL @changeset is silently ignored.
 */
static inline void extent_changeset_release(struct extent_changeset *changeset)
{
	if (changeset) {
		changeset->bytes_changed = 0;
		ulist_release(&changeset->range_changed);
	}
}

/*
 * Release the contents of @changeset and then kfree() the structure.
 * A NULL @changeset is silently ignored.
 */
static inline void extent_changeset_free(struct extent_changeset *changeset)
{
	if (changeset) {
		extent_changeset_release(changeset);
		kfree(changeset);
	}
}

144 145
struct extent_map_tree;

146
typedef struct extent_map *(get_extent_t)(struct btrfs_inode *inode,
147 148
					  struct page *page, size_t pg_offset,
					  u64 start, u64 len);
149

150
int try_release_extent_mapping(struct page *page, gfp_t mask);
151
int try_release_extent_buffer(struct page *page);
152

153
int btrfs_readpage(struct file *file, struct page *page);
154
int extent_write_full_page(struct page *page, struct writeback_control *wbc);
155
int extent_write_locked_range(struct inode *inode, u64 start, u64 end);
156
int extent_writepages(struct address_space *mapping,
157
		      struct writeback_control *wbc);
158 159
int btree_write_cache_pages(struct address_space *mapping,
			    struct writeback_control *wbc);
160
void extent_readahead(struct readahead_control *rac);
161
int extent_fiemap(struct btrfs_inode *inode, struct fiemap_extent_info *fieinfo,
162
		  u64 start, u64 len);
163 164
int set_page_extent_mapped(struct page *page);
void clear_page_extent_mapped(struct page *page);
165

166
struct extent_buffer *alloc_extent_buffer(struct btrfs_fs_info *fs_info,
167
					  u64 start, u64 owner_root, int level);
168 169
struct extent_buffer *__alloc_dummy_extent_buffer(struct btrfs_fs_info *fs_info,
						  u64 start, unsigned long len);
170
struct extent_buffer *alloc_dummy_extent_buffer(struct btrfs_fs_info *fs_info,
171
						u64 start);
172
struct extent_buffer *btrfs_clone_extent_buffer(const struct extent_buffer *src);
173
struct extent_buffer *find_extent_buffer(struct btrfs_fs_info *fs_info,
174
					 u64 start);
175
void free_extent_buffer(struct extent_buffer *eb);
176
void free_extent_buffer_stale(struct extent_buffer *eb);
177 178 179
#define WAIT_NONE	0
#define WAIT_COMPLETE	1
#define WAIT_PAGE_LOCK	2
180
int read_extent_buffer_pages(struct extent_buffer *eb, int wait,
181
			     int mirror_num);
182
void wait_on_extent_buffer_writeback(struct extent_buffer *eb);
183
void btrfs_readahead_tree_block(struct btrfs_fs_info *fs_info,
184
				u64 bytenr, u64 owner_root, u64 gen, int level);
185
void btrfs_readahead_node_child(struct extent_buffer *node, int slot);
186

187
static inline int num_extent_pages(const struct extent_buffer *eb)
188
{
189 190 191 192 193 194 195 196
	/*
	 * For sectorsize == PAGE_SIZE case, since nodesize is always aligned to
	 * sectorsize, it's just eb->len >> PAGE_SHIFT.
	 *
	 * For sectorsize < PAGE_SIZE case, we could have nodesize < PAGE_SIZE,
	 * thus have to ensure we get at least one page.
	 */
	return (eb->len >> PAGE_SHIFT) ?: 1;
197 198
}

199
static inline int extent_buffer_uptodate(const struct extent_buffer *eb)
200 201 202 203
{
	return test_bit(EXTENT_BUFFER_UPTODATE, &eb->bflags);
}

204 205 206
int memcmp_extent_buffer(const struct extent_buffer *eb, const void *ptrv,
			 unsigned long start, unsigned long len);
void read_extent_buffer(const struct extent_buffer *eb, void *dst,
207 208
			unsigned long start,
			unsigned long len);
209 210 211
int read_extent_buffer_to_user_nofault(const struct extent_buffer *eb,
				       void __user *dst, unsigned long start,
				       unsigned long len);
212 213
void write_extent_buffer_fsid(const struct extent_buffer *eb, const void *src);
void write_extent_buffer_chunk_tree_uuid(const struct extent_buffer *eb,
214
		const void *src);
215
void write_extent_buffer(const struct extent_buffer *eb, const void *src,
216
			 unsigned long start, unsigned long len);
217 218 219 220
void copy_extent_buffer_full(const struct extent_buffer *dst,
			     const struct extent_buffer *src);
void copy_extent_buffer(const struct extent_buffer *dst,
			const struct extent_buffer *src,
221 222
			unsigned long dst_offset, unsigned long src_offset,
			unsigned long len);
223 224 225 226 227
void memcpy_extent_buffer(const struct extent_buffer *dst,
			  unsigned long dst_offset, unsigned long src_offset,
			  unsigned long len);
void memmove_extent_buffer(const struct extent_buffer *dst,
			   unsigned long dst_offset, unsigned long src_offset,
228
			   unsigned long len);
229
void memzero_extent_buffer(const struct extent_buffer *eb, unsigned long start,
230
			   unsigned long len);
231
int extent_buffer_test_bit(const struct extent_buffer *eb, unsigned long start,
232
			   unsigned long pos);
233
void extent_buffer_bitmap_set(const struct extent_buffer *eb, unsigned long start,
234
			      unsigned long pos, unsigned long len);
235 236 237 238
void extent_buffer_bitmap_clear(const struct extent_buffer *eb,
				unsigned long start, unsigned long pos,
				unsigned long len);
void clear_extent_buffer_dirty(const struct extent_buffer *eb);
239
bool set_extent_buffer_dirty(struct extent_buffer *eb);
240
void set_extent_buffer_uptodate(struct extent_buffer *eb);
241
void clear_extent_buffer_uptodate(struct extent_buffer *eb);
242
int extent_buffer_under_io(const struct extent_buffer *eb);
243
void extent_range_clear_dirty_for_io(struct inode *inode, u64 start, u64 end);
244
void extent_range_redirty_for_io(struct inode *inode, u64 start, u64 end);
245
void extent_clear_unlock_delalloc(struct btrfs_inode *inode, u64 start, u64 end,
246
				  struct page *locked_page,
247
				  u32 bits_to_clear, unsigned long page_ops);
248 249

int btrfs_alloc_page_array(unsigned int nr_pages, struct page **page_array);
250
struct bio *btrfs_bio_alloc(unsigned int nr_iovecs);
251
struct bio *btrfs_bio_clone(struct block_device *bdev, struct bio *bio);
252
struct bio *btrfs_bio_clone_partial(struct bio *orig, u64 offset, u64 size);
253

254
void end_extent_writepage(struct page *page, int err, u64 start, u64 end);
255
int btrfs_repair_eb_io_failure(const struct extent_buffer *eb, int mirror_num);
256 257 258 259 260

/*
 * When IO fails, either with EIO or csum verification fails, we
 * try other mirrors that might have a good copy of the data.  This
 * io_failure_record is used to record state as we go through all the
261
 * mirrors.  If another mirror has good data, the sector is set up to date
262 263 264 265 266 267 268 269
 * and things continue.  If a good mirror can't be found, the original
 * bio end_io callback is called to indicate things have failed.
 */
struct io_failure_record {
	struct page *page;
	u64 start;
	u64 len;
	u64 logical;
270
	enum btrfs_compression_type compress_type;
271 272 273 274
	int this_mirror;
	int failed_mirror;
};

275 276 277 278 279
int btrfs_repair_one_sector(struct inode *inode,
			    struct bio *failed_bio, u32 bio_offset,
			    struct page *page, unsigned int pgoff,
			    u64 start, int failed_mirror,
			    submit_bio_hook_t *submit_bio_hook);
280

281
#ifdef CONFIG_BTRFS_FS_RUN_SANITY_TESTS
282
bool find_lock_delalloc_range(struct inode *inode,
283 284
			     struct page *locked_page, u64 *start,
			     u64 *end);
285
#endif
286
struct extent_buffer *alloc_test_extent_buffer(struct btrfs_fs_info *fs_info,
287
					       u64 start);
288 289 290 291 292 293 294

/*
 * Extent buffer leak check: a real function when CONFIG_BTRFS_DEBUG is set,
 * otherwise an empty statement that ignores its argument.
 */
#ifndef CONFIG_BTRFS_DEBUG
#define btrfs_extent_buffer_leak_debug_check(fs_info)	do {} while (0)
#else
void btrfs_extent_buffer_leak_debug_check(struct btrfs_fs_info *fs_info);
#endif

#endif /* BTRFS_EXTENT_IO_H */