/* SPDX-License-Identifier: GPL-2.0 */
#ifndef LINUX_IOMAP_H
#define LINUX_IOMAP_H 1

#include <linux/atomic.h>
#include <linux/bitmap.h>
#include <linux/blk_types.h>
#include <linux/mm.h>
#include <linux/types.h>
#include <linux/mm_types.h>
#include <linux/blkdev.h>

/*
 * Opaque forward declarations: nothing in this header needs the layout of
 * these types, only their names.
 */
struct address_space;
struct fiemap_extent_info;
struct inode;
struct iomap_writepage_ctx;
struct iov_iter;
struct kiocb;
struct page;
struct vm_area_struct;
struct vm_fault;

/*
 * Types of block ranges for iomap mappings:
 *
 * These are sequential values rather than bit flags, so exactly one of them
 * describes a mapping (see the 'type' member of struct iomap).
 */
#define IOMAP_HOLE	0x01	/* no blocks allocated, need allocation */
#define IOMAP_DELALLOC	0x02	/* delayed allocation blocks */
#define IOMAP_MAPPED	0x03	/* blocks allocated at @addr */
#define IOMAP_UNWRITTEN	0x04	/* blocks allocated at @addr in unwritten state */
#define IOMAP_INLINE	0x05	/* data inline in the inode */

/*
 * Flags for all iomap mappings:
 *
 * IOMAP_F_DIRTY indicates the inode has uncommitted metadata needed to access
 * written data and requires fdatasync to commit them to persistent storage.
 * This needs to take into account metadata changes that *may* be made at IO
 * completion, such as file size updates from direct IO.
 */
#define IOMAP_F_NEW		0x01	/* blocks have been newly allocated */
#define IOMAP_F_DIRTY		0x02	/* uncommitted metadata */
#define IOMAP_F_BUFFER_HEAD	0x04	/* file system requires buffer heads */
#define IOMAP_F_SIZE_CHANGED	0x08	/* file size has changed */

/*
 * Flags that only need to be reported for IOMAP_REPORT requests:
 */
#define IOMAP_F_MERGED		0x10	/* contains multiple blocks/extents */
#define IOMAP_F_SHARED		0x20	/* block shared with another file */

/*
 * Flags from 0x1000 up are for file system specific usage.
 *
 * The 'flags' member of struct iomap is a u16, so this leaves the four bits
 * 0x1000 through 0x8000 available to the file system.
 */
#define IOMAP_F_PRIVATE		0x1000


/*
 * Magic value for addr:
 *
 * All bits set in an unsigned long long.  The expansion is parenthesized so
 * that the macro behaves as a single operand wherever it is used.
 */
#define IOMAP_NULL_ADDR	(-1ULL)	/* addr is not valid */

62 63
struct iomap_page_ops;

64
struct iomap {
65
	u64			addr; /* disk offset of mapping, bytes */
66 67
	loff_t			offset;	/* file offset of mapping, bytes */
	u64			length;	/* length of mapping, bytes */
68 69
	u16			type;	/* type of mapping */
	u16			flags;	/* flags for mapping */
70
	struct block_device	*bdev;	/* block device for I/O */
71
	struct dax_device	*dax_dev; /* dax_dev for dax operations */
72
	void			*inline_data;
73
	void			*private; /* filesystem private */
74 75
	const struct iomap_page_ops *page_ops;
};
76

77 78 79 80 81 82
static inline sector_t
iomap_sector(struct iomap *iomap, loff_t pos)
{
	return (iomap->addr + pos - iomap->offset) >> SECTOR_SHIFT;
}

83 84 85 86 87 88 89 90 91 92 93 94 95
/*
 * When a filesystem sets page_ops in an iomap mapping it returns, page_prepare
 * and page_done will be called for each page written to.  This only applies to
 * buffered writes as unbuffered writes will not typically have pages
 * associated with them.
 *
 * When page_prepare succeeds, page_done will always be called to do any
 * cleanup work necessary.  In that page_done call, @page will be NULL if the
 * associated page could not be obtained.
 */
struct iomap_page_ops {
	int (*page_prepare)(struct inode *inode, loff_t pos, unsigned len,
			struct iomap *iomap);
96 97
	void (*page_done)(struct inode *inode, loff_t pos, unsigned copied,
			struct page *page, struct iomap *iomap);
98 99 100 101 102
};

/*
 * Flags for iomap_begin / iomap_end.  No flag implies a read.
 *
 * Each flag occupies its own bit, so they can be OR-ed together.
 */
#define IOMAP_WRITE		(1 << 0) /* writing, must allocate blocks */
#define IOMAP_ZERO		(1 << 1) /* zeroing operation, may skip holes */
#define IOMAP_REPORT		(1 << 2) /* report extent status, e.g. FIEMAP */
#define IOMAP_FAULT		(1 << 3) /* mapping for page fault */
#define IOMAP_DIRECT		(1 << 4) /* direct I/O */
#define IOMAP_NOWAIT		(1 << 5) /* do not block */

/*
 * Mapping callbacks supplied by the file system.  @flags in both callbacks
 * carries the IOMAP_* operation flags (IOMAP_WRITE, IOMAP_ZERO, ...).
 */
struct iomap_ops {
	/*
	 * Return the existing mapping at pos, or reserve space starting at
	 * pos for up to length, as long as we can do it as a single mapping.
	 * The actual length is returned in iomap->length.
	 */
	int (*iomap_begin)(struct inode *inode, loff_t pos, loff_t length,
			unsigned flags, struct iomap *iomap);

	/*
	 * Commit and/or unreserve space previously allocated using
	 * iomap_begin.  Written indicates the length of the successful write
	 * operation which needs to be committed, while the rest needs to be
	 * unreserved.  Written might be zero if no data was written.
	 */
	int (*iomap_end)(struct inode *inode, loff_t pos, loff_t length,
			ssize_t written, unsigned flags, struct iomap *iomap);
};

129 130 131 132 133 134 135 136 137 138
/*
 * Main iomap iterator function.
 */
typedef loff_t (*iomap_actor_t)(struct inode *inode, loff_t pos, loff_t len,
		void *data, struct iomap *iomap);

loff_t iomap_apply(struct inode *inode, loff_t pos, loff_t length,
		unsigned flags, const struct iomap_ops *ops, void *data,
		iomap_actor_t actor);

139
ssize_t iomap_file_buffered_write(struct kiocb *iocb, struct iov_iter *from,
140
		const struct iomap_ops *ops);
141 142 143
int iomap_readpage(struct page *page, const struct iomap_ops *ops);
int iomap_readpages(struct address_space *mapping, struct list_head *pages,
		unsigned nr_pages, const struct iomap_ops *ops);
144
int iomap_set_page_dirty(struct page *page);
/* Page state helpers; none of these take an iomap_ops argument. */
int iomap_is_partially_uptodate(struct page *page, unsigned long from,
		unsigned long count);
int iomap_releasepage(struct page *page, gfp_t gfp_mask);
void iomap_invalidatepage(struct page *page, unsigned int offset,
		unsigned int len);
/*
 * Without CONFIG_MIGRATION there is no iomap_migrate_page() function; the
 * name expands to NULL instead, so it can still be used where a (possibly
 * absent) function pointer is expected.
 */
#ifdef CONFIG_MIGRATION
int iomap_migrate_page(struct address_space *mapping, struct page *newpage,
		struct page *page, enum migrate_mode mode);
#else
#define iomap_migrate_page NULL
#endif
C
Christoph Hellwig 已提交
156
int iomap_file_dirty(struct inode *inode, loff_t pos, loff_t len,
157
		const struct iomap_ops *ops);
158
int iomap_zero_range(struct inode *inode, loff_t pos, loff_t len,
159
		bool *did_zero, const struct iomap_ops *ops);
160
int iomap_truncate_page(struct inode *inode, loff_t pos, bool *did_zero,
161
		const struct iomap_ops *ops);
162 163
vm_fault_t iomap_page_mkwrite(struct vm_fault *vmf,
			const struct iomap_ops *ops);
164
int iomap_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
165
		loff_t start, loff_t len, const struct iomap_ops *ops);
166 167 168 169
loff_t iomap_seek_hole(struct inode *inode, loff_t offset,
		const struct iomap_ops *ops);
loff_t iomap_seek_data(struct inode *inode, loff_t offset,
		const struct iomap_ops *ops);
170 171
sector_t iomap_bmap(struct address_space *mapping, sector_t bno,
		const struct iomap_ops *ops);
172

173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229
/*
 * Structure for writeback I/O completions.
 */
struct iomap_ioend {
	struct list_head	io_list;	/* next ioend in chain */
	u16			io_type;
	u16			io_flags;	/* IOMAP_F_* */
	struct inode		*io_inode;	/* file being written to */
	size_t			io_size;	/* size of the extent */
	loff_t			io_offset;	/* offset in the file */
	void			*io_private;	/* file system private data */
	struct bio		*io_bio;	/* bio being built */
	struct bio		io_inline_bio;	/* MUST BE LAST! */
};

/*
 * Writeback callbacks supplied by the file system.  A pointer to this table
 * is passed to iomap_writepage() / iomap_writepages() and is also stored in
 * struct iomap_writepage_ctx.
 */
struct iomap_writeback_ops {
	/*
	 * Required, maps the blocks so that writeback can be performed on
	 * the range starting at offset.
	 */
	int (*map_blocks)(struct iomap_writepage_ctx *wpc, struct inode *inode,
				loff_t offset);

	/*
	 * Optional, allows the file systems to perform actions just before
	 * submitting the bio and/or override the bio end_io handler for complex
	 * operations like copy on write extent manipulation or unwritten extent
	 * conversions.
	 */
	int (*prepare_ioend)(struct iomap_ioend *ioend, int status);

	/*
	 * Optional, allows the file system to discard state on a page where
	 * we failed to submit any I/O.
	 */
	void (*discard_page)(struct page *page);
};

/*
 * Context handed to iomap_writepage() / iomap_writepages() and to the
 * ->map_blocks callback of struct iomap_writeback_ops.
 */
struct iomap_writepage_ctx {
	struct iomap		iomap;	/* NOTE(review): presumably the mapping filled in by ->map_blocks - confirm */
	struct iomap_ioend	*ioend;	/* NOTE(review): presumably the ioend currently being built - confirm */
	const struct iomap_writeback_ops *ops;	/* file system writeback callbacks */
};

/*
 * ioend handling and writeback entry points.  Only the prototypes are
 * declared here.  iomap_ioend_try_merge() takes an optional-looking
 * @merge_private callback operating on two ioends (NOTE(review): whether
 * NULL is accepted is not visible from this header - confirm).
 */
void iomap_finish_ioends(struct iomap_ioend *ioend, int error);
void iomap_ioend_try_merge(struct iomap_ioend *ioend,
		struct list_head *more_ioends,
		void (*merge_private)(struct iomap_ioend *ioend,
				struct iomap_ioend *next));
void iomap_sort_ioends(struct list_head *ioend_list);
int iomap_writepage(struct page *page, struct writeback_control *wbc,
		struct iomap_writepage_ctx *wpc,
		const struct iomap_writeback_ops *ops);
int iomap_writepages(struct address_space *mapping,
		struct writeback_control *wbc, struct iomap_writepage_ctx *wpc,
		const struct iomap_writeback_ops *ops);

/*
 * Flags for direct I/O ->end_io:
 *
 * Each flag is a separate bit, so both may be set at once.
 */
#define IOMAP_DIO_UNWRITTEN	(1 << 0)	/* covers unwritten extent(s) */
#define IOMAP_DIO_COW		(1 << 1)	/* covers COW extent(s) */

/*
 * Direct I/O callbacks supplied by the file system and passed to
 * iomap_dio_rw().  ->end_io receives the IOMAP_DIO_* flags in @flags.
 */
struct iomap_dio_ops {
	int (*end_io)(struct kiocb *iocb, ssize_t size, int error,
		      unsigned flags);
};

C
Christoph Hellwig 已提交
241
ssize_t iomap_dio_rw(struct kiocb *iocb, struct iov_iter *iter,
242 243
		const struct iomap_ops *ops, const struct iomap_dio_ops *dops,
		bool wait_for_completion);
244
int iomap_dio_iopoll(struct kiocb *kiocb, bool spin);
C
Christoph Hellwig 已提交
245

/*
 * Swap file activation.  Without CONFIG_SWAP the call is replaced by the
 * constant (-EIO) and none of its arguments are evaluated.
 */
#ifdef CONFIG_SWAP
struct file;
struct swap_info_struct;

int iomap_swapfile_activate(struct swap_info_struct *sis,
		struct file *swap_file, sector_t *pagespan,
		const struct iomap_ops *ops);
#else
# define iomap_swapfile_activate(sis, swapfile, pagespan, ops)	(-EIO)
#endif /* CONFIG_SWAP */

#endif /* LINUX_IOMAP_H */