dax.h 5.1 KB
Newer Older
1 2 3 4 5
#ifndef _LINUX_DAX_H
#define _LINUX_DAX_H

#include <linux/fs.h>
#include <linux/mm.h>
6
#include <linux/radix-tree.h>
7 8
#include <asm/pgtable.h>

9
struct iomap_ops;
D
Dan Williams 已提交
10 11 12 13 14 15 16 17 18
struct dax_device;
struct dax_operations {
	/*
	 * direct_access: translate a device-relative
	 * logical-page-offset into an absolute physical pfn. Return the
	 * number of pages available for DAX at that pfn.
	 */
	long (*direct_access)(struct dax_device *, pgoff_t, long,
			void **, pfn_t *);
19
	/* copy_from_iter: required operation for fs-dax direct-i/o */
20 21
	size_t (*copy_from_iter)(struct dax_device *, pgoff_t, void *, size_t,
			struct iov_iter *);
22 23
	/* flush: optional driver-specific cache management after writes */
	void (*flush)(struct dax_device *, pgoff_t, void *, size_t);
D
Dan Williams 已提交
24
};
25

26 27
extern struct attribute_group dax_attribute_group;

28 29 30 31 32 33 34 35 36 37 38 39 40 41
#if IS_ENABLED(CONFIG_DAX)
struct dax_device *dax_get_by_host(const char *host);
void put_dax(struct dax_device *dax_dev);
#else
static inline struct dax_device *dax_get_by_host(const char *host)
{
	return NULL;
}

static inline void put_dax(struct dax_device *dax_dev)
{
}
#endif

42 43 44 45 46 47 48
int bdev_dax_pgoff(struct block_device *, sector_t, size_t, pgoff_t *pgoff);
#if IS_ENABLED(CONFIG_FS_DAX)
int __bdev_dax_supported(struct super_block *sb, int blocksize);
static inline int bdev_dax_supported(struct super_block *sb, int blocksize)
{
	return __bdev_dax_supported(sb, blocksize);
}
49 50 51 52 53 54 55 56 57 58 59

static inline struct dax_device *fs_dax_get_by_host(const char *host)
{
	return dax_get_by_host(host);
}

static inline void fs_put_dax(struct dax_device *dax_dev)
{
	put_dax(dax_dev);
}

60
struct dax_device *fs_dax_get_by_bdev(struct block_device *bdev);
61 62 63 64 65 66
#else
static inline int bdev_dax_supported(struct super_block *sb, int blocksize)
{
	return -EOPNOTSUPP;
}

67
static inline struct dax_device *fs_dax_get_by_host(const char *host)
68 69 70 71
{
	return NULL;
}

72
static inline void fs_put_dax(struct dax_device *dax_dev)
73 74
{
}
75 76 77 78 79

static inline struct dax_device *fs_dax_get_by_bdev(struct block_device *bdev)
{
	return NULL;
}
80 81
#endif

82 83
int dax_read_lock(void);
void dax_read_unlock(int id);
D
Dan Williams 已提交
84 85 86 87 88
struct dax_device *alloc_dax(void *private, const char *host,
		const struct dax_operations *ops);
bool dax_alive(struct dax_device *dax_dev);
void kill_dax(struct dax_device *dax_dev);
void *dax_get_private(struct dax_device *dax_dev);
89 90
long dax_direct_access(struct dax_device *dax_dev, pgoff_t pgoff, long nr_pages,
		void **kaddr, pfn_t *pfn);
91 92
size_t dax_copy_from_iter(struct dax_device *dax_dev, pgoff_t pgoff, void *addr,
		size_t bytes, struct iov_iter *i);
93 94
void dax_flush(struct dax_device *dax_dev, pgoff_t pgoff, void *addr,
		size_t size);
95
void dax_write_cache(struct dax_device *dax_dev, bool wc);
96
bool dax_write_cache_enabled(struct dax_device *dax_dev);
97

98
/*
99 100 101 102 103 104 105 106
 * We use lowest available bit in exceptional entry for locking, one bit for
 * the entry size (PMD) and two more to tell us if the entry is a huge zero
 * page (HZP) or an empty entry that is just used for locking.  In total four
 * special bits.
 *
 * If the PMD bit isn't set the entry has size PAGE_SIZE, and if the HZP and
 * EMPTY bits aren't set the entry is a normal DAX entry with a filesystem
 * block allocation.
107
 */
108
#define RADIX_DAX_SHIFT	(RADIX_TREE_EXCEPTIONAL_SHIFT + 4)
109
#define RADIX_DAX_ENTRY_LOCK (1 << RADIX_TREE_EXCEPTIONAL_SHIFT)
110 111 112
#define RADIX_DAX_PMD (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 1))
#define RADIX_DAX_HZP (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 2))
#define RADIX_DAX_EMPTY (1 << (RADIX_TREE_EXCEPTIONAL_SHIFT + 3))
113

114 115 116 117 118 119 120 121 122 123 124
static inline unsigned long dax_radix_sector(void *entry)
{
	return (unsigned long)entry >> RADIX_DAX_SHIFT;
}

static inline void *dax_radix_locked_entry(sector_t sector, unsigned long flags)
{
	return (void *)(RADIX_TREE_EXCEPTIONAL_ENTRY | flags |
			((unsigned long)sector << RADIX_DAX_SHIFT) |
			RADIX_DAX_ENTRY_LOCK);
}
125

126
ssize_t dax_iomap_rw(struct kiocb *iocb, struct iov_iter *iter,
127
		const struct iomap_ops *ops);
128 129
int dax_iomap_fault(struct vm_fault *vmf, enum page_entry_size pe_size,
		    const struct iomap_ops *ops);
J
Jan Kara 已提交
130
int dax_delete_mapping_entry(struct address_space *mapping, pgoff_t index);
131 132
int dax_invalidate_mapping_entry_sync(struct address_space *mapping,
				      pgoff_t index);
J
Jan Kara 已提交
133
void dax_wake_mapping_entry_waiter(struct address_space *mapping,
134
		pgoff_t index, void *entry, bool wake_all);
135 136

#ifdef CONFIG_FS_DAX
137 138
int __dax_zero_page_range(struct block_device *bdev,
		struct dax_device *dax_dev, sector_t sector,
139
		unsigned int offset, unsigned int length);
140
#else
141
static inline int __dax_zero_page_range(struct block_device *bdev,
142 143
		struct dax_device *dax_dev, sector_t sector,
		unsigned int offset, unsigned int length)
144 145 146
{
	return -ENXIO;
}
147 148
#endif

149 150 151 152 153 154 155 156 157 158 159 160 161
#ifdef CONFIG_FS_DAX_PMD
static inline unsigned int dax_radix_order(void *entry)
{
	if ((unsigned long)entry & RADIX_DAX_PMD)
		return PMD_SHIFT - PAGE_SHIFT;
	return 0;
}
#else
static inline unsigned int dax_radix_order(void *entry)
{
	return 0;
}
#endif
162
int dax_pfn_mkwrite(struct vm_fault *vmf);
163

164 165 166 167
static inline bool dax_mapping(struct address_space *mapping)
{
	return mapping->host && IS_DAX(mapping->host);
}
168 169 170 171

struct writeback_control;
int dax_writeback_mapping_range(struct address_space *mapping,
		struct block_device *bdev, struct writeback_control *wbc);
172
#endif