xfs_buf.h 11.6 KB
Newer Older
L
Linus Torvalds 已提交
1
/*
2 3
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
L
Linus Torvalds 已提交
4
 *
5 6
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
L
Linus Torvalds 已提交
7 8
 * published by the Free Software Foundation.
 *
9 10 11 12
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
L
Linus Torvalds 已提交
13
 *
14 15 16
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
L
Linus Torvalds 已提交
17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32
 */
#ifndef __XFS_BUF_H__
#define __XFS_BUF_H__

#include <linux/list.h>
#include <linux/types.h>
#include <linux/spinlock.h>
#include <linux/mm.h>
#include <linux/fs.h>
#include <linux/buffer_head.h>
#include <linux/uio.h>

/*
 *	Base types
 */

33 34 35 36 37 38 39 40
#define XFS_BUF_DADDR_NULL	((xfs_daddr_t) (-1LL))

/*
 * Operation selector for xfs_buf_iomove(), which takes it as its last
 * argument.  xfs_buf_zero() is the XBRW_ZERO case with a NULL data pointer.
 */
typedef enum {
	XBRW_READ = 1,			/* transfer into target memory */
	XBRW_WRITE = 2,			/* transfer from target memory */
	XBRW_ZERO = 3,			/* Zero target memory */
} xfs_buf_rw_t;

41 42 43 44 45 46
/*
 * Buffer flag bits carried in xfs_buf_flags_t values (e.g. b_flags).
 * Bit 3 is not assigned in this group.
 */
#define XBF_READ	 (1 << 0) /* buffer intended for reading from device */
#define XBF_WRITE	 (1 << 1) /* buffer intended for writing to device */
#define XBF_READ_AHEAD	 (1 << 2) /* asynchronous read-ahead */
#define XBF_ASYNC	 (1 << 4) /* initiator will not wait for completion */
#define XBF_DONE	 (1 << 5) /* all pages in the buffer uptodate */
#define XBF_STALE	 (1 << 6) /* buffer has been staled, do not find it */
47 48

/* I/O hints for the BIO layer */
49 50 51
/* Bits 10-12: I/O hint flags; cleared together by XFS_BUF_ZEROFLAGS(). */
#define XBF_SYNCIO	 (1 << 10)/* treat this buffer as synchronous I/O */
#define XBF_FUA		 (1 << 11)/* force cache write through mode */
#define XBF_FLUSH	 (1 << 12)/* flush the disk cache before a write */
L
Linus Torvalds 已提交
52

53
/* flags used only as arguments to access routines */
54 55
/*
 * Bits 16-17: argument-only flags.  The XFS_BUF_FLAGS name table marks both
 * as "should never be set" on a buffer.
 */
#define XBF_TRYLOCK	 (1 << 16)/* lock requested, but do not wait */
#define XBF_UNMAPPED	 (1 << 17)/* do not map the buffer */
L
Linus Torvalds 已提交
56

57
/* flags used only internally */
58 59 60 61 62
/* Bits 20-24: internal state flags (leading underscore marks them private). */
#define _XBF_PAGES	 (1 << 20)/* backed by refcounted pages */
#define _XBF_KMEM	 (1 << 21)/* backed by heap memory */
#define _XBF_DELWRI_Q	 (1 << 22)/* buffer on a delwri queue */
#define _XBF_COMPOUND	 (1 << 23)/* compound buffer */
#define _XBF_LRU_DISPOSE (1 << 24)/* buffer being discarded */
63

64
/* Integer type that carries the XBF_* and _XBF_* flag bits. */
typedef unsigned int xfs_buf_flags_t;
L
Linus Torvalds 已提交
65

C
Christoph Hellwig 已提交
66 67 68
/*
 * Initializer list pairing every buffer flag bit with a printable name.
 * Expand it inside the braces of an array of { mask, string } pairs.
 * Every line except the last must end in a backslash so the list stays a
 * single macro definition.
 */
#define XFS_BUF_FLAGS \
	{ XBF_READ,		"READ" }, \
	{ XBF_WRITE,		"WRITE" }, \
	{ XBF_READ_AHEAD,	"READ_AHEAD" }, \
	{ XBF_ASYNC,		"ASYNC" }, \
	{ XBF_DONE,		"DONE" }, \
	{ XBF_STALE,		"STALE" }, \
	{ XBF_SYNCIO,		"SYNCIO" }, \
	{ XBF_FUA,		"FUA" }, \
	{ XBF_FLUSH,		"FLUSH" }, \
	{ XBF_TRYLOCK,		"TRYLOCK" },	/* should never be set */\
	{ XBF_UNMAPPED,		"UNMAPPED" },	/* ditto */\
	{ _XBF_PAGES,		"PAGES" }, \
	{ _XBF_KMEM,		"KMEM" }, \
	{ _XBF_DELWRI_Q,	"DELWRI_Q" }, \
	{ _XBF_COMPOUND,	"COMPOUND" }, \
	{ _XBF_LRU_DISPOSE,	"LRU_DISPOSE" }
C
Christoph Hellwig 已提交
83

L
Linus Torvalds 已提交
84
typedef struct xfs_buftarg {
85 86
	dev_t			bt_dev;
	struct block_device	*bt_bdev;
87
	struct backing_dev_info	*bt_bdi;
88
	struct xfs_mount	*bt_mount;
89 90 91 92
	unsigned int		bt_bsize;
	unsigned int		bt_sshift;
	size_t			bt_smask;

93 94
	/* LRU control structures */
	struct shrinker		bt_shrinker;
95 96 97
	struct list_head	bt_lru;
	spinlock_t		bt_lru_lock;
	unsigned int		bt_lru_nr;
L
Linus Torvalds 已提交
98 99 100
} xfs_buftarg_t;

struct xfs_buf;
101
/*
 * Callback that receives the buffer and returns nothing.  It is the type of
 * the b_iodone completion hook and of the "verify" argument taken by the
 * read and readahead helpers.
 */
typedef void (*xfs_buf_iodone_t)(struct xfs_buf *);
L
Linus Torvalds 已提交
102

103

104
/* Number of page pointers held inline in struct xfs_buf (b_page_array). */
#define XB_PAGES	2
L
Linus Torvalds 已提交
105

106 107 108 109 110
/*
 * One extent of a buffer: a starting block number and a length.  The
 * *_map() lookup and read functions take an array of these (map, nmaps);
 * the single-extent wrappers build a one-entry array on the stack.
 */
struct xfs_buf_map {
	xfs_daddr_t		bm_bn;	/* block number for I/O */
	int			bm_len;	/* size of I/O */
};

111 112 113
/*
 * Declare a struct xfs_buf_map variable named @map, initialised to the
 * single extent (@blkno, @numblk).
 *
 * NOTE: the expansion already ends in ';', so the customary ';' at the call
 * site produces an additional empty statement.  @numblk is stored into the
 * int bm_len field, so wider values are converted to int.
 */
#define DEFINE_SINGLE_BUF_MAP(map, blkno, numblk) \
	struct xfs_buf_map (map) = { .bm_bn = (blkno), .bm_len = (numblk) };

L
Linus Torvalds 已提交
114
typedef struct xfs_buf {
115 116 117 118 119 120 121 122
	/*
	 * first cacheline holds all the fields needed for an uncontended cache
	 * hit to be fully processed. The semaphore straddles the cacheline
	 * boundary, but the counter and lock sits on the first cacheline,
	 * which is the only bit that is touched if we hit the semaphore
	 * fast-path on locking.
	 */
	struct rb_node		b_rbnode;	/* rbtree node */
123
	xfs_daddr_t		b_bn;		/* block number of buffer */
124
	int			b_length;	/* size of buffer in BBs */
125
	atomic_t		b_hold;		/* reference count */
126
	atomic_t		b_lru_ref;	/* lru reclaim ref count */
127
	xfs_buf_flags_t		b_flags;	/* status flags */
128
	struct semaphore	b_sema;		/* semaphore for lockables */
129

130 131 132 133
	/*
	 * concurrent access to b_lru and b_lru_flags are protected by
	 * bt_lru_lock and not by b_sema
	 */
134
	struct list_head	b_lru;		/* lru list */
135
	xfs_buf_flags_t		b_lru_flags;	/* internal lru status flags */
136 137
	wait_queue_head_t	b_waiters;	/* unpin waiters */
	struct list_head	b_list;
138
	struct xfs_perag	*b_pag;		/* contains rbtree root */
139 140 141 142
	xfs_buftarg_t		*b_target;	/* buffer target (device) */
	void			*b_addr;	/* virtual address of buffer */
	struct work_struct	b_iodone_work;
	xfs_buf_iodone_t	b_iodone;	/* I/O completion function */
143
	struct completion	b_iowait;	/* queue for I/O waiters */
144
	void			*b_fspriv;
145
	struct xfs_trans	*b_transp;
146 147
	struct page		**b_pages;	/* array of page pointers */
	struct page		*b_page_array[XB_PAGES]; /* inline pages */
148 149 150
	struct xfs_buf_map	*b_maps;	/* compound buffer map */
	struct xfs_buf_map	b_map;		/* inline compound buffer map */
	int			b_map_count;
151
	int			b_io_length;	/* IO size in BBs */
152 153 154 155 156
	atomic_t		b_pin_count;	/* pin count */
	atomic_t		b_io_remaining;	/* #outstanding I/O requests */
	unsigned int		b_page_count;	/* size of page array */
	unsigned int		b_offset;	/* page offset in first page */
	unsigned short		b_error;	/* error code on I/O */
157

158 159
#ifdef XFS_BUF_LOCK_TRACKING
	int			b_last_holder;
L
Linus Torvalds 已提交
160 161 162 163
#endif
} xfs_buf_t;

/* Finding and Reading Buffers */
164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192
struct xfs_buf *_xfs_buf_find(struct xfs_buftarg *target,
			      struct xfs_buf_map *map, int nmaps,
			      xfs_buf_flags_t flags, struct xfs_buf *new_bp);

/*
 * Single-extent front end to _xfs_buf_find(): wraps (blkno, numblks) in a
 * one-entry map and passes NULL as the new_bp argument.
 */
static inline struct xfs_buf *
xfs_incore(
	struct xfs_buftarg	*target,
	xfs_daddr_t		blkno,
	size_t			numblks,
	xfs_buf_flags_t		flags)
{
	struct xfs_buf		*found;
	DEFINE_SINGLE_BUF_MAP(extent, blkno, numblks);

	found = _xfs_buf_find(target, &extent, 1, flags, NULL);
	return found;
}

struct xfs_buf *_xfs_buf_alloc(struct xfs_buftarg *target,
			       struct xfs_buf_map *map, int nmaps,
			       xfs_buf_flags_t flags);

/*
 * Single-extent front end to _xfs_buf_alloc(): builds a one-entry map from
 * (blkno, numblks) and forwards target and flags unchanged.
 */
static inline struct xfs_buf *
xfs_buf_alloc(
	struct xfs_buftarg	*target,
	xfs_daddr_t		blkno,
	size_t			numblks,
	xfs_buf_flags_t		flags)
{
	struct xfs_buf		*new_buf;
	DEFINE_SINGLE_BUF_MAP(extent, blkno, numblks);

	new_buf = _xfs_buf_alloc(target, &extent, 1, flags);
	return new_buf;
}
L
Linus Torvalds 已提交
193

194 195 196 197 198
struct xfs_buf *xfs_buf_get_map(struct xfs_buftarg *target,
			       struct xfs_buf_map *map, int nmaps,
			       xfs_buf_flags_t flags);
struct xfs_buf *xfs_buf_read_map(struct xfs_buftarg *target,
			       struct xfs_buf_map *map, int nmaps,
199
			       xfs_buf_flags_t flags, xfs_buf_iodone_t verify);
200
void xfs_buf_readahead_map(struct xfs_buftarg *target,
201 202
			       struct xfs_buf_map *map, int nmaps,
			       xfs_buf_iodone_t verify);
203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219

/*
 * Single-extent front end to xfs_buf_get_map(): builds a one-entry map from
 * (blkno, numblks) and forwards target and flags unchanged.
 */
static inline struct xfs_buf *
xfs_buf_get(
	struct xfs_buftarg	*target,
	xfs_daddr_t		blkno,
	size_t			numblks,
	xfs_buf_flags_t		flags)
{
	struct xfs_buf		*bp;
	DEFINE_SINGLE_BUF_MAP(extent, blkno, numblks);

	bp = xfs_buf_get_map(target, &extent, 1, flags);
	return bp;
}

static inline struct xfs_buf *
xfs_buf_read(
	struct xfs_buftarg	*target,
	xfs_daddr_t		blkno,
	size_t			numblks,
220 221
	xfs_buf_flags_t		flags,
	xfs_buf_iodone_t	verify)
222 223
{
	DEFINE_SINGLE_BUF_MAP(map, blkno, numblks);
224
	return xfs_buf_read_map(target, &map, 1, flags, verify);
225 226 227 228 229 230
}

static inline void
xfs_buf_readahead(
	struct xfs_buftarg	*target,
	xfs_daddr_t		blkno,
231 232
	size_t			numblks,
	xfs_buf_iodone_t	verify)
233 234
{
	DEFINE_SINGLE_BUF_MAP(map, blkno, numblks);
235
	return xfs_buf_readahead_map(target, &map, 1, verify);
236
}
237 238 239 240 241 242 243 244

struct xfs_buf *xfs_buf_get_empty(struct xfs_buftarg *target, size_t numblks);
void xfs_buf_set_empty(struct xfs_buf *bp, size_t numblks);
int xfs_buf_associate_memory(struct xfs_buf *bp, void *mem, size_t length);

struct xfs_buf *xfs_buf_get_uncached(struct xfs_buftarg *target, size_t numblks,
				int flags);
struct xfs_buf *xfs_buf_read_uncached(struct xfs_buftarg *target,
245 246
				xfs_daddr_t daddr, size_t numblks, int flags,
				xfs_buf_iodone_t verify);
247
void xfs_buf_hold(struct xfs_buf *bp);
L
Linus Torvalds 已提交
248 249

/* Releasing Buffers */
250 251
extern void xfs_buf_free(xfs_buf_t *);
extern void xfs_buf_rele(xfs_buf_t *);
L
Linus Torvalds 已提交
252 253

/* Locking and Unlocking Buffers */
254
extern int xfs_buf_trylock(xfs_buf_t *);
255 256
extern void xfs_buf_lock(xfs_buf_t *);
extern void xfs_buf_unlock(xfs_buf_t *);
257 258
/*
 * Evaluates to non-zero when the buffer semaphore's count is <= 0.  Reads
 * b_sema.count directly without taking any lock, so the result is only a
 * snapshot.
 */
#define xfs_buf_islocked(bp) \
	((bp)->b_sema.count <= 0)
L
Linus Torvalds 已提交
259 260

/* Buffer Read and Write Routines */
261
extern int xfs_bwrite(struct xfs_buf *bp);
262 263 264

extern void xfsbdstrat(struct xfs_mount *, struct xfs_buf *);

265 266
extern void xfs_buf_ioend(xfs_buf_t *,	int);
extern void xfs_buf_ioerror(xfs_buf_t *, int);
267
extern void xfs_buf_ioerror_alert(struct xfs_buf *, const char *func);
268
extern void xfs_buf_iorequest(xfs_buf_t *);
269
extern int xfs_buf_iowait(xfs_buf_t *);
270
extern void xfs_buf_iomove(xfs_buf_t *, size_t, size_t, void *,
271
				xfs_buf_rw_t);
C
Christoph Hellwig 已提交
272 273
/*
 * Zero the (off, len) range of a buffer: xfs_buf_iomove() with a NULL data
 * pointer and the XBRW_ZERO operation.
 */
#define xfs_buf_zero(bp, off, len) \
	    xfs_buf_iomove((bp), (off), (len), NULL, XBRW_ZERO)
274 275

/*
 * Return the error recorded on @bp (b_error), or ENOMEM when @bp is NULL.
 * The NULL case yields the positive ENOMEM value.
 */
static inline int xfs_buf_geterror(xfs_buf_t *bp)
{
	return bp ? bp->b_error : ENOMEM;
}

/* Buffer Utility Routines */
281
extern xfs_caddr_t xfs_buf_offset(xfs_buf_t *, size_t);
L
Linus Torvalds 已提交
282 283

/* Delayed Write Buffer Routines */
284 285 286
extern bool xfs_buf_delwri_queue(struct xfs_buf *, struct list_head *);
extern int xfs_buf_delwri_submit(struct list_head *);
extern int xfs_buf_delwri_submit_nowait(struct list_head *);
L
Linus Torvalds 已提交
287 288

/* Buffer Daemon Setup Routines */
289 290
extern int xfs_buf_init(void);
extern void xfs_buf_terminate(void);
L
Linus Torvalds 已提交
291

292
/*
 * Clear the direction (READ/WRITE), ASYNC and I/O hint (SYNCIO/FUA/FLUSH)
 * bits in (bp)->b_flags; all other bits are left untouched.
 */
#define XFS_BUF_ZEROFLAGS(bp) \
	((bp)->b_flags &= ~(XBF_READ|XBF_WRITE|XBF_ASYNC| \
			    XBF_SYNCIO|XBF_FUA|XBF_FLUSH))
295

296
void xfs_buf_stale(struct xfs_buf *bp);
297 298
/*
 * Clear / test XBF_STALE in (bp)->b_flags.  There is no set macro here;
 * xfs_buf_stale() is declared as a function instead.  ISSTALE yields the
 * masked bit (non-zero when set, not necessarily 1).
 */
#define XFS_BUF_UNSTALE(bp)	((bp)->b_flags &= ~XBF_STALE)
#define XFS_BUF_ISSTALE(bp)	((bp)->b_flags & XBF_STALE)
L
Linus Torvalds 已提交
299

300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315
/*
 * Set / clear / test helpers for individual b_flags bits.  For each flag X:
 *   XFS_BUF_X(bp)    sets the bit,
 *   XFS_BUF_UNX(bp)  clears it,
 *   XFS_BUF_ISX(bp)  yields the masked bit (non-zero when set, not
 *                    necessarily 1).
 * The set and clear forms are plain read-modify-write expressions on
 * (bp)->b_flags; they perform no locking of their own.
 */
#define XFS_BUF_DONE(bp)	((bp)->b_flags |= XBF_DONE)
#define XFS_BUF_UNDONE(bp)	((bp)->b_flags &= ~XBF_DONE)
#define XFS_BUF_ISDONE(bp)	((bp)->b_flags & XBF_DONE)

#define XFS_BUF_ASYNC(bp)	((bp)->b_flags |= XBF_ASYNC)
#define XFS_BUF_UNASYNC(bp)	((bp)->b_flags &= ~XBF_ASYNC)
#define XFS_BUF_ISASYNC(bp)	((bp)->b_flags & XBF_ASYNC)

#define XFS_BUF_READ(bp)	((bp)->b_flags |= XBF_READ)
#define XFS_BUF_UNREAD(bp)	((bp)->b_flags &= ~XBF_READ)
#define XFS_BUF_ISREAD(bp)	((bp)->b_flags & XBF_READ)

#define XFS_BUF_WRITE(bp)	((bp)->b_flags |= XBF_WRITE)
#define XFS_BUF_UNWRITE(bp)	((bp)->b_flags &= ~XBF_WRITE)
#define XFS_BUF_ISWRITE(bp)	((bp)->b_flags & XBF_WRITE)

316 317 318 319 320 321 322 323 324 325 326 327
/*
 * These macros use the IO block map rather than b_bn. b_bn is now really
 * just for the buffer cache index for cached buffers. As IO does not use b_bn
 * anymore, uncached buffers do not use b_bn at all and hence must modify the IO
 * map directly. Uncached buffers are not allowed to be discontiguous, so this
 * is safe to do.
 *
 * In future, uncached buffers will pass the block number directly to the io
 * request function and hence these macros will go away at that point.
 */
/* Read the block number from the inline map (b_map.bm_bn), not from b_bn. */
#define XFS_BUF_ADDR(bp)		((bp)->b_map.bm_bn)
/* Store @bno, converted to xfs_daddr_t, into the inline map's bm_bn. */
#define XFS_BUF_SET_ADDR(bp, bno)	((bp)->b_map.bm_bn = (xfs_daddr_t)(bno))
328

329
static inline void xfs_buf_set_ref(struct xfs_buf *bp, int lru_ref)
330 331 332
{
	atomic_set(&bp->b_lru_ref, lru_ref);
}
333

334 335 336 337
/*
 * Report the buffer's current pin count (b_pin_count).  The value is an
 * atomic snapshot; non-zero means at least one pin is outstanding.
 */
static inline int xfs_buf_ispinned(struct xfs_buf *bp)
{
	int	pins = atomic_read(&bp->b_pin_count);

	return pins;
}
338 339

/*
 * Unlock the buffer and then release it, in that order.  Combines
 * xfs_buf_unlock() and xfs_buf_rele().
 */
static inline void xfs_buf_relse(xfs_buf_t *bp)
{
	xfs_buf_unlock(bp);
	xfs_buf_rele(bp);
}

/*
 *	Handling of buftargs.
 */
348 349
extern xfs_buftarg_t *xfs_alloc_buftarg(struct xfs_mount *,
			struct block_device *, int, const char *);
350
extern void xfs_free_buftarg(struct xfs_mount *, struct xfs_buftarg *);
L
Linus Torvalds 已提交
351 352
extern void xfs_wait_buftarg(xfs_buftarg_t *);
extern int xfs_setsize_buftarg(xfs_buftarg_t *, unsigned int, unsigned int);
353

354 355 356
/*
 * Thin wrappers that hand the target's block device (bt_bdev) to
 * block_size() and bdev_read_only() respectively.
 */
#define xfs_getsize_buftarg(buftarg)	block_size((buftarg)->bt_bdev)
#define xfs_readonly_buftarg(buftarg)	bdev_read_only((buftarg)->bt_bdev)

L
Linus Torvalds 已提交
357
#endif	/* __XFS_BUF_H__ */