// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 */
#ifndef	__XFS_INODE_H__
#define	__XFS_INODE_H__

#include "xfs_inode_buf.h"
#include "xfs_inode_fork.h"

/*
 * Kernel only inode definitions
 */

/* Forward declarations of structure tags. */
struct xfs_dinode;
struct xfs_inode;
struct xfs_buf;
struct xfs_bmbt_irec;
struct xfs_inode_log_item;
struct xfs_mount;
struct xfs_trans;
struct xfs_dquot;

L
Linus Torvalds 已提交
24 25 26 27 28
typedef struct xfs_inode {
	/* Inode linking and identification information. */
	struct xfs_mount	*i_mount;	/* fs mount struct ptr */
	struct xfs_dquot	*i_udquot;	/* user dquot */
	struct xfs_dquot	*i_gdquot;	/* group dquot */
29
	struct xfs_dquot	*i_pdquot;	/* project dquot */
L
Linus Torvalds 已提交
30 31 32

	/* Inode location stuff */
	xfs_ino_t		i_ino;		/* inode number (agno/agino)*/
33
	struct xfs_imap		i_imap;		/* location for xfs_imap() */
L
Linus Torvalds 已提交
34 35

	/* Extent information. */
36 37 38
	struct xfs_ifork	*i_afp;		/* attribute fork pointer */
	struct xfs_ifork	*i_cowfp;	/* copy on write extents */
	struct xfs_ifork	i_df;		/* data fork */
L
Linus Torvalds 已提交
39 40 41 42

	/* Transaction and locking information. */
	struct xfs_inode_log_item *i_itemp;	/* logging information */
	mrlock_t		i_lock;		/* inode lock */
D
Dave Chinner 已提交
43
	mrlock_t		i_mmaplock;	/* inode mmap IO lock */
L
Linus Torvalds 已提交
44
	atomic_t		i_pincount;	/* inode pin count */
45 46 47 48 49 50 51 52

	/*
	 * Bitsets of inode metadata that have been checked and/or are sick.
	 * Callers must hold i_flags_lock before accessing this field.
	 */
	uint16_t		i_checked;
	uint16_t		i_sick;

53
	spinlock_t		i_flags_lock;	/* inode i_flags lock */
L
Linus Torvalds 已提交
54
	/* Miscellaneous state. */
55
	unsigned long		i_flags;	/* see defined flags below */
56
	uint64_t		i_delayed_blks;	/* count of delay alloc blks */
L
Linus Torvalds 已提交
57

58
	struct xfs_icdinode	i_d;		/* most of ondisk inode */
L
Linus Torvalds 已提交
59

60 61
	/* VFS inode */
	struct inode		i_vnode;	/* embedded VFS inode */
62 63 64 65 66

	/* pending io completions */
	spinlock_t		i_ioend_lock;
	struct work_struct	i_ioend_work;
	struct list_head	i_ioend_list;
L
Linus Torvalds 已提交
67 68
} xfs_inode_t;

69 70 71
/* Convert from vfs inode to xfs inode */
static inline struct xfs_inode *XFS_I(struct inode *inode)
{
72
	return container_of(inode, struct xfs_inode, i_vnode);
73 74 75 76 77
}

/* convert from xfs inode to vfs inode */
static inline struct inode *VFS_I(struct xfs_inode *ip)
{
78
	return &ip->i_vnode;
79 80
}

81 82 83 84 85 86 87
/*
 * For regular files we only update the on-disk filesize when actually
 * writing data back to disk.  Until then only the copy in the VFS inode
 * is uptodate.
 */
static inline xfs_fsize_t XFS_ISIZE(struct xfs_inode *ip)
{
D
Dave Chinner 已提交
88
	if (S_ISREG(VFS_I(ip)->i_mode))
89 90 91 92
		return i_size_read(VFS_I(ip));
	return ip->i_d.di_size;
}

93 94 95 96 97 98 99 100 101
/*
 * If this I/O goes past the on-disk inode size update it unless it would
 * be past the current in-core inode size.
 */
static inline xfs_fsize_t
xfs_new_eof(struct xfs_inode *ip, xfs_fsize_t new_size)
{
	xfs_fsize_t i_size = i_size_read(VFS_I(ip));

102
	if (new_size > i_size || new_size < 0)
103 104 105 106
		new_size = i_size;
	return new_size > ip->i_d.di_size ? new_size : 0;
}

/*
 * i_flags helper functions
 *
 * The flags argument is an unsigned long so that it matches the width of
 * ip->i_flags and no flag bit can be silently truncated on the way in.
 * The double-underscore variants do not take i_flags_lock themselves; the
 * other helpers take and release it around the access.
 *
 * The test helpers return the masked bits narrowed to int, so flag bits
 * that do not fit in an int would not be reported through the return value.
 */

/* Set @flags in ip->i_flags without taking i_flags_lock. */
static inline void
__xfs_iflags_set(xfs_inode_t *ip, unsigned long flags)
{
	ip->i_flags |= flags;
}

/* Set @flags in ip->i_flags under i_flags_lock. */
static inline void
xfs_iflags_set(xfs_inode_t *ip, unsigned long flags)
{
	spin_lock(&ip->i_flags_lock);
	__xfs_iflags_set(ip, flags);
	spin_unlock(&ip->i_flags_lock);
}

/* Clear @flags in ip->i_flags under i_flags_lock. */
static inline void
xfs_iflags_clear(xfs_inode_t *ip, unsigned long flags)
{
	spin_lock(&ip->i_flags_lock);
	ip->i_flags &= ~flags;
	spin_unlock(&ip->i_flags_lock);
}

/* Return the bits of @flags that are set, without taking i_flags_lock. */
static inline int
__xfs_iflags_test(xfs_inode_t *ip, unsigned long flags)
{
	return (ip->i_flags & flags);
}

/* Return the bits of @flags that are set, sampled under i_flags_lock. */
static inline int
xfs_iflags_test(xfs_inode_t *ip, unsigned long flags)
{
	int ret;

	spin_lock(&ip->i_flags_lock);
	ret = __xfs_iflags_test(ip, flags);
	spin_unlock(&ip->i_flags_lock);
	return ret;
}

/*
 * Under i_flags_lock, return the bits of @flags that were set and clear
 * them if any were.
 */
static inline int
xfs_iflags_test_and_clear(xfs_inode_t *ip, unsigned long flags)
{
	int ret;

	spin_lock(&ip->i_flags_lock);
	ret = ip->i_flags & flags;
	if (ret)
		ip->i_flags &= ~flags;
	spin_unlock(&ip->i_flags_lock);
	return ret;
}

/*
 * Under i_flags_lock, return the bits of @flags that were already set; if
 * none were, set all of @flags.
 */
static inline int
xfs_iflags_test_and_set(xfs_inode_t *ip, unsigned long flags)
{
	int ret;

	spin_lock(&ip->i_flags_lock);
	ret = ip->i_flags & flags;
	if (!ret)
		ip->i_flags |= flags;
	spin_unlock(&ip->i_flags_lock);
	return ret;
}

174 175 176 177
static inline prid_t
xfs_get_initial_prid(struct xfs_inode *dp)
{
	if (dp->i_d.di_flags & XFS_DIFLAG_PROJINHERIT)
178
		return dp->i_d.di_projid;
179 180 181 182

	return XFS_PROJID_DEFAULT;
}

183 184 185 186 187
static inline bool xfs_is_reflink_inode(struct xfs_inode *ip)
{
	return ip->i_d.di_flags2 & XFS_DIFLAG2_REFLINK;
}

188 189 190 191 192 193 194 195 196
/*
 * Check if an inode has any data in the COW fork.  This might be often false
 * even for inodes with the reflink flag when there is no pending COW operation.
 */
static inline bool xfs_inode_has_cow_data(struct xfs_inode *ip)
{
	return ip->i_cowfp && ip->i_cowfp->if_bytes;
}

/*
 * Return the buftarg used for data allocations on a given inode:
 * m_rtdev_targp of the inode's mount when XFS_IS_REALTIME_INODE(ip) is
 * true, m_ddev_targp otherwise.
 *
 * This is a macro, so @ip appears more than once in the expansion; pass an
 * expression without side effects.
 */
#define xfs_inode_buftarg(ip) \
	(XFS_IS_REALTIME_INODE(ip) ? \
		(ip)->i_mount->m_rtdev_targp : (ip)->i_mount->m_ddev_targp)

/*
 * In-core inode flags.
 *
 * Flags that also have a __XFS_*_BIT definition expose their bit number so
 * it can be passed to bit-granular interfaces such as wake_up_bit().
 */
#define XFS_IRECLAIM		(1 << 0) /* started reclaiming this inode */
#define XFS_ISTALE		(1 << 1) /* inode has been staled */
#define XFS_IRECLAIMABLE	(1 << 2) /* inode can be reclaimed */
#define __XFS_INEW_BIT		3	 /* inode has just been allocated */
#define XFS_INEW		(1 << __XFS_INEW_BIT)
#define XFS_ITRUNCATED		(1 << 5) /* truncated down so flush-on-close */
#define XFS_IDIRTY_RELEASE	(1 << 6) /* dirty release already seen */
#define __XFS_IFLOCK_BIT	7	 /* inode is being flushed right now */
#define XFS_IFLOCK		(1 << __XFS_IFLOCK_BIT)
#define __XFS_IPINNED_BIT	8	 /* wakeup key for zero pin count */
#define XFS_IPINNED		(1 << __XFS_IPINNED_BIT)
#define XFS_IEOFBLOCKS		(1 << 9) /* has the preallocblocks tag set */
/*
 * If this unlinked inode is in the middle of recovery, don't let drop_inode
 * truncate and free the inode.  This can happen if we iget the inode during
 * log recovery to replay a bmap operation on the inode.
 */
#define XFS_IRECOVERY		(1 << 11)
#define XFS_ICOWBLOCKS		(1 << 12)/* has the cowblocks tag set */

/*
 * Per-lifetime flags need to be reset when re-using a reclaimable inode during
 * inode lookup. This prevents unintended behaviour on the new inode from
 * occurring.
 */
#define XFS_IRECLAIM_RESET_FLAGS	\
	(XFS_IRECLAIMABLE | XFS_IRECLAIM | \
	 XFS_IDIRTY_RELEASE | XFS_ITRUNCATED)

236 237 238 239
/*
 * Synchronize processes attempting to flush the in-core inode back to disk.
 */

240 241 242 243 244
static inline int xfs_isiflocked(struct xfs_inode *ip)
{
	return xfs_iflags_test(ip, XFS_IFLOCK);
}

245 246 247 248 249 250 251 252 253 254 255 256 257 258 259
extern void __xfs_iflock(struct xfs_inode *ip);

/*
 * Try to set XFS_IFLOCK without waiting.  Returns nonzero if this call set
 * the flag, zero if it was already set.
 */
static inline int xfs_iflock_nowait(struct xfs_inode *ip)
{
	int	already_set = xfs_iflags_test_and_set(ip, XFS_IFLOCK);

	return !already_set;
}

/*
 * Take XFS_IFLOCK: try the non-waiting path first and fall back to
 * __xfs_iflock() only when the flag was already set.
 */
static inline void xfs_iflock(struct xfs_inode *ip)
{
	if (xfs_iflock_nowait(ip))
		return;

	__xfs_iflock(ip);
}

static inline void xfs_ifunlock(struct xfs_inode *ip)
{
260
	ASSERT(xfs_isiflocked(ip));
261
	xfs_iflags_clear(ip, XFS_IFLOCK);
262
	smp_mb();
263 264 265
	wake_up_bit(&ip->i_flags, __XFS_IFLOCK_BIT);
}

/*
 * Flags for inode locking.
 * Bit ranges:	1<<0  - 1<<16-1 -- iolock/mmaplock/ilock modes (bitfield)
 *		1<<16 - 1<<32-1 -- lockdep annotation (integers)
 */
#define	XFS_IOLOCK_EXCL		(1<<0)
#define	XFS_IOLOCK_SHARED	(1<<1)
#define	XFS_ILOCK_EXCL		(1<<2)
#define	XFS_ILOCK_SHARED	(1<<3)
#define	XFS_MMAPLOCK_EXCL	(1<<4)
#define	XFS_MMAPLOCK_SHARED	(1<<5)

/* Union of every lock mode bit defined above. */
#define XFS_LOCK_MASK		(XFS_IOLOCK_EXCL | XFS_IOLOCK_SHARED \
				| XFS_ILOCK_EXCL | XFS_ILOCK_SHARED \
				| XFS_MMAPLOCK_EXCL | XFS_MMAPLOCK_SHARED)

/* Value/name pairs for each lock mode flag, as a brace-initializer list. */
#define XFS_LOCK_FLAGS \
	{ XFS_IOLOCK_EXCL,	"IOLOCK_EXCL" }, \
	{ XFS_IOLOCK_SHARED,	"IOLOCK_SHARED" }, \
	{ XFS_ILOCK_EXCL,	"ILOCK_EXCL" }, \
	{ XFS_ILOCK_SHARED,	"ILOCK_SHARED" }, \
	{ XFS_MMAPLOCK_EXCL,	"MMAPLOCK_EXCL" }, \
	{ XFS_MMAPLOCK_SHARED,	"MMAPLOCK_SHARED" }


/*
 * Flags for lockdep annotations.
 *
 * XFS_LOCK_PARENT - for directory operations that require locking a
 * parent directory inode and a child entry inode. IOLOCK requires nesting,
 * MMAPLOCK does not support this class, ILOCK requires a single subclass
 * to differentiate parent from child.
 *
 * XFS_LOCK_RTBITMAP/XFS_LOCK_RTSUM - the realtime device bitmap and summary
 * inodes do not participate in the normal lock order, and thus have their
 * own subclasses.
 *
 * XFS_LOCK_INUMORDER - for locking several inodes at the same time
 * with xfs_lock_inodes().  This flag is used as the starting subclass
 * and each subsequent lock acquired will increment the subclass by one.
 * However, MAX_LOCKDEP_SUBCLASSES == 8, which means we are greatly
 * limited to the subclasses we can represent via nesting. We need at least
 * 5 inodes nest depth for the ILOCK through rename, and we also have to support
 * XFS_ILOCK_PARENT, which gives 6 subclasses. Then we have XFS_ILOCK_RTBITMAP
 * and XFS_ILOCK_RTSUM, which are another 2 unique subclasses, so that's all
 * 8 subclasses supported by lockdep.
 *
 * This also means we have to number the sub-classes in the lowest bits of
 * the mask we keep, and we have to ensure we never exceed 3 bits of lockdep
 * mask and we can't use bit-masking to build the subclasses. What a mess.
 *
 * Bit layout:
 *
 * Bit		Lock Region
 * 16-19	XFS_IOLOCK_SHIFT dependencies
 * 20-23	XFS_MMAPLOCK_SHIFT dependencies
 * 24-31	XFS_ILOCK_SHIFT dependencies
 *
 * IOLOCK values
 *
 * 0-3		subclass value
 * 4-7		unused
 *
 * MMAPLOCK values
 *
 * 0-3		subclass value
 * 4-7		unused
 *
 * ILOCK values
 * 0-4		subclass values
 * 5		PARENT subclass (not nestable)
 * 6		RTBITMAP subclass (not nestable)
 * 7		RTSUM subclass (not nestable)
 *
 */
#define XFS_IOLOCK_SHIFT		16
#define XFS_IOLOCK_MAX_SUBCLASS		3
#define XFS_IOLOCK_DEP_MASK		0x000f0000

#define XFS_MMAPLOCK_SHIFT		20
#define XFS_MMAPLOCK_NUMORDER		0
#define XFS_MMAPLOCK_MAX_SUBCLASS	3
#define XFS_MMAPLOCK_DEP_MASK		0x00f00000

#define XFS_ILOCK_SHIFT			24
#define XFS_ILOCK_PARENT_VAL		5
#define XFS_ILOCK_MAX_SUBCLASS		(XFS_ILOCK_PARENT_VAL - 1)
#define XFS_ILOCK_RTBITMAP_VAL		6
#define XFS_ILOCK_RTSUM_VAL		7
#define XFS_ILOCK_DEP_MASK		0xff000000
#define	XFS_ILOCK_PARENT		(XFS_ILOCK_PARENT_VAL << XFS_ILOCK_SHIFT)
#define	XFS_ILOCK_RTBITMAP		(XFS_ILOCK_RTBITMAP_VAL << XFS_ILOCK_SHIFT)
#define	XFS_ILOCK_RTSUM			(XFS_ILOCK_RTSUM_VAL << XFS_ILOCK_SHIFT)

/* Every bit that carries a lockdep subclass for any of the three locks. */
#define XFS_LOCK_SUBCLASS_MASK	(XFS_IOLOCK_DEP_MASK | \
				 XFS_MMAPLOCK_DEP_MASK | \
				 XFS_ILOCK_DEP_MASK)

/* Extract the per-lock subclass value from a lock flags word. */
#define XFS_IOLOCK_DEP(flags)	(((flags) & XFS_IOLOCK_DEP_MASK) \
					>> XFS_IOLOCK_SHIFT)
#define XFS_MMAPLOCK_DEP(flags)	(((flags) & XFS_MMAPLOCK_DEP_MASK) \
					>> XFS_MMAPLOCK_SHIFT)
#define XFS_ILOCK_DEP(flags)	(((flags) & XFS_ILOCK_DEP_MASK) \
					>> XFS_ILOCK_SHIFT)

/*
 * Layouts are broken in the BREAK_WRITE case to ensure that
 * layout-holders do not collide with local writes. Additionally,
 * layouts are broken in the BREAK_UNMAP case to make sure the
 * layout-holder has a consistent view of the file's extent map. While
 * BREAK_WRITE breaks can be satisfied by recalling FL_LAYOUT leases,
 * BREAK_UNMAP breaks additionally require waiting for busy dax-pages to
 * go idle.
 */
enum layout_break_reason {
	BREAK_WRITE,
	BREAK_UNMAP,
};

/*
 * For multiple groups support: if S_ISGID bit is set in the parent
 * directory, group of new file is set to that of the parent, and
 * new subdirectory gets S_ISGID bit from parent.
 *
 * Also true when the mount has XFS_MOUNT_GRPID set in m_flags.  @pip
 * appears twice in the expansion, so pass an expression without side
 * effects.
 */
#define XFS_INHERIT_GID(pip)	\
	(((pip)->i_mount->m_flags & XFS_MOUNT_GRPID) || \
	 (VFS_I(pip)->i_mode & S_ISGID))

D
Dave Chinner 已提交
394
int		xfs_release(struct xfs_inode *ip);
395
void		xfs_inactive(struct xfs_inode *ip);
D
Dave Chinner 已提交
396 397 398
int		xfs_lookup(struct xfs_inode *dp, struct xfs_name *name,
			   struct xfs_inode **ipp, struct xfs_name *ci_name);
int		xfs_create(struct xfs_inode *dp, struct xfs_name *name,
C
Christoph Hellwig 已提交
399
			   umode_t mode, dev_t rdev, struct xfs_inode **ipp);
400 401
int		xfs_create_tmpfile(struct xfs_inode *dp, umode_t mode,
			   struct xfs_inode **ipp);
D
Dave Chinner 已提交
402 403 404 405 406 407 408
int		xfs_remove(struct xfs_inode *dp, struct xfs_name *name,
			   struct xfs_inode *ip);
int		xfs_link(struct xfs_inode *tdp, struct xfs_inode *sip,
			 struct xfs_name *target_name);
int		xfs_rename(struct xfs_inode *src_dp, struct xfs_name *src_name,
			   struct xfs_inode *src_ip, struct xfs_inode *target_dp,
			   struct xfs_name *target_name,
409
			   struct xfs_inode *target_ip, unsigned int flags);
D
Dave Chinner 已提交
410

/* Inode lock primitives; the uint argument takes the lock flag bits. */
void		xfs_ilock(xfs_inode_t *ip, uint lock_flags);
int		xfs_ilock_nowait(xfs_inode_t *ip, uint lock_flags);
void		xfs_iunlock(xfs_inode_t *ip, uint lock_flags);
void		xfs_ilock_demote(xfs_inode_t *ip, uint lock_flags);
int		xfs_isilocked(xfs_inode_t *ip, uint lock_flags);
uint		xfs_ilock_data_map_shared(struct xfs_inode *ip);
uint		xfs_ilock_attr_map_shared(struct xfs_inode *ip);

L
Linus Torvalds 已提交
419
uint		xfs_ip2xflags(struct xfs_inode *);
420
int		xfs_ifree(struct xfs_trans *, struct xfs_inode *);
B
Brian Foster 已提交
421 422
int		xfs_itruncate_extents_flags(struct xfs_trans **,
				struct xfs_inode *, int, xfs_fsize_t, int);
L
Linus Torvalds 已提交
423
void		xfs_iext_realloc(xfs_inode_t *, int, int);
424

425
int		xfs_log_force_inode(struct xfs_inode *ip);
426
void		xfs_iunpin_wait(xfs_inode_t *);
427 428
#define xfs_ipincount(ip)	((unsigned int) atomic_read(&ip->i_pincount))

429
int		xfs_iflush(struct xfs_inode *, struct xfs_buf **);
430 431
void		xfs_lock_two_inodes(struct xfs_inode *ip0, uint ip0_mode,
				struct xfs_inode *ip1, uint ip1_mode);
L
Linus Torvalds 已提交
432

433
xfs_extlen_t	xfs_get_extsz_hint(struct xfs_inode *ip);
434
xfs_extlen_t	xfs_get_cowextsz_hint(struct xfs_inode *ip);
435

D
Dave Chinner 已提交
436
int		xfs_dir_ialloc(struct xfs_trans **, struct xfs_inode *, umode_t,
437
			       xfs_nlink_t, dev_t, prid_t,
438
			       struct xfs_inode **);
D
Dave Chinner 已提交
439

440 441 442 443 444 445 446
static inline int
xfs_itruncate_extents(
	struct xfs_trans	**tpp,
	struct xfs_inode	*ip,
	int			whichfork,
	xfs_fsize_t		new_size)
{
B
Brian Foster 已提交
447
	return xfs_itruncate_extents_flags(tpp, ip, whichfork, new_size, 0);
448 449
}

/* from xfs_file.c */

/* Bit flags accepted by xfs_update_prealloc_flags(); bit 0 is not used. */
enum xfs_prealloc_flags {
	XFS_PREALLOC_SET	= (1 << 1),
	XFS_PREALLOC_CLEAR	= (1 << 2),
	XFS_PREALLOC_SYNC	= (1 << 3),
	XFS_PREALLOC_INVISIBLE	= (1 << 4),
};

458 459
int	xfs_update_prealloc_flags(struct xfs_inode *ip,
				  enum xfs_prealloc_flags flags);
460 461
int	xfs_break_layouts(struct inode *inode, uint *iolock,
		enum layout_break_reason reason);
D
Dave Chinner 已提交
462

463
/* from xfs_iops.c */
464 465
extern void xfs_setup_inode(struct xfs_inode *ip);
extern void xfs_setup_iops(struct xfs_inode *ip);
466
extern void xfs_diflags_to_iflags(struct xfs_inode *ip, bool init);
467

468 469 470 471 472 473 474 475 476 477 478 479
/*
 * When setting up a newly allocated inode, we need to call
 * xfs_finish_inode_setup() once the inode is fully instantiated at
 * the VFS level to prevent the rest of the world seeing the inode
 * before we've completed instantiation. Otherwise we can do it
 * the moment the inode lookup is complete.
 */
static inline void xfs_finish_inode_setup(struct xfs_inode *ip)
{
	xfs_iflags_clear(ip, XFS_INEW);
	barrier();
	unlock_new_inode(VFS_I(ip));
480
	wake_up_bit(&ip->i_flags, __XFS_INEW_BIT);
481 482 483 484 485
}

/*
 * Run the full setup sequence on an inode in one call: xfs_setup_inode(),
 * xfs_setup_iops(), then xfs_finish_inode_setup().
 */
static inline void xfs_setup_existing_inode(struct xfs_inode *ip)
{
	xfs_setup_inode(ip);
	xfs_setup_iops(ip);
	xfs_finish_inode_setup(ip);
}

void xfs_irele(struct xfs_inode *ip);

extern struct kmem_zone	*xfs_inode_zone;

/* The default CoW extent size hint. */
#define XFS_DEFAULT_COWEXTSZ_HINT 32

int xfs_iunlink_init(struct xfs_perag *pag);
void xfs_iunlink_destroy(struct xfs_perag *pag);

void xfs_end_io(struct work_struct *work);

#endif	/* __XFS_INODE_H__ */