xfs_inode.h 14.9 KB
Newer Older
D
Dave Chinner 已提交
1
// SPDX-License-Identifier: GPL-2.0
L
Linus Torvalds 已提交
2
/*
3 4
 * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc.
 * All Rights Reserved.
L
Linus Torvalds 已提交
5 6 7 8
 */
#ifndef	__XFS_INODE_H__
#define	__XFS_INODE_H__

9
#include "xfs_inode_buf.h"
10
#include "xfs_inode_fork.h"
L
Linus Torvalds 已提交
11

12
/*
13
 * Kernel only inode definitions
14
 */
15 16
struct xfs_dinode;
struct xfs_inode;
17 18 19 20 21 22 23
struct xfs_buf;
struct xfs_bmbt_irec;
struct xfs_inode_log_item;
struct xfs_mount;
struct xfs_trans;
struct xfs_dquot;

L
Linus Torvalds 已提交
24 25 26 27 28
typedef struct xfs_inode {
	/* Inode linking and identification information. */
	struct xfs_mount	*i_mount;	/* fs mount struct ptr */
	struct xfs_dquot	*i_udquot;	/* user dquot */
	struct xfs_dquot	*i_gdquot;	/* group dquot */
29
	struct xfs_dquot	*i_pdquot;	/* project dquot */
L
Linus Torvalds 已提交
30 31 32

	/* Inode location stuff */
	xfs_ino_t		i_ino;		/* inode number (agno/agino)*/
33
	struct xfs_imap		i_imap;		/* location for xfs_imap() */
L
Linus Torvalds 已提交
34 35

	/* Extent information. */
36 37 38
	struct xfs_ifork	*i_afp;		/* attribute fork pointer */
	struct xfs_ifork	*i_cowfp;	/* copy on write extents */
	struct xfs_ifork	i_df;		/* data fork */
L
Linus Torvalds 已提交
39 40 41 42

	/* Transaction and locking information. */
	struct xfs_inode_log_item *i_itemp;	/* logging information */
	mrlock_t		i_lock;		/* inode lock */
D
Dave Chinner 已提交
43
	mrlock_t		i_mmaplock;	/* inode mmap IO lock */
L
Linus Torvalds 已提交
44
	atomic_t		i_pincount;	/* inode pin count */
45 46 47 48 49 50 51 52

	/*
	 * Bitsets of inode metadata that have been checked and/or are sick.
	 * Callers must hold i_flags_lock before accessing this field.
	 */
	uint16_t		i_checked;
	uint16_t		i_sick;

53
	spinlock_t		i_flags_lock;	/* inode i_flags lock */
L
Linus Torvalds 已提交
54
	/* Miscellaneous state. */
55
	unsigned long		i_flags;	/* see defined flags below */
56
	uint64_t		i_delayed_blks;	/* count of delay alloc blks */
57
	xfs_fsize_t		i_disk_size;	/* number of bytes in file */
58
	prid_t			i_projid;	/* owner's project id */
L
Linus Torvalds 已提交
59

60
	struct xfs_icdinode	i_d;		/* most of ondisk inode */
L
Linus Torvalds 已提交
61

62 63
	/* VFS inode */
	struct inode		i_vnode;	/* embedded VFS inode */
64 65 66 67 68

	/* pending io completions */
	spinlock_t		i_ioend_lock;
	struct work_struct	i_ioend_work;
	struct list_head	i_ioend_list;
L
Linus Torvalds 已提交
69 70
} xfs_inode_t;

71 72 73
/* Convert from vfs inode to xfs inode */
static inline struct xfs_inode *XFS_I(struct inode *inode)
{
74
	return container_of(inode, struct xfs_inode, i_vnode);
75 76 77 78 79
}

/* convert from xfs inode to vfs inode */
static inline struct inode *VFS_I(struct xfs_inode *ip)
{
80
	return &ip->i_vnode;
81 82
}

83 84 85 86 87 88 89
/*
 * For regular files we only update the on-disk filesize when actually
 * writing data back to disk.  Until then only the copy in the VFS inode
 * is uptodate.
 */
static inline xfs_fsize_t XFS_ISIZE(struct xfs_inode *ip)
{
D
Dave Chinner 已提交
90
	if (S_ISREG(VFS_I(ip)->i_mode))
91
		return i_size_read(VFS_I(ip));
92
	return ip->i_disk_size;
93 94
}

95 96 97 98 99 100 101 102 103
/*
 * If this I/O goes past the on-disk inode size update it unless it would
 * be past the current in-core inode size.
 *
 * @new_size is first clamped to the in-core (VFS) size when it exceeds that
 * size or is negative.  Returns the clamped size if it is larger than
 * ip->i_disk_size, otherwise 0.
 */
static inline xfs_fsize_t
xfs_new_eof(struct xfs_inode *ip, xfs_fsize_t new_size)
{
	xfs_fsize_t i_size = i_size_read(VFS_I(ip));

	if (new_size > i_size || new_size < 0)
		new_size = i_size;
	return new_size > ip->i_disk_size ? new_size : 0;
}

109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148
/*
 * i_flags helper functions
 */
/*
 * OR @flags into ip->i_flags.  No locking is done here; xfs_iflags_set()
 * is the variant that takes i_flags_lock around the update.
 */
static inline void
__xfs_iflags_set(xfs_inode_t *ip, unsigned short flags)
{
	ip->i_flags = ip->i_flags | flags;
}

/* Set @flags in ip->i_flags while holding i_flags_lock. */
static inline void
xfs_iflags_set(xfs_inode_t *ip, unsigned short flags)
{
	spinlock_t	*lock = &ip->i_flags_lock;

	spin_lock(lock);
	ip->i_flags |= flags;
	spin_unlock(lock);
}

/* Clear @flags from ip->i_flags while holding i_flags_lock. */
static inline void
xfs_iflags_clear(xfs_inode_t *ip, unsigned short flags)
{
	spinlock_t	*lock = &ip->i_flags_lock;

	spin_lock(lock);
	ip->i_flags = ip->i_flags & ~flags;
	spin_unlock(lock);
}

/*
 * Return the bits of @flags that are currently set in ip->i_flags (non-zero
 * if any is set).  No locking is done here; xfs_iflags_test() is the variant
 * that takes i_flags_lock.
 */
static inline int
__xfs_iflags_test(xfs_inode_t *ip, unsigned short flags)
{
	unsigned long	hits = ip->i_flags & flags;

	return hits;
}

/*
 * Sample ip->i_flags under i_flags_lock and return the bits of @flags that
 * are set (non-zero if any is set).
 */
static inline int
xfs_iflags_test(xfs_inode_t *ip, unsigned short flags)
{
	int	hits;

	spin_lock(&ip->i_flags_lock);
	hits = ip->i_flags & flags;
	spin_unlock(&ip->i_flags_lock);

	return hits;
}
149 150 151 152 153 154 155 156 157 158 159 160 161

/*
 * Under i_flags_lock, check whether any bit of @flags is set in ip->i_flags
 * and, if so, clear all of @flags.  Returns the bits that were set before the
 * clear (zero if none were).
 */
static inline int
xfs_iflags_test_and_clear(xfs_inode_t *ip, unsigned short flags)
{
	int	was_set;

	spin_lock(&ip->i_flags_lock);
	was_set = ip->i_flags & flags;
	if (was_set != 0)
		ip->i_flags = ip->i_flags & ~flags;
	spin_unlock(&ip->i_flags_lock);

	return was_set;
}
L
Linus Torvalds 已提交
162

163 164 165 166 167 168 169 170 171 172 173 174 175
/*
 * Under i_flags_lock, check whether any bit of @flags is set in ip->i_flags
 * and, only if none is, set all of @flags.  Returns the bits that were
 * already set (zero means this call set them).
 */
static inline int
xfs_iflags_test_and_set(xfs_inode_t *ip, unsigned short flags)
{
	int	already_set;

	spin_lock(&ip->i_flags_lock);
	already_set = ip->i_flags & flags;
	if (already_set == 0)
		ip->i_flags = ip->i_flags | flags;
	spin_unlock(&ip->i_flags_lock);

	return already_set;
}

176 177 178 179
static inline prid_t
xfs_get_initial_prid(struct xfs_inode *dp)
{
	if (dp->i_d.di_flags & XFS_DIFLAG_PROJINHERIT)
180
		return dp->i_projid;
181 182 183 184

	return XFS_PROJID_DEFAULT;
}

185 186 187 188 189
/* True when XFS_DIFLAG2_REFLINK is set in the inode's di_flags2. */
static inline bool xfs_is_reflink_inode(struct xfs_inode *ip)
{
	return (ip->i_d.di_flags2 & XFS_DIFLAG2_REFLINK) != 0;
}

190 191 192 193 194 195 196 197
static inline bool xfs_is_metadata_inode(struct xfs_inode *ip)
{
	struct xfs_mount	*mp = ip->i_mount;

	return ip == mp->m_rbmip || ip == mp->m_rsumip ||
		xfs_is_quota_inode(&mp->m_sb, ip->i_ino);
}

198 199 200 201 202 203 204 205 206
/*
 * Check if an inode has any data in the COW fork.  This might be often false
 * even for inodes with the reflink flag when there is no pending COW operation.
 */
static inline bool xfs_inode_has_cow_data(struct xfs_inode *ip)
{
	return ip->i_cowfp && ip->i_cowfp->if_bytes;
}

207 208 209 210 211
/* True when XFS_DIFLAG2_BIGTIME is set in the inode's di_flags2. */
static inline bool xfs_inode_has_bigtime(struct xfs_inode *ip)
{
	return (ip->i_d.di_flags2 & XFS_DIFLAG2_BIGTIME) != 0;
}

212 213 214 215 216 217 218
/*
 * Pick the buftarg used for data allocations on @ip: the mount's
 * m_rtdev_targp when XFS_IS_REALTIME_INODE() holds for the inode, its
 * m_ddev_targp otherwise.  Note that @ip is evaluated more than once.
 */
#define xfs_inode_buftarg(ip)				\
	(XFS_IS_REALTIME_INODE(ip)			\
		? (ip)->i_mount->m_rtdev_targp		\
		: (ip)->i_mount->m_ddev_targp)

L
Linus Torvalds 已提交
219 220 221
/*
 * In-core inode flags.
 *
 * These are bits in xfs_inode.i_flags.  XFS_INEW and XFS_IPINNED also export
 * their bit numbers (__XFS_*_BIT) for users that need a bit index rather than
 * a mask.  Bit 10 is not assigned here.
 */
#define XFS_IRECLAIM		(1 << 0) /* started reclaiming this inode */
#define XFS_ISTALE		(1 << 1) /* inode has been staled */
#define XFS_IRECLAIMABLE	(1 << 2) /* inode can be reclaimed */
#define __XFS_INEW_BIT		3	 /* inode has just been allocated */
#define XFS_INEW		(1 << __XFS_INEW_BIT)
#define XFS_IPRESERVE_DM_FIELDS	(1 << 4) /* has legacy DMAPI fields set */
#define XFS_ITRUNCATED		(1 << 5) /* truncated down so flush-on-close */
#define XFS_IDIRTY_RELEASE	(1 << 6) /* dirty release already seen */
#define XFS_IFLUSHING		(1 << 7) /* inode is being flushed */
#define __XFS_IPINNED_BIT	8	 /* wakeup key for zero pin count */
#define XFS_IPINNED		(1 << __XFS_IPINNED_BIT)
#define XFS_IEOFBLOCKS		(1 << 9) /* has the preallocblocks tag set */
/*
 * If this unlinked inode is in the middle of recovery, don't let drop_inode
 * truncate and free the inode.  This can happen if we iget the inode during
 * log recovery to replay a bmap operation on the inode.
 */
#define XFS_IRECOVERY		(1 << 11)
#define XFS_ICOWBLOCKS		(1 << 12)/* has the cowblocks tag set */
L
Linus Torvalds 已提交
241

242 243
/*
 * Per-lifetime flags need to be reset when re-using a reclaimable inode during
 * inode lookup. This prevents unintended behaviour on the new inode from
 * occurring.
 */
#define XFS_IRECLAIM_RESET_FLAGS	\
	(XFS_IRECLAIMABLE | XFS_IRECLAIM | \
	 XFS_IDIRTY_RELEASE | XFS_ITRUNCATED)
250

L
Linus Torvalds 已提交
251 252
/*
 * Flags for inode locking.
253 254
 * Bit ranges:	bits 0-15  -- iolock/ilock/mmaplock modes (bitfield)
 *		bits 16-31 -- lockdep annotation (integers)
L
Linus Torvalds 已提交
255
 */
256 257 258 259
/* Lock mode bits: one exclusive and one shared bit per lock type. */
#define	XFS_IOLOCK_EXCL		(1<<0)
#define	XFS_IOLOCK_SHARED	(1<<1)
#define	XFS_ILOCK_EXCL		(1<<2)
#define	XFS_ILOCK_SHARED	(1<<3)
#define	XFS_MMAPLOCK_EXCL	(1<<4)
#define	XFS_MMAPLOCK_SHARED	(1<<5)

/* Every lock mode bit defined above. */
#define XFS_LOCK_MASK		(XFS_IOLOCK_EXCL | XFS_IOLOCK_SHARED \
				| XFS_ILOCK_EXCL | XFS_ILOCK_SHARED \
				| XFS_MMAPLOCK_EXCL | XFS_MMAPLOCK_SHARED)

/*
 * { mask, name } initializer pairs for the lock mode bits, suitable for
 * building a flag-to-string table.
 */
#define XFS_LOCK_FLAGS \
	{ XFS_IOLOCK_EXCL,	"IOLOCK_EXCL" }, \
	{ XFS_IOLOCK_SHARED,	"IOLOCK_SHARED" }, \
	{ XFS_ILOCK_EXCL,	"ILOCK_EXCL" }, \
	{ XFS_ILOCK_SHARED,	"ILOCK_SHARED" }, \
	{ XFS_MMAPLOCK_EXCL,	"MMAPLOCK_EXCL" }, \
	{ XFS_MMAPLOCK_SHARED,	"MMAPLOCK_SHARED" }
C
Christoph Hellwig 已提交
274 275


276 277 278
/*
 * Flags for lockdep annotations.
 *
279
 * XFS_LOCK_PARENT - for directory operations that require locking a
280 281 282
 * parent directory inode and a child entry inode. IOLOCK requires nesting,
 * MMAPLOCK does not support this class, ILOCK requires a single subclass
 * to differentiate parent from child.
283 284 285 286
 *
 * XFS_LOCK_RTBITMAP/XFS_LOCK_RTSUM - the realtime device bitmap and summary
 * inodes do not participate in the normal lock order, and thus have their
 * own subclasses.
287
 *
288
 * XFS_LOCK_INUMORDER - for locking several inodes at the same time
289 290
 * with xfs_lock_inodes().  This flag is used as the starting subclass
 * and each subsequent lock acquired will increment the subclass by one.
291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311
 * However, MAX_LOCKDEP_SUBCLASSES == 8, which means we are greatly
 * limited to the subclasses we can represent via nesting. We need at least
 * 5 inodes nest depth for the ILOCK through rename, and we also have to support
 * XFS_ILOCK_PARENT, which gives 6 subclasses. Then we have XFS_ILOCK_RTBITMAP
 * and XFS_ILOCK_RTSUM, which are another 2 unique subclasses, so that's all
 * 8 subclasses supported by lockdep.
 *
 * This also means we have to number the sub-classes in the lowest bits of
 * the mask we keep, and we have to ensure we never exceed 3 bits of lockdep
 * mask and we can't use bit-masking to build the subclasses. What a mess.
 *
 * Bit layout:
 *
 * Bit		Lock Region
 * 16-19	XFS_IOLOCK_SHIFT dependencies
 * 20-23	XFS_MMAPLOCK_SHIFT dependencies
 * 24-31	XFS_ILOCK_SHIFT dependencies
 *
 * IOLOCK values
 *
 * 0-3		subclass value
312
 * 4-7		unused
313 314 315 316 317 318 319 320 321 322 323 324
 *
 * MMAPLOCK values
 *
 * 0-3		subclass value
 * 4-7		unused
 *
 * ILOCK values
 * 0-4		subclass values
 * 5		PARENT subclass (not nestable)
 * 6		RTBITMAP subclass (not nestable)
 * 7		RTSUM subclass (not nestable)
 * 
325
 */
326
/* IOLOCK lockdep subclass: stored in bits 16-19 of the lock flags. */
#define XFS_IOLOCK_SHIFT		16
#define XFS_IOLOCK_MAX_SUBCLASS		3
#define XFS_IOLOCK_DEP_MASK		0x000f0000

/* MMAPLOCK lockdep subclass: stored in bits 20-23 of the lock flags. */
#define XFS_MMAPLOCK_SHIFT		20
#define XFS_MMAPLOCK_NUMORDER		0
#define XFS_MMAPLOCK_MAX_SUBCLASS	3
#define XFS_MMAPLOCK_DEP_MASK		0x00f00000

/*
 * ILOCK lockdep subclass: stored in bits 24-31 of the lock flags.  Values
 * below XFS_ILOCK_PARENT_VAL are the nestable subclasses; PARENT, RTBITMAP
 * and RTSUM each get a dedicated value.
 */
#define XFS_ILOCK_SHIFT			24
#define XFS_ILOCK_PARENT_VAL		5
#define XFS_ILOCK_MAX_SUBCLASS		(XFS_ILOCK_PARENT_VAL - 1)
#define XFS_ILOCK_RTBITMAP_VAL		6
#define XFS_ILOCK_RTSUM_VAL		7
#define XFS_ILOCK_DEP_MASK		0xff000000
#define	XFS_ILOCK_PARENT		(XFS_ILOCK_PARENT_VAL << XFS_ILOCK_SHIFT)
#define	XFS_ILOCK_RTBITMAP		(XFS_ILOCK_RTBITMAP_VAL << XFS_ILOCK_SHIFT)
#define	XFS_ILOCK_RTSUM			(XFS_ILOCK_RTSUM_VAL << XFS_ILOCK_SHIFT)

/* All lockdep annotation bits, across the three lock types. */
#define XFS_LOCK_SUBCLASS_MASK	(XFS_IOLOCK_DEP_MASK | \
				 XFS_MMAPLOCK_DEP_MASK | \
				 XFS_ILOCK_DEP_MASK)

/* Extract the per-lock-type subclass value from a lock flags word. */
#define XFS_IOLOCK_DEP(flags)	(((flags) & XFS_IOLOCK_DEP_MASK) \
					>> XFS_IOLOCK_SHIFT)
#define XFS_MMAPLOCK_DEP(flags)	(((flags) & XFS_MMAPLOCK_DEP_MASK) \
					>> XFS_MMAPLOCK_SHIFT)
#define XFS_ILOCK_DEP(flags)	(((flags) & XFS_ILOCK_DEP_MASK) \
					>> XFS_ILOCK_SHIFT)
L
Linus Torvalds 已提交
355

356 357 358 359 360 361 362 363 364 365 366 367 368 369
/*
 * Layouts are broken in the BREAK_WRITE case to ensure that
 * layout-holders do not collide with local writes. Additionally,
 * layouts are broken in the BREAK_UNMAP case to make sure the
 * layout-holder has a consistent view of the file's extent map. While
 * BREAK_WRITE breaks can be satisfied by recalling FL_LAYOUT leases,
 * BREAK_UNMAP breaks additionally require waiting for busy dax-pages to
 * go idle.
 */
/* Why a layout is being broken; passed to xfs_break_layouts(). */
enum layout_break_reason {
	BREAK_WRITE = 0,	/* keep layout-holders from colliding with local writes */
	BREAK_UNMAP = 1,	/* give the layout-holder a consistent extent map view */
};

L
Linus Torvalds 已提交
370 371 372 373 374
/*
 * For multiple groups support: if S_ISGID bit is set in the parent
 * directory, group of new file is set to that of the parent, and
 * new subdirectory gets S_ISGID bit from parent.
 *
 * Evaluates to non-zero when the mount has XFS_MOUNT_GRPID set in m_flags or
 * when the parent inode @pip has S_ISGID set in its mode.  @pip is evaluated
 * more than once.
 */
#define XFS_INHERIT_GID(pip)	\
	(((pip)->i_mount->m_flags & XFS_MOUNT_GRPID) || \
	 (VFS_I(pip)->i_mode & S_ISGID))
L
Linus Torvalds 已提交
378

D
Dave Chinner 已提交
379
int		xfs_release(struct xfs_inode *ip);
380
void		xfs_inactive(struct xfs_inode *ip);
D
Dave Chinner 已提交
381 382
int		xfs_lookup(struct xfs_inode *dp, struct xfs_name *name,
			   struct xfs_inode **ipp, struct xfs_name *ci_name);
C
Christoph Hellwig 已提交
383 384
int		xfs_create(struct user_namespace *mnt_userns,
			   struct xfs_inode *dp, struct xfs_name *name,
385 386
			   umode_t mode, dev_t rdev, bool need_xattr,
			   struct xfs_inode **ipp);
C
Christoph Hellwig 已提交
387 388
int		xfs_create_tmpfile(struct user_namespace *mnt_userns,
			   struct xfs_inode *dp, umode_t mode,
389
			   struct xfs_inode **ipp);
D
Dave Chinner 已提交
390 391 392 393
int		xfs_remove(struct xfs_inode *dp, struct xfs_name *name,
			   struct xfs_inode *ip);
int		xfs_link(struct xfs_inode *tdp, struct xfs_inode *sip,
			 struct xfs_name *target_name);
C
Christoph Hellwig 已提交
394 395
int		xfs_rename(struct user_namespace *mnt_userns,
			   struct xfs_inode *src_dp, struct xfs_name *src_name,
D
Dave Chinner 已提交
396 397
			   struct xfs_inode *src_ip, struct xfs_inode *target_dp,
			   struct xfs_name *target_name,
398
			   struct xfs_inode *target_ip, unsigned int flags);
D
Dave Chinner 已提交
399

L
Linus Torvalds 已提交
400 401 402 403
void		xfs_ilock(xfs_inode_t *, uint);
int		xfs_ilock_nowait(xfs_inode_t *, uint);
void		xfs_iunlock(xfs_inode_t *, uint);
void		xfs_ilock_demote(xfs_inode_t *, uint);
C
Christoph Hellwig 已提交
404
int		xfs_isilocked(xfs_inode_t *, uint);
405
uint		xfs_ilock_data_map_shared(struct xfs_inode *);
406
uint		xfs_ilock_attr_map_shared(struct xfs_inode *);
407

L
Linus Torvalds 已提交
408
uint		xfs_ip2xflags(struct xfs_inode *);
409
int		xfs_ifree(struct xfs_trans *, struct xfs_inode *);
B
Brian Foster 已提交
410 411
int		xfs_itruncate_extents_flags(struct xfs_trans **,
				struct xfs_inode *, int, xfs_fsize_t, int);
L
Linus Torvalds 已提交
412
void		xfs_iext_realloc(xfs_inode_t *, int, int);
413

414
int		xfs_log_force_inode(struct xfs_inode *ip);
415
void		xfs_iunpin_wait(xfs_inode_t *);
416 417
/*
 * Read the inode's pin count with atomic_read() and return it as an
 * unsigned int.  The argument is parenthesized so that any pointer
 * expression (e.g. "ip + 1") expands correctly.
 */
#define xfs_ipincount(ip)	((unsigned int) atomic_read(&(ip)->i_pincount))

418
int		xfs_iflush_cluster(struct xfs_buf *);
419 420
void		xfs_lock_two_inodes(struct xfs_inode *ip0, uint ip0_mode,
				struct xfs_inode *ip1, uint ip1_mode);
L
Linus Torvalds 已提交
421

422
xfs_extlen_t	xfs_get_extsz_hint(struct xfs_inode *ip);
423
xfs_extlen_t	xfs_get_cowextsz_hint(struct xfs_inode *ip);
424

C
Christoph Hellwig 已提交
425 426 427
int		xfs_dir_ialloc(struct user_namespace *mnt_userns,
			       struct xfs_trans **tpp, struct xfs_inode *dp,
			       umode_t mode, xfs_nlink_t nlink, dev_t dev,
428 429
			       prid_t prid, bool need_xattr,
			       struct xfs_inode **ipp);
D
Dave Chinner 已提交
430

431 432 433 434 435 436 437
/*
 * Convenience wrapper around xfs_itruncate_extents_flags() that forwards
 * @tpp, @ip, @whichfork and @new_size unchanged and passes 0 as the trailing
 * argument.  Returns whatever xfs_itruncate_extents_flags() returns.
 */
static inline int
xfs_itruncate_extents(
	struct xfs_trans	**tpp,
	struct xfs_inode	*ip,
	int			whichfork,
	xfs_fsize_t		new_size)
{
	return xfs_itruncate_extents_flags(tpp, ip, whichfork, new_size, 0);
}

D
Dave Chinner 已提交
441
/* from xfs_file.c */
442 443 444 445 446 447 448
/*
 * Flag bits accepted by xfs_update_prealloc_flags().  Each value is a single
 * bit; bit 0 is not assigned.
 */
enum xfs_prealloc_flags {
	XFS_PREALLOC_SET	= 0x02,
	XFS_PREALLOC_CLEAR	= 0x04,
	XFS_PREALLOC_SYNC	= 0x08,
	XFS_PREALLOC_INVISIBLE	= 0x10,
};

449 450
int	xfs_update_prealloc_flags(struct xfs_inode *ip,
				  enum xfs_prealloc_flags flags);
451 452
int	xfs_break_layouts(struct inode *inode, uint *iolock,
		enum layout_break_reason reason);
D
Dave Chinner 已提交
453

454
/* from xfs_iops.c */
455 456
extern void xfs_setup_inode(struct xfs_inode *ip);
extern void xfs_setup_iops(struct xfs_inode *ip);
457
extern void xfs_diflags_to_iflags(struct xfs_inode *ip, bool init);
458

459 460 461 462 463 464 465 466 467 468 469 470
/*
 * When setting up a newly allocated inode, we need to call
 * xfs_finish_inode_setup() once the inode is fully instantiated at
 * the VFS level to prevent the rest of the world seeing the inode
 * before we've completed instantiation. Otherwise we can do it
 * the moment the inode lookup is complete.
 */
static inline void xfs_finish_inode_setup(struct xfs_inode *ip)
{
	xfs_iflags_clear(ip, XFS_INEW);
	barrier();
	unlock_new_inode(VFS_I(ip));
471
	wake_up_bit(&ip->i_flags, __XFS_INEW_BIT);
472 473 474 475 476
}

/*
 * Full setup sequence for @ip in one call: xfs_setup_inode(), then
 * xfs_setup_iops(), then xfs_finish_inode_setup().
 */
static inline void xfs_setup_existing_inode(struct xfs_inode *ip)
{
	xfs_setup_inode(ip);
	xfs_setup_iops(ip);
	xfs_finish_inode_setup(ip);
}

481
void xfs_irele(struct xfs_inode *ip);
482

L
Linus Torvalds 已提交
483 484
extern struct kmem_zone	*xfs_inode_zone;

485 486 487
/* The default CoW extent size hint. */
#define XFS_DEFAULT_COWEXTSZ_HINT 32

488 489 490
int xfs_iunlink_init(struct xfs_perag *pag);
void xfs_iunlink_destroy(struct xfs_perag *pag);

491 492
void xfs_end_io(struct work_struct *work);

493 494 495
int xfs_ilock2_io_mmap(struct xfs_inode *ip1, struct xfs_inode *ip2);
void xfs_iunlock2_io_mmap(struct xfs_inode *ip1, struct xfs_inode *ip2);

L
Linus Torvalds 已提交
496
#endif	/* __XFS_INODE_H__ */