xfs_inode.h 14.8 KB
Newer Older
D
Dave Chinner 已提交
1
// SPDX-License-Identifier: GPL-2.0
L
Linus Torvalds 已提交
2
/*
3 4
 * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc.
 * All Rights Reserved.
L
Linus Torvalds 已提交
5 6 7 8
 */
#ifndef	__XFS_INODE_H__
#define	__XFS_INODE_H__

9
#include "xfs_inode_buf.h"
10
#include "xfs_inode_fork.h"
L
Linus Torvalds 已提交
11

12
/*
13
 * Kernel only inode definitions
14
 */
15 16
struct xfs_dinode;
struct xfs_inode;
17 18 19 20 21 22 23
struct xfs_buf;
struct xfs_bmbt_irec;
struct xfs_inode_log_item;
struct xfs_mount;
struct xfs_trans;
struct xfs_dquot;

L
Linus Torvalds 已提交
24 25 26 27 28
typedef struct xfs_inode {
	/* Inode linking and identification information. */
	struct xfs_mount	*i_mount;	/* fs mount struct ptr */
	struct xfs_dquot	*i_udquot;	/* user dquot */
	struct xfs_dquot	*i_gdquot;	/* group dquot */
29
	struct xfs_dquot	*i_pdquot;	/* project dquot */
L
Linus Torvalds 已提交
30 31 32

	/* Inode location stuff */
	xfs_ino_t		i_ino;		/* inode number (agno/agino)*/
33
	struct xfs_imap		i_imap;		/* location for xfs_imap() */
L
Linus Torvalds 已提交
34 35

	/* Extent information. */
36 37 38
	struct xfs_ifork	*i_afp;		/* attribute fork pointer */
	struct xfs_ifork	*i_cowfp;	/* copy on write extents */
	struct xfs_ifork	i_df;		/* data fork */
L
Linus Torvalds 已提交
39 40 41 42

	/* Transaction and locking information. */
	struct xfs_inode_log_item *i_itemp;	/* logging information */
	mrlock_t		i_lock;		/* inode lock */
D
Dave Chinner 已提交
43
	mrlock_t		i_mmaplock;	/* inode mmap IO lock */
L
Linus Torvalds 已提交
44
	atomic_t		i_pincount;	/* inode pin count */
45 46 47 48 49 50 51 52

	/*
	 * Bitsets of inode metadata that have been checked and/or are sick.
	 * Callers must hold i_flags_lock before accessing this field.
	 */
	uint16_t		i_checked;
	uint16_t		i_sick;

53
	spinlock_t		i_flags_lock;	/* inode i_flags lock */
L
Linus Torvalds 已提交
54
	/* Miscellaneous state. */
55
	unsigned long		i_flags;	/* see defined flags below */
56
	uint64_t		i_delayed_blks;	/* count of delay alloc blks */
57
	prid_t			i_projid;	/* owner's project id */
L
Linus Torvalds 已提交
58

59
	struct xfs_icdinode	i_d;		/* most of ondisk inode */
L
Linus Torvalds 已提交
60

61 62
	/* VFS inode */
	struct inode		i_vnode;	/* embedded VFS inode */
63 64 65 66 67

	/* pending io completions */
	spinlock_t		i_ioend_lock;
	struct work_struct	i_ioend_work;
	struct list_head	i_ioend_list;
L
Linus Torvalds 已提交
68 69
} xfs_inode_t;

70 71 72
/* Convert from vfs inode to xfs inode */
static inline struct xfs_inode *XFS_I(struct inode *inode)
{
73
	return container_of(inode, struct xfs_inode, i_vnode);
74 75 76 77 78
}

/* convert from xfs inode to vfs inode */
static inline struct inode *VFS_I(struct xfs_inode *ip)
{
79
	return &ip->i_vnode;
80 81
}

82 83 84 85 86 87 88
/*
 * For regular files we only update the on-disk filesize when actually
 * writing data back to disk.  Until then only the copy in the VFS inode
 * is uptodate.
 */
static inline xfs_fsize_t XFS_ISIZE(struct xfs_inode *ip)
{
D
Dave Chinner 已提交
89
	if (S_ISREG(VFS_I(ip)->i_mode))
90 91 92 93
		return i_size_read(VFS_I(ip));
	return ip->i_d.di_size;
}

94 95 96 97 98 99 100 101 102
/*
 * If this I/O goes past the on-disk inode size update it unless it would
 * be past the current in-core inode size.
 *
 * @new_size is clamped to the VFS inode size when it exceeds that size or
 * is negative.  Returns the clamped size if it is larger than the current
 * di_size, or 0 if it is not.
 */
static inline xfs_fsize_t
xfs_new_eof(struct xfs_inode *ip, xfs_fsize_t new_size)
{
	xfs_fsize_t i_size = i_size_read(VFS_I(ip));

	if (new_size > i_size || new_size < 0)
		new_size = i_size;
	return new_size > ip->i_d.di_size ? new_size : 0;
}

108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147
/*
 * i_flags helper functions
 */
/* Set @flags in ip->i_flags; this helper takes no lock itself. */
static inline void
__xfs_iflags_set(xfs_inode_t *ip, unsigned short flags)
{
	ip->i_flags = ip->i_flags | flags;
}

/* Set @flags in ip->i_flags while holding i_flags_lock. */
static inline void
xfs_iflags_set(xfs_inode_t *ip, unsigned short flags)
{
	spinlock_t	*lock = &ip->i_flags_lock;

	spin_lock(lock);
	ip->i_flags |= flags;
	spin_unlock(lock);
}

/* Clear @flags from ip->i_flags while holding i_flags_lock. */
static inline void
xfs_iflags_clear(xfs_inode_t *ip, unsigned short flags)
{
	spinlock_t	*lock = &ip->i_flags_lock;

	spin_lock(lock);
	ip->i_flags = ip->i_flags & ~flags;
	spin_unlock(lock);
}

/*
 * Return the bits of @flags that are currently set in ip->i_flags (non-zero
 * if any is set); this helper takes no lock itself.
 */
static inline int
__xfs_iflags_test(xfs_inode_t *ip, unsigned short flags)
{
	unsigned long	masked = ip->i_flags & flags;

	return masked;
}

/*
 * Sample ip->i_flags under i_flags_lock and return the bits of @flags that
 * were set (non-zero if any was set).
 */
static inline int
xfs_iflags_test(xfs_inode_t *ip, unsigned short flags)
{
	int	found;

	spin_lock(&ip->i_flags_lock);
	found = ip->i_flags & flags;
	spin_unlock(&ip->i_flags_lock);

	return found;
}
148 149 150 151 152 153 154 155 156 157 158 159 160

/*
 * Under i_flags_lock, test whether any of @flags is set and, if so, clear
 * all of @flags.  Returns the bits that were set before clearing.
 */
static inline int
xfs_iflags_test_and_clear(xfs_inode_t *ip, unsigned short flags)
{
	int	was_set;

	spin_lock(&ip->i_flags_lock);
	was_set = ip->i_flags & flags;
	if (was_set != 0)
		ip->i_flags = ip->i_flags & ~flags;
	spin_unlock(&ip->i_flags_lock);

	return was_set;
}
L
Linus Torvalds 已提交
161

162 163 164 165 166 167 168 169 170 171 172 173 174
/*
 * Under i_flags_lock, test whether any of @flags is set and, only if none
 * is, set all of @flags.  Returns the bits that were already set, so a zero
 * return means this call set the flags.
 */
static inline int
xfs_iflags_test_and_set(xfs_inode_t *ip, unsigned short flags)
{
	int	was_set;

	spin_lock(&ip->i_flags_lock);
	was_set = ip->i_flags & flags;
	if (was_set == 0)
		ip->i_flags = ip->i_flags | flags;
	spin_unlock(&ip->i_flags_lock);

	return was_set;
}

175 176 177 178
static inline prid_t
xfs_get_initial_prid(struct xfs_inode *dp)
{
	if (dp->i_d.di_flags & XFS_DIFLAG_PROJINHERIT)
179
		return dp->i_projid;
180 181 182 183

	return XFS_PROJID_DEFAULT;
}

184 185 186 187 188
/* True if XFS_DIFLAG2_REFLINK is set in the inode's di_flags2. */
static inline bool xfs_is_reflink_inode(struct xfs_inode *ip)
{
	return (ip->i_d.di_flags2 & XFS_DIFLAG2_REFLINK) != 0;
}

189 190 191 192 193 194 195 196
/*
 * True if @ip is one of the mount's m_rbmip / m_rsumip inodes, or if
 * xfs_is_quota_inode() reports its inode number as a quota inode.
 */
static inline bool xfs_is_metadata_inode(struct xfs_inode *ip)
{
	struct xfs_mount	*mp = ip->i_mount;

	if (ip == mp->m_rbmip)
		return true;
	if (ip == mp->m_rsumip)
		return true;
	return xfs_is_quota_inode(&mp->m_sb, ip->i_ino);
}

197 198 199 200 201 202 203 204 205
/*
 * Report whether the COW fork of this inode currently holds any data.  An
 * inode carrying the reflink flag will often still return false here,
 * namely whenever no COW operation is pending.
 */
static inline bool xfs_inode_has_cow_data(struct xfs_inode *ip)
{
	/* No COW fork attached at all. */
	if (!ip->i_cowfp)
		return false;

	return ip->i_cowfp->if_bytes != 0;
}

206 207 208 209 210
/* True if XFS_DIFLAG2_BIGTIME is set in the inode's di_flags2. */
static inline bool xfs_inode_has_bigtime(struct xfs_inode *ip)
{
	return (ip->i_d.di_flags2 & XFS_DIFLAG2_BIGTIME) != 0;
}

211 212 213 214 215 216 217
/*
 * Buftarg used for data allocations on the given inode: the mount's
 * m_rtdev_targp for realtime inodes, m_ddev_targp for all others.
 * Note that @ip is evaluated more than once.
 */
#define xfs_inode_buftarg(ip) \
	(XFS_IS_REALTIME_INODE(ip) \
		? (ip)->i_mount->m_rtdev_targp \
		: (ip)->i_mount->m_ddev_targp)

L
Linus Torvalds 已提交
218 219 220
/*
 * In-core inode flags.
 */
221 222 223
#define XFS_IRECLAIM		(1 << 0) /* started reclaiming this inode */
#define XFS_ISTALE		(1 << 1) /* inode has been staled */
#define XFS_IRECLAIMABLE	(1 << 2) /* inode can be reclaimed */
#define __XFS_INEW_BIT		3	 /* inode has just been allocated */
#define XFS_INEW		(1 << __XFS_INEW_BIT)
#define XFS_IPRESERVE_DM_FIELDS	(1 << 4) /* has legacy DMAPI fields set */
#define XFS_ITRUNCATED		(1 << 5) /* truncated down so flush-on-close */
#define XFS_IDIRTY_RELEASE	(1 << 6) /* dirty release already seen */
#define XFS_IFLUSHING		(1 << 7) /* inode is being flushed */
#define __XFS_IPINNED_BIT	8	 /* wakeup key for zero pin count */
#define XFS_IPINNED		(1 << __XFS_IPINNED_BIT)
#define XFS_IEOFBLOCKS		(1 << 9) /* has the preallocblocks tag set */
/* Bit 10 is not assigned in this list. */
/*
 * If this unlinked inode is in the middle of recovery, don't let drop_inode
 * truncate and free the inode.  This can happen if we iget the inode during
 * log recovery to replay a bmap operation on the inode.
 */
#define XFS_IRECOVERY		(1 << 11)
#define XFS_ICOWBLOCKS		(1 << 12)/* has the cowblocks tag set */
L
Linus Torvalds 已提交
240

241 242
/*
 * Per-lifetime flags need to be reset when re-using a reclaimable inode during
 * inode lookup. This prevents unintended behaviour on the new inode from
 * occurring.
 */
#define XFS_IRECLAIM_RESET_FLAGS	\
	(XFS_IRECLAIMABLE | XFS_IRECLAIM | \
	 XFS_IDIRTY_RELEASE | XFS_ITRUNCATED)
249

L
Linus Torvalds 已提交
250 251
/*
 * Flags for inode locking.
252 253
 * Bit ranges:	1<<0  - 1<<16-1 -- iolock/ilock modes (bitfield)
 *		1<<16 - 1<<32-1 -- lockdep annotation (integers)
L
Linus Torvalds 已提交
254
 */
255 256 257 258
#define	XFS_IOLOCK_EXCL		(1<<0)
#define	XFS_IOLOCK_SHARED	(1<<1)
#define	XFS_ILOCK_EXCL		(1<<2)
#define	XFS_ILOCK_SHARED	(1<<3)
#define	XFS_MMAPLOCK_EXCL	(1<<4)
#define	XFS_MMAPLOCK_SHARED	(1<<5)

/* Union of every lock mode bit defined above. */
#define XFS_LOCK_MASK		(XFS_IOLOCK_EXCL | XFS_IOLOCK_SHARED \
				| XFS_ILOCK_EXCL | XFS_ILOCK_SHARED \
				| XFS_MMAPLOCK_EXCL | XFS_MMAPLOCK_SHARED)

/*
 * { flag, name } initializer pairs, one per lock mode bit, for use in a
 * flag-to-string table.
 */
#define XFS_LOCK_FLAGS \
	{ XFS_IOLOCK_EXCL,	"IOLOCK_EXCL" }, \
	{ XFS_IOLOCK_SHARED,	"IOLOCK_SHARED" }, \
	{ XFS_ILOCK_EXCL,	"ILOCK_EXCL" }, \
	{ XFS_ILOCK_SHARED,	"ILOCK_SHARED" }, \
	{ XFS_MMAPLOCK_EXCL,	"MMAPLOCK_EXCL" }, \
	{ XFS_MMAPLOCK_SHARED,	"MMAPLOCK_SHARED" }
C
Christoph Hellwig 已提交
273 274


275 276 277
/*
 * Flags for lockdep annotations.
 *
278
 * XFS_LOCK_PARENT - for directory operations that require locking a
279 280 281
 * parent directory inode and a child entry inode. IOLOCK requires nesting,
 * MMAPLOCK does not support this class, ILOCK requires a single subclass
 * to differentiate parent from child.
282 283 284 285
 *
 * XFS_LOCK_RTBITMAP/XFS_LOCK_RTSUM - the realtime device bitmap and summary
 * inodes do not participate in the normal lock order, and thus have their
 * own subclasses.
286
 *
287
 * XFS_LOCK_INUMORDER - for locking several inodes at the same time
288 289
 * with xfs_lock_inodes().  This flag is used as the starting subclass
 * and each subsequent lock acquired will increment the subclass by one.
290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310
 * However, MAX_LOCKDEP_SUBCLASSES == 8, which means we are greatly
 * limited to the subclasses we can represent via nesting. We need at least
 * 5 inodes nest depth for the ILOCK through rename, and we also have to support
 * XFS_ILOCK_PARENT, which gives 6 subclasses. Then we have XFS_ILOCK_RTBITMAP
 * and XFS_ILOCK_RTSUM, which are another 2 unique subclasses, so that's all
 * 8 subclasses supported by lockdep.
 *
 * This also means we have to number the sub-classes in the lowest bits of
 * the mask we keep, and we have to ensure we never exceed 3 bits of lockdep
 * mask and we can't use bit-masking to build the subclasses. What a mess.
 *
 * Bit layout:
 *
 * Bit		Lock Region
 * 16-19	XFS_IOLOCK_SHIFT dependencies
 * 20-23	XFS_MMAPLOCK_SHIFT dependencies
 * 24-31	XFS_ILOCK_SHIFT dependencies
 *
 * IOLOCK values
 *
 * 0-3		subclass value
311
 * 4-7		unused
312 313 314 315 316 317 318 319 320 321 322 323
 *
 * MMAPLOCK values
 *
 * 0-3		subclass value
 * 4-7		unused
 *
 * ILOCK values
 * 0-4		subclass values
 * 5		PARENT subclass (not nestable)
 * 6		RTBITMAP subclass (not nestable)
 * 7		RTSUM subclass (not nestable)
 * 
324
 */
325
#define XFS_IOLOCK_SHIFT		16
#define XFS_IOLOCK_MAX_SUBCLASS		3
#define XFS_IOLOCK_DEP_MASK		0x000f0000

#define XFS_MMAPLOCK_SHIFT		20
#define XFS_MMAPLOCK_NUMORDER		0
#define XFS_MMAPLOCK_MAX_SUBCLASS	3
#define XFS_MMAPLOCK_DEP_MASK		0x00f00000

#define XFS_ILOCK_SHIFT			24
#define XFS_ILOCK_PARENT_VAL		5
#define XFS_ILOCK_MAX_SUBCLASS		(XFS_ILOCK_PARENT_VAL - 1)
#define XFS_ILOCK_RTBITMAP_VAL		6
#define XFS_ILOCK_RTSUM_VAL		7
#define XFS_ILOCK_DEP_MASK		0xff000000
#define	XFS_ILOCK_PARENT		(XFS_ILOCK_PARENT_VAL << XFS_ILOCK_SHIFT)
#define	XFS_ILOCK_RTBITMAP		(XFS_ILOCK_RTBITMAP_VAL << XFS_ILOCK_SHIFT)
#define	XFS_ILOCK_RTSUM			(XFS_ILOCK_RTSUM_VAL << XFS_ILOCK_SHIFT)

/* All bits that carry a lockdep subclass for any of the three locks. */
#define XFS_LOCK_SUBCLASS_MASK	(XFS_IOLOCK_DEP_MASK | \
				 XFS_MMAPLOCK_DEP_MASK | \
				 XFS_ILOCK_DEP_MASK)

/* Extract the per-lock subclass value from a lock flags word. */
#define XFS_IOLOCK_DEP(flags)	(((flags) & XFS_IOLOCK_DEP_MASK) \
					>> XFS_IOLOCK_SHIFT)
#define XFS_MMAPLOCK_DEP(flags)	(((flags) & XFS_MMAPLOCK_DEP_MASK) \
					>> XFS_MMAPLOCK_SHIFT)
#define XFS_ILOCK_DEP(flags)	(((flags) & XFS_ILOCK_DEP_MASK) \
					>> XFS_ILOCK_SHIFT)
L
Linus Torvalds 已提交
354

355 356 357 358 359 360 361 362 363 364 365 366 367 368
/*
 * Layouts are broken in the BREAK_WRITE case to ensure that
 * layout-holders do not collide with local writes. Additionally,
 * layouts are broken in the BREAK_UNMAP case to make sure the
 * layout-holder has a consistent view of the file's extent map. While
 * BREAK_WRITE breaks can be satisfied by recalling FL_LAYOUT leases,
 * BREAK_UNMAP breaks additionally require waiting for busy dax-pages to
 * go idle.
 */
enum layout_break_reason {
	/* keep layout-holders from colliding with local writes */
	BREAK_WRITE,
	/* give the layout-holder a consistent view of the extent map */
	BREAK_UNMAP,
};

L
Linus Torvalds 已提交
369 370 371 372 373
/*
 * For multiple groups support: if S_ISGID bit is set in the parent
 * directory, group of new file is set to that of the parent, and
 * new subdirectory gets S_ISGID bit from parent.
 *
 * Evaluates to non-zero when the mount has XFS_MOUNT_GRPID set or the
 * parent inode @pip has S_ISGID set in its mode.
 */
#define XFS_INHERIT_GID(pip)	\
	(((pip)->i_mount->m_flags & XFS_MOUNT_GRPID) || \
	 (VFS_I(pip)->i_mode & S_ISGID))
L
Linus Torvalds 已提交
377

D
Dave Chinner 已提交
378
int		xfs_release(struct xfs_inode *ip);
379
void		xfs_inactive(struct xfs_inode *ip);
D
Dave Chinner 已提交
380 381
int		xfs_lookup(struct xfs_inode *dp, struct xfs_name *name,
			   struct xfs_inode **ipp, struct xfs_name *ci_name);
C
Christoph Hellwig 已提交
382 383
int		xfs_create(struct user_namespace *mnt_userns,
			   struct xfs_inode *dp, struct xfs_name *name,
384 385
			   umode_t mode, dev_t rdev, bool need_xattr,
			   struct xfs_inode **ipp);
C
Christoph Hellwig 已提交
386 387
int		xfs_create_tmpfile(struct user_namespace *mnt_userns,
			   struct xfs_inode *dp, umode_t mode,
388
			   struct xfs_inode **ipp);
D
Dave Chinner 已提交
389 390 391 392
int		xfs_remove(struct xfs_inode *dp, struct xfs_name *name,
			   struct xfs_inode *ip);
int		xfs_link(struct xfs_inode *tdp, struct xfs_inode *sip,
			 struct xfs_name *target_name);
C
Christoph Hellwig 已提交
393 394
int		xfs_rename(struct user_namespace *mnt_userns,
			   struct xfs_inode *src_dp, struct xfs_name *src_name,
D
Dave Chinner 已提交
395 396
			   struct xfs_inode *src_ip, struct xfs_inode *target_dp,
			   struct xfs_name *target_name,
397
			   struct xfs_inode *target_ip, unsigned int flags);
D
Dave Chinner 已提交
398

L
Linus Torvalds 已提交
399 400 401 402
void		xfs_ilock(xfs_inode_t *, uint);
int		xfs_ilock_nowait(xfs_inode_t *, uint);
void		xfs_iunlock(xfs_inode_t *, uint);
void		xfs_ilock_demote(xfs_inode_t *, uint);
C
Christoph Hellwig 已提交
403
int		xfs_isilocked(xfs_inode_t *, uint);
404
uint		xfs_ilock_data_map_shared(struct xfs_inode *);
405
uint		xfs_ilock_attr_map_shared(struct xfs_inode *);
406

L
Linus Torvalds 已提交
407
uint		xfs_ip2xflags(struct xfs_inode *);
408
int		xfs_ifree(struct xfs_trans *, struct xfs_inode *);
B
Brian Foster 已提交
409 410
int		xfs_itruncate_extents_flags(struct xfs_trans **,
				struct xfs_inode *, int, xfs_fsize_t, int);
L
Linus Torvalds 已提交
411
void		xfs_iext_realloc(xfs_inode_t *, int, int);
412

413
int		xfs_log_force_inode(struct xfs_inode *ip);
414
void		xfs_iunpin_wait(xfs_inode_t *);
415 416
/* Current value of the inode's i_pincount, read as an unsigned int. */
#define xfs_ipincount(ip)	((unsigned int) atomic_read(&(ip)->i_pincount))

417
int		xfs_iflush_cluster(struct xfs_buf *);
418 419
void		xfs_lock_two_inodes(struct xfs_inode *ip0, uint ip0_mode,
				struct xfs_inode *ip1, uint ip1_mode);
L
Linus Torvalds 已提交
420

421
xfs_extlen_t	xfs_get_extsz_hint(struct xfs_inode *ip);
422
xfs_extlen_t	xfs_get_cowextsz_hint(struct xfs_inode *ip);
423

C
Christoph Hellwig 已提交
424 425 426
int		xfs_dir_ialloc(struct user_namespace *mnt_userns,
			       struct xfs_trans **tpp, struct xfs_inode *dp,
			       umode_t mode, xfs_nlink_t nlink, dev_t dev,
427 428
			       prid_t prid, bool need_xattr,
			       struct xfs_inode **ipp);
D
Dave Chinner 已提交
429

430 431 432 433 434 435 436
/*
 * Convenience wrapper: call xfs_itruncate_extents_flags() with a flags
 * argument of 0 and return its result.
 */
static inline int
xfs_itruncate_extents(
	struct xfs_trans	**tpp,
	struct xfs_inode	*ip,
	int			whichfork,
	xfs_fsize_t		new_size)
{
	return xfs_itruncate_extents_flags(tpp, ip, whichfork, new_size, 0);
}

D
Dave Chinner 已提交
440
/* from xfs_file.c */
441 442 443 444 445 446 447
/* Bit flags accepted by xfs_update_prealloc_flags(); bit 0 is not used. */
enum xfs_prealloc_flags {
	XFS_PREALLOC_SET	= 0x02,
	XFS_PREALLOC_CLEAR	= 0x04,
	XFS_PREALLOC_SYNC	= 0x08,
	XFS_PREALLOC_INVISIBLE	= 0x10,
};

448 449
int	xfs_update_prealloc_flags(struct xfs_inode *ip,
				  enum xfs_prealloc_flags flags);
450 451
int	xfs_break_layouts(struct inode *inode, uint *iolock,
		enum layout_break_reason reason);
D
Dave Chinner 已提交
452

453
/* from xfs_iops.c */
454 455
extern void xfs_setup_inode(struct xfs_inode *ip);
extern void xfs_setup_iops(struct xfs_inode *ip);
456
extern void xfs_diflags_to_iflags(struct xfs_inode *ip, bool init);
457

458 459 460 461 462 463 464 465 466 467 468 469
/*
 * When setting up a newly allocated inode, we need to call
 * xfs_finish_inode_setup() once the inode is fully instantiated at
 * the VFS level to prevent the rest of the world seeing the inode
 * before we've completed instantiation. Otherwise we can do it
 * the moment the inode lookup is complete.
 */
static inline void xfs_finish_inode_setup(struct xfs_inode *ip)
{
	xfs_iflags_clear(ip, XFS_INEW);
	barrier();
	unlock_new_inode(VFS_I(ip));
470
	wake_up_bit(&ip->i_flags, __XFS_INEW_BIT);
471 472 473 474 475
}

/*
 * Run the full setup sequence on an inode in one go: xfs_setup_inode(),
 * xfs_setup_iops(), then xfs_finish_inode_setup().
 */
static inline void xfs_setup_existing_inode(struct xfs_inode *ip)
{
	xfs_setup_inode(ip);
	xfs_setup_iops(ip);
	xfs_finish_inode_setup(ip);
}

480
void xfs_irele(struct xfs_inode *ip);
481

L
Linus Torvalds 已提交
482 483
extern struct kmem_zone	*xfs_inode_zone;

484 485 486
/* Default copy-on-write extent size hint. */
#define XFS_DEFAULT_COWEXTSZ_HINT	32

487 488 489
int xfs_iunlink_init(struct xfs_perag *pag);
void xfs_iunlink_destroy(struct xfs_perag *pag);

490 491
void xfs_end_io(struct work_struct *work);

492 493 494
int xfs_ilock2_io_mmap(struct xfs_inode *ip1, struct xfs_inode *ip2);
void xfs_iunlock2_io_mmap(struct xfs_inode *ip1, struct xfs_inode *ip2);

L
Linus Torvalds 已提交
495
#endif	/* __XFS_INODE_H__ */