xfs_super.c 56.1 KB
Newer Older
L
Linus Torvalds 已提交
1
/*
2
 * Copyright (c) 2000-2006 Silicon Graphics, Inc.
3
 * All Rights Reserved.
L
Linus Torvalds 已提交
4
 *
5 6
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
L
Linus Torvalds 已提交
7 8
 * published by the Free Software Foundation.
 *
9 10 11 12
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
L
Linus Torvalds 已提交
13
 *
14 15 16
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
L
Linus Torvalds 已提交
17
 */
C
Christoph Hellwig 已提交
18

L
Linus Torvalds 已提交
19
#include "xfs.h"
20
#include "xfs_shared.h"
21
#include "xfs_format.h"
22 23
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
24 25
#include "xfs_sb.h"
#include "xfs_mount.h"
26
#include "xfs_da_format.h"
L
Linus Torvalds 已提交
27
#include "xfs_inode.h"
28
#include "xfs_btree.h"
L
Linus Torvalds 已提交
29
#include "xfs_bmap.h"
30
#include "xfs_alloc.h"
L
Linus Torvalds 已提交
31
#include "xfs_error.h"
C
Christoph Hellwig 已提交
32
#include "xfs_fsops.h"
33
#include "xfs_trans.h"
L
Linus Torvalds 已提交
34
#include "xfs_buf_item.h"
35
#include "xfs_log.h"
36
#include "xfs_log_priv.h"
37
#include "xfs_da_btree.h"
38
#include "xfs_dir2.h"
39 40 41
#include "xfs_extfree_item.h"
#include "xfs_mru_cache.h"
#include "xfs_inode_item.h"
42
#include "xfs_icache.h"
C
Christoph Hellwig 已提交
43
#include "xfs_trace.h"
D
Dave Chinner 已提交
44
#include "xfs_icreate_item.h"
45 46
#include "xfs_filestream.h"
#include "xfs_quota.h"
47
#include "xfs_sysfs.h"
48
#include "xfs_ondisk.h"
49
#include "xfs_rmap_item.h"
50
#include "xfs_refcount_item.h"
51
#include "xfs_bmap_item.h"
52
#include "xfs_reflink.h"
L
Linus Torvalds 已提交
53 54

#include <linux/namei.h>
55
#include <linux/dax.h>
L
Linus Torvalds 已提交
56
#include <linux/init.h>
57
#include <linux/slab.h>
L
Linus Torvalds 已提交
58
#include <linux/mount.h>
59
#include <linux/mempool.h>
L
Linus Torvalds 已提交
60
#include <linux/writeback.h>
61
#include <linux/kthread.h>
62
#include <linux/freezer.h>
63
#include <linux/parser.h>
L
Linus Torvalds 已提交
64

65
static const struct super_operations xfs_super_operations;
66
struct bio_set *xfs_ioend_bioset;
67

D
Dave Chinner 已提交
68
static struct kset *xfs_kset;		/* top-level xfs sysfs dir */
69 70 71
#ifdef DEBUG
static struct xfs_kobj xfs_dbg_kobj;	/* global debug sysfs attrs */
#endif
L
Linus Torvalds 已提交
72

73 74 75 76
/*
 * Table driven mount option parser.
 */
enum {
77 78 79 80 81 82 83 84 85 86
	Opt_logbufs, Opt_logbsize, Opt_logdev, Opt_rtdev, Opt_biosize,
	Opt_wsync, Opt_noalign, Opt_swalloc, Opt_sunit, Opt_swidth, Opt_nouuid,
	Opt_mtpt, Opt_grpid, Opt_nogrpid, Opt_bsdgroups, Opt_sysvgroups,
	Opt_allocsize, Opt_norecovery, Opt_barrier, Opt_nobarrier,
	Opt_inode64, Opt_inode32, Opt_ikeep, Opt_noikeep,
	Opt_largeio, Opt_nolargeio, Opt_attr2, Opt_noattr2, Opt_filestreams,
	Opt_quota, Opt_noquota, Opt_usrquota, Opt_grpquota, Opt_prjquota,
	Opt_uquota, Opt_gquota, Opt_pquota,
	Opt_uqnoenforce, Opt_gqnoenforce, Opt_pqnoenforce, Opt_qnoenforce,
	Opt_discard, Opt_nodiscard, Opt_dax, Opt_err,
87 88
};

89
static const match_table_t tokens = {
90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134
	{Opt_logbufs,	"logbufs=%u"},	/* number of XFS log buffers */
	{Opt_logbsize,	"logbsize=%s"},	/* size of XFS log buffers */
	{Opt_logdev,	"logdev=%s"},	/* log device */
	{Opt_rtdev,	"rtdev=%s"},	/* realtime I/O device */
	{Opt_biosize,	"biosize=%u"},	/* log2 of preferred buffered io size */
	{Opt_wsync,	"wsync"},	/* safe-mode nfs compatible mount */
	{Opt_noalign,	"noalign"},	/* turn off stripe alignment */
	{Opt_swalloc,	"swalloc"},	/* turn on stripe width allocation */
	{Opt_sunit,	"sunit=%u"},	/* data volume stripe unit */
	{Opt_swidth,	"swidth=%u"},	/* data volume stripe width */
	{Opt_nouuid,	"nouuid"},	/* ignore filesystem UUID */
	{Opt_mtpt,	"mtpt"},	/* filesystem mount point */
	{Opt_grpid,	"grpid"},	/* group-ID from parent directory */
	{Opt_nogrpid,	"nogrpid"},	/* group-ID from current process */
	{Opt_bsdgroups,	"bsdgroups"},	/* group-ID from parent directory */
	{Opt_sysvgroups,"sysvgroups"},	/* group-ID from current process */
	{Opt_allocsize,	"allocsize=%s"},/* preferred allocation size */
	{Opt_norecovery,"norecovery"},	/* don't run XFS recovery */
	{Opt_inode64,	"inode64"},	/* inodes can be allocated anywhere */
	{Opt_inode32,   "inode32"},	/* inode allocation limited to
					 * XFS_MAXINUMBER_32 */
	{Opt_ikeep,	"ikeep"},	/* do not free empty inode clusters */
	{Opt_noikeep,	"noikeep"},	/* free empty inode clusters */
	{Opt_largeio,	"largeio"},	/* report large I/O sizes in stat() */
	{Opt_nolargeio,	"nolargeio"},	/* do not report large I/O sizes
					 * in stat(). */
	{Opt_attr2,	"attr2"},	/* do use attr2 attribute format */
	{Opt_noattr2,	"noattr2"},	/* do not use attr2 attribute format */
	{Opt_filestreams,"filestreams"},/* use filestreams allocator */
	{Opt_quota,	"quota"},	/* disk quotas (user) */
	{Opt_noquota,	"noquota"},	/* no quotas */
	{Opt_usrquota,	"usrquota"},	/* user quota enabled */
	{Opt_grpquota,	"grpquota"},	/* group quota enabled */
	{Opt_prjquota,	"prjquota"},	/* project quota enabled */
	{Opt_uquota,	"uquota"},	/* user quota (IRIX variant) */
	{Opt_gquota,	"gquota"},	/* group quota (IRIX variant) */
	{Opt_pquota,	"pquota"},	/* project quota (IRIX variant) */
	{Opt_uqnoenforce,"uqnoenforce"},/* user quota limit enforcement */
	{Opt_gqnoenforce,"gqnoenforce"},/* group quota limit enforcement */
	{Opt_pqnoenforce,"pqnoenforce"},/* project quota limit enforcement */
	{Opt_qnoenforce, "qnoenforce"},	/* same as uqnoenforce */
	{Opt_discard,	"discard"},	/* Discard unused blocks */
	{Opt_nodiscard,	"nodiscard"},	/* Do not discard unused blocks */

	{Opt_dax,	"dax"},		/* Enable direct access to bdev pages */
135 136 137 138 139 140

	/* Deprecated mount options scheduled for removal */
	{Opt_barrier,	"barrier"},	/* use writer barriers for log write and
					 * unwritten extent conversion */
	{Opt_nobarrier,	"nobarrier"},	/* .. disable */

141
	{Opt_err,	NULL},
142 143 144
};


145
STATIC int
146
suffix_kstrtoint(const substring_t *s, unsigned int base, int *res)
147
{
148
	int	last, shift_left_factor = 0, _res;
149 150 151 152 153 154
	char	*value;
	int	ret = 0;

	value = match_strdup(s);
	if (!value)
		return -ENOMEM;
155 156 157 158 159 160 161 162 163 164 165 166 167 168 169

	last = strlen(value) - 1;
	if (value[last] == 'K' || value[last] == 'k') {
		shift_left_factor = 10;
		value[last] = '\0';
	}
	if (value[last] == 'M' || value[last] == 'm') {
		shift_left_factor = 20;
		value[last] = '\0';
	}
	if (value[last] == 'G' || value[last] == 'g') {
		shift_left_factor = 30;
		value[last] = '\0';
	}

170 171 172
	if (kstrtoint(value, base, &_res))
		ret = -EINVAL;
	kfree(value);
173
	*res = _res << shift_left_factor;
174
	return ret;
175 176
}

177 178 179 180 181 182
/*
 * This function fills in xfs_mount_t fields based on mount args.
 * Note: the superblock has _not_ yet been read in.
 *
 * Note that this function leaks the various device name allocations on
 * failure.  The caller takes care of them.
E
Eric Sandeen 已提交
183 184 185 186
 *
 * *sb is const because this is also used to test options on the remount
 * path, and we don't want this to have any side effects at remount time.
 * Today this function does not change *sb, but just to future-proof...
187
 */
188 189 190
STATIC int
xfs_parseargs(
	struct xfs_mount	*mp,
C
Christoph Hellwig 已提交
191
	char			*options)
192
{
E
Eric Sandeen 已提交
193
	const struct super_block *sb = mp->m_super;
194 195
	char			*p;
	substring_t		args[MAX_OPT_ARGS];
196 197 198
	int			dsunit = 0;
	int			dswidth = 0;
	int			iosize = 0;
199
	uint8_t			iosizelog = 0;
200

201 202 203 204 205 206
	/*
	 * set up the mount name first so all the errors will refer to the
	 * correct device.
	 */
	mp->m_fsname = kstrndup(sb->s_id, MAXNAMELEN, GFP_KERNEL);
	if (!mp->m_fsname)
D
Dave Chinner 已提交
207
		return -ENOMEM;
208 209
	mp->m_fsname_len = strlen(mp->m_fsname) + 1;

210 211 212
	/*
	 * Copy binary VFS mount flags we are interested in.
	 */
213
	if (sb_rdonly(sb))
214
		mp->m_flags |= XFS_MOUNT_RDONLY;
215
	if (sb->s_flags & SB_DIRSYNC)
216
		mp->m_flags |= XFS_MOUNT_DIRSYNC;
217
	if (sb->s_flags & SB_SYNCHRONOUS)
218 219 220 221 222 223 224 225
		mp->m_flags |= XFS_MOUNT_WSYNC;

	/*
	 * Set some default flags that could be cleared by the mount option
	 * parsing.
	 */
	mp->m_flags |= XFS_MOUNT_BARRIER;
	mp->m_flags |= XFS_MOUNT_COMPAT_IOSIZE;
226

227 228 229 230 231
	/*
	 * These can be overridden by the mount option parsing.
	 */
	mp->m_logbufs = -1;
	mp->m_logbsize = -1;
232 233 234 235

	if (!options)
		goto done;

236 237 238 239
	while ((p = strsep(&options, ",")) != NULL) {
		int		token;

		if (!*p)
240 241
			continue;

242 243 244 245
		token = match_token(p, tokens, args);
		switch (token) {
		case Opt_logbufs:
			if (match_int(args, &mp->m_logbufs))
D
Dave Chinner 已提交
246
				return -EINVAL;
247 248 249
			break;
		case Opt_logbsize:
			if (suffix_kstrtoint(args, 10, &mp->m_logbsize))
D
Dave Chinner 已提交
250
				return -EINVAL;
251 252
			break;
		case Opt_logdev:
253
			kfree(mp->m_logname);
254
			mp->m_logname = match_strdup(args);
255
			if (!mp->m_logname)
D
Dave Chinner 已提交
256
				return -ENOMEM;
257 258 259
			break;
		case Opt_mtpt:
			xfs_warn(mp, "%s option not allowed on this system", p);
D
Dave Chinner 已提交
260
			return -EINVAL;
261
		case Opt_rtdev:
262
			kfree(mp->m_rtname);
263
			mp->m_rtname = match_strdup(args);
264
			if (!mp->m_rtname)
D
Dave Chinner 已提交
265
				return -ENOMEM;
266 267 268 269
			break;
		case Opt_allocsize:
		case Opt_biosize:
			if (suffix_kstrtoint(args, 10, &iosize))
D
Dave Chinner 已提交
270
				return -EINVAL;
271
			iosizelog = ffs(iosize) - 1;
272 273 274
			break;
		case Opt_grpid:
		case Opt_bsdgroups:
275
			mp->m_flags |= XFS_MOUNT_GRPID;
276 277 278
			break;
		case Opt_nogrpid:
		case Opt_sysvgroups:
279
			mp->m_flags &= ~XFS_MOUNT_GRPID;
280 281
			break;
		case Opt_wsync:
282
			mp->m_flags |= XFS_MOUNT_WSYNC;
283 284
			break;
		case Opt_norecovery:
285
			mp->m_flags |= XFS_MOUNT_NORECOVERY;
286 287
			break;
		case Opt_noalign:
288
			mp->m_flags |= XFS_MOUNT_NOALIGN;
289 290
			break;
		case Opt_swalloc:
291
			mp->m_flags |= XFS_MOUNT_SWALLOC;
292 293 294
			break;
		case Opt_sunit:
			if (match_int(args, &dsunit))
D
Dave Chinner 已提交
295
				return -EINVAL;
296 297 298
			break;
		case Opt_swidth:
			if (match_int(args, &dswidth))
D
Dave Chinner 已提交
299
				return -EINVAL;
300 301
			break;
		case Opt_inode32:
302
			mp->m_flags |= XFS_MOUNT_SMALL_INUMS;
303 304
			break;
		case Opt_inode64:
305
			mp->m_flags &= ~XFS_MOUNT_SMALL_INUMS;
306 307
			break;
		case Opt_nouuid:
308
			mp->m_flags |= XFS_MOUNT_NOUUID;
309 310
			break;
		case Opt_ikeep:
311
			mp->m_flags |= XFS_MOUNT_IKEEP;
312 313
			break;
		case Opt_noikeep:
314
			mp->m_flags &= ~XFS_MOUNT_IKEEP;
315 316
			break;
		case Opt_largeio:
317
			mp->m_flags &= ~XFS_MOUNT_COMPAT_IOSIZE;
318 319
			break;
		case Opt_nolargeio:
320
			mp->m_flags |= XFS_MOUNT_COMPAT_IOSIZE;
321 322
			break;
		case Opt_attr2:
323
			mp->m_flags |= XFS_MOUNT_ATTR2;
324 325
			break;
		case Opt_noattr2:
326 327
			mp->m_flags &= ~XFS_MOUNT_ATTR2;
			mp->m_flags |= XFS_MOUNT_NOATTR2;
328 329
			break;
		case Opt_filestreams:
330
			mp->m_flags |= XFS_MOUNT_FILESTREAMS;
331 332
			break;
		case Opt_noquota:
333 334 335
			mp->m_qflags &= ~XFS_ALL_QUOTA_ACCT;
			mp->m_qflags &= ~XFS_ALL_QUOTA_ENFD;
			mp->m_qflags &= ~XFS_ALL_QUOTA_ACTIVE;
336 337 338 339
			break;
		case Opt_quota:
		case Opt_uquota:
		case Opt_usrquota:
340 341
			mp->m_qflags |= (XFS_UQUOTA_ACCT | XFS_UQUOTA_ACTIVE |
					 XFS_UQUOTA_ENFD);
342 343 344
			break;
		case Opt_qnoenforce:
		case Opt_uqnoenforce:
345 346
			mp->m_qflags |= (XFS_UQUOTA_ACCT | XFS_UQUOTA_ACTIVE);
			mp->m_qflags &= ~XFS_UQUOTA_ENFD;
347 348 349
			break;
		case Opt_pquota:
		case Opt_prjquota:
350
			mp->m_qflags |= (XFS_PQUOTA_ACCT | XFS_PQUOTA_ACTIVE |
351
					 XFS_PQUOTA_ENFD);
352 353
			break;
		case Opt_pqnoenforce:
354
			mp->m_qflags |= (XFS_PQUOTA_ACCT | XFS_PQUOTA_ACTIVE);
355
			mp->m_qflags &= ~XFS_PQUOTA_ENFD;
356
			break;
357 358
		case Opt_gquota:
		case Opt_grpquota:
359
			mp->m_qflags |= (XFS_GQUOTA_ACCT | XFS_GQUOTA_ACTIVE |
360
					 XFS_GQUOTA_ENFD);
361 362
			break;
		case Opt_gqnoenforce:
363
			mp->m_qflags |= (XFS_GQUOTA_ACCT | XFS_GQUOTA_ACTIVE);
364
			mp->m_qflags &= ~XFS_GQUOTA_ENFD;
365 366
			break;
		case Opt_discard:
367
			mp->m_flags |= XFS_MOUNT_DISCARD;
368 369
			break;
		case Opt_nodiscard:
370
			mp->m_flags &= ~XFS_MOUNT_DISCARD;
371
			break;
D
Dave Chinner 已提交
372
#ifdef CONFIG_FS_DAX
373
		case Opt_dax:
D
Dave Chinner 已提交
374
			mp->m_flags |= XFS_MOUNT_DAX;
375
			break;
D
Dave Chinner 已提交
376
#endif
377 378 379 380 381 382 383 384
		case Opt_barrier:
			xfs_warn(mp, "%s option is deprecated, ignoring.", p);
			mp->m_flags |= XFS_MOUNT_BARRIER;
			break;
		case Opt_nobarrier:
			xfs_warn(mp, "%s option is deprecated, ignoring.", p);
			mp->m_flags &= ~XFS_MOUNT_BARRIER;
			break;
385 386
		default:
			xfs_warn(mp, "unknown mount option [%s].", p);
D
Dave Chinner 已提交
387
			return -EINVAL;
388 389 390
		}
	}

391 392 393 394 395
	/*
	 * no recovery flag requires a read-only mount
	 */
	if ((mp->m_flags & XFS_MOUNT_NORECOVERY) &&
	    !(mp->m_flags & XFS_MOUNT_RDONLY)) {
396
		xfs_warn(mp, "no-recovery mounts must be read-only.");
D
Dave Chinner 已提交
397
		return -EINVAL;
398 399
	}

400
	if ((mp->m_flags & XFS_MOUNT_NOALIGN) && (dsunit || dswidth)) {
401 402
		xfs_warn(mp,
	"sunit and swidth options incompatible with the noalign option");
D
Dave Chinner 已提交
403
		return -EINVAL;
404 405
	}

C
Christoph Hellwig 已提交
406 407
#ifndef CONFIG_XFS_QUOTA
	if (XFS_IS_QUOTA_RUNNING(mp)) {
408
		xfs_warn(mp, "quota support not available in this kernel.");
D
Dave Chinner 已提交
409
		return -EINVAL;
C
Christoph Hellwig 已提交
410 411 412
	}
#endif

413
	if ((dsunit && !dswidth) || (!dsunit && dswidth)) {
414
		xfs_warn(mp, "sunit and swidth must be specified together");
D
Dave Chinner 已提交
415
		return -EINVAL;
416 417 418
	}

	if (dsunit && (dswidth % dsunit != 0)) {
419 420
		xfs_warn(mp,
	"stripe width (%d) must be a multiple of the stripe unit (%d)",
421
			dswidth, dsunit);
D
Dave Chinner 已提交
422
		return -EINVAL;
423 424
	}

425
done:
J
Jie Liu 已提交
426
	if (dsunit && !(mp->m_flags & XFS_MOUNT_NOALIGN)) {
427 428 429 430 431 432
		/*
		 * At this point the superblock has not been read
		 * in, therefore we do not know the block size.
		 * Before the mount call ends we will convert
		 * these to FSBs.
		 */
J
Jie Liu 已提交
433 434
		mp->m_dalign = dsunit;
		mp->m_swidth = dswidth;
435 436 437 438 439 440
	}

	if (mp->m_logbufs != -1 &&
	    mp->m_logbufs != 0 &&
	    (mp->m_logbufs < XLOG_MIN_ICLOGS ||
	     mp->m_logbufs > XLOG_MAX_ICLOGS)) {
441
		xfs_warn(mp, "invalid logbufs value: %d [not %d-%d]",
442
			mp->m_logbufs, XLOG_MIN_ICLOGS, XLOG_MAX_ICLOGS);
D
Dave Chinner 已提交
443
		return -EINVAL;
444 445 446 447 448 449
	}
	if (mp->m_logbsize != -1 &&
	    mp->m_logbsize !=  0 &&
	    (mp->m_logbsize < XLOG_MIN_RECORD_BSIZE ||
	     mp->m_logbsize > XLOG_MAX_RECORD_BSIZE ||
	     !is_power_of_2(mp->m_logbsize))) {
450 451
		xfs_warn(mp,
			"invalid logbufsize: %d [not 16k,32k,64k,128k or 256k]",
452
			mp->m_logbsize);
D
Dave Chinner 已提交
453
		return -EINVAL;
454 455 456 457 458
	}

	if (iosizelog) {
		if (iosizelog > XFS_MAX_IO_LOG ||
		    iosizelog < XFS_MIN_IO_LOG) {
459
			xfs_warn(mp, "invalid log iosize: %d [not %d-%d]",
460 461
				iosizelog, XFS_MIN_IO_LOG,
				XFS_MAX_IO_LOG);
D
Dave Chinner 已提交
462
			return -EINVAL;
463 464 465 466 467
		}

		mp->m_flags |= XFS_MOUNT_DFLT_IOSIZE;
		mp->m_readio_log = iosizelog;
		mp->m_writeio_log = iosizelog;
468 469 470 471 472 473
	}

	return 0;
}

struct proc_xfs_info {
D
Dave Chinner 已提交
474 475
	uint64_t	flag;
	char		*str;
476 477 478 479 480 481 482 483 484
};

STATIC int
xfs_showargs(
	struct xfs_mount	*mp,
	struct seq_file		*m)
{
	static struct proc_xfs_info xfs_info_set[] = {
		/* the few simple ones we can get from the mount struct */
485 486 487 488 489 490 491 492 493 494 495 496
		{ XFS_MOUNT_IKEEP,		",ikeep" },
		{ XFS_MOUNT_WSYNC,		",wsync" },
		{ XFS_MOUNT_NOALIGN,		",noalign" },
		{ XFS_MOUNT_SWALLOC,		",swalloc" },
		{ XFS_MOUNT_NOUUID,		",nouuid" },
		{ XFS_MOUNT_NORECOVERY,		",norecovery" },
		{ XFS_MOUNT_ATTR2,		",attr2" },
		{ XFS_MOUNT_FILESTREAMS,	",filestreams" },
		{ XFS_MOUNT_GRPID,		",grpid" },
		{ XFS_MOUNT_DISCARD,		",discard" },
		{ XFS_MOUNT_SMALL_INUMS,	",inode32" },
		{ XFS_MOUNT_DAX,		",dax" },
497 498 499 500
		{ 0, NULL }
	};
	static struct proc_xfs_info xfs_info_unset[] = {
		/* the few simple ones we can get from the mount struct */
501 502 503
		{ XFS_MOUNT_COMPAT_IOSIZE,	",largeio" },
		{ XFS_MOUNT_BARRIER,		",nobarrier" },
		{ XFS_MOUNT_SMALL_INUMS,	",inode64" },
504 505 506 507 508 509 510 511 512 513 514 515 516 517
		{ 0, NULL }
	};
	struct proc_xfs_info	*xfs_infop;

	for (xfs_infop = xfs_info_set; xfs_infop->flag; xfs_infop++) {
		if (mp->m_flags & xfs_infop->flag)
			seq_puts(m, xfs_infop->str);
	}
	for (xfs_infop = xfs_info_unset; xfs_infop->flag; xfs_infop++) {
		if (!(mp->m_flags & xfs_infop->flag))
			seq_puts(m, xfs_infop->str);
	}

	if (mp->m_flags & XFS_MOUNT_DFLT_IOSIZE)
518
		seq_printf(m, ",allocsize=%dk",
519 520 521
				(int)(1 << mp->m_writeio_log) >> 10);

	if (mp->m_logbufs > 0)
522
		seq_printf(m, ",logbufs=%d", mp->m_logbufs);
523
	if (mp->m_logbsize > 0)
524
		seq_printf(m, ",logbsize=%dk", mp->m_logbsize >> 10);
525 526

	if (mp->m_logname)
527
		seq_show_option(m, "logdev", mp->m_logname);
528
	if (mp->m_rtname)
529
		seq_show_option(m, "rtdev", mp->m_rtname);
530 531

	if (mp->m_dalign > 0)
532
		seq_printf(m, ",sunit=%d",
533 534
				(int)XFS_FSB_TO_BB(mp, mp->m_dalign));
	if (mp->m_swidth > 0)
535
		seq_printf(m, ",swidth=%d",
536 537 538
				(int)XFS_FSB_TO_BB(mp, mp->m_swidth));

	if (mp->m_qflags & (XFS_UQUOTA_ACCT|XFS_UQUOTA_ENFD))
539
		seq_puts(m, ",usrquota");
540
	else if (mp->m_qflags & XFS_UQUOTA_ACCT)
541
		seq_puts(m, ",uqnoenforce");
542

543
	if (mp->m_qflags & XFS_PQUOTA_ACCT) {
544
		if (mp->m_qflags & XFS_PQUOTA_ENFD)
545
			seq_puts(m, ",prjquota");
546
		else
547
			seq_puts(m, ",pqnoenforce");
548 549
	}
	if (mp->m_qflags & XFS_GQUOTA_ACCT) {
550
		if (mp->m_qflags & XFS_GQUOTA_ENFD)
551
			seq_puts(m, ",grpquota");
552
		else
553
			seq_puts(m, ",gqnoenforce");
554
	}
555 556

	if (!(mp->m_qflags & XFS_ALL_QUOTA_ACCT))
557
		seq_puts(m, ",noquota");
558 559 560

	return 0;
}
561
static uint64_t
L
Linus Torvalds 已提交
562 563 564 565 566 567 568 569
xfs_max_file_offset(
	unsigned int		blockshift)
{
	unsigned int		pagefactor = 1;
	unsigned int		bitshift = BITS_PER_LONG - 1;

	/* Figure out maximum filesize, on Linux this can depend on
	 * the filesystem blocksize (on 32 bit platforms).
C
Christoph Hellwig 已提交
570
	 * __block_write_begin does this in an [unsigned] long...
571
	 *      page->index << (PAGE_SHIFT - bbits)
L
Linus Torvalds 已提交
572 573
	 * So, for page sized blocks (4K on 32 bit platforms),
	 * this wraps at around 8Tb (hence MAX_LFS_FILESIZE which is
574
	 *      (((u64)PAGE_SIZE << (BITS_PER_LONG-1))-1)
L
Linus Torvalds 已提交
575 576 577 578 579 580 581 582
	 * but for smaller blocksizes it is less (bbits = log2 bsize).
	 * Note1: get_block_t takes a long (implicit cast from above)
	 * Note2: The Large Block Device (LBD and HAVE_SECTOR_T) patch
	 * can optionally convert the [unsigned] long from above into
	 * an [unsigned] long long.
	 */

#if BITS_PER_LONG == 32
583
# if defined(CONFIG_LBDAF)
L
Linus Torvalds 已提交
584
	ASSERT(sizeof(sector_t) == 8);
585
	pagefactor = PAGE_SIZE;
L
Linus Torvalds 已提交
586 587
	bitshift = BITS_PER_LONG;
# else
588
	pagefactor = PAGE_SIZE >> (PAGE_SHIFT - blockshift);
L
Linus Torvalds 已提交
589 590 591
# endif
#endif

592
	return (((uint64_t)pagefactor) << bitshift) - 1;
L
Linus Torvalds 已提交
593 594
}

595
/*
596 597 598 599 600 601 602 603 604 605 606 607 608
 * Set parameters for inode allocation heuristics, taking into account
 * filesystem size and inode32/inode64 mount options; i.e. specifically
 * whether or not XFS_MOUNT_SMALL_INUMS is set.
 *
 * Inode allocation patterns are altered only if inode32 is requested
 * (XFS_MOUNT_SMALL_INUMS), and the filesystem is sufficiently large.
 * If altered, XFS_MOUNT_32BITINODES is set as well.
 *
 * An agcount independent of that in the mount structure is provided
 * because in the growfs case, mp->m_sb.sb_agcount is not yet updated
 * to the potentially higher ag count.
 *
 * Returns the maximum AG index which may contain inodes.
609
 */
610
xfs_agnumber_t
611 612 613
xfs_set_inode_alloc(
	struct xfs_mount *mp,
	xfs_agnumber_t	agcount)
614
{
615
	xfs_agnumber_t	index;
616
	xfs_agnumber_t	maxagi = 0;
617 618
	xfs_sb_t	*sbp = &mp->m_sb;
	xfs_agnumber_t	max_metadata;
E
Eric Sandeen 已提交
619 620
	xfs_agino_t	agino;
	xfs_ino_t	ino;
621

622 623 624
	/*
	 * Calculate how much should be reserved for inodes to meet
	 * the max inode percentage.  Used only for inode32.
625 626
	 */
	if (mp->m_maxicount) {
627
		uint64_t	icount;
628 629 630 631 632 633 634

		icount = sbp->sb_dblocks * sbp->sb_imax_pct;
		do_div(icount, 100);
		icount += sbp->sb_agblocks - 1;
		do_div(icount, sbp->sb_agblocks);
		max_metadata = icount;
	} else {
635
		max_metadata = agcount;
636 637
	}

638
	/* Get the last possible inode in the filesystem */
E
Eric Sandeen 已提交
639
	agino =	XFS_OFFBNO_TO_AGINO(mp, sbp->sb_agblocks - 1, 0);
640 641 642 643 644 645 646 647 648 649 650
	ino = XFS_AGINO_TO_INO(mp, agcount - 1, agino);

	/*
	 * If user asked for no more than 32-bit inodes, and the fs is
	 * sufficiently large, set XFS_MOUNT_32BITINODES if we must alter
	 * the allocator to accommodate the request.
	 */
	if ((mp->m_flags & XFS_MOUNT_SMALL_INUMS) && ino > XFS_MAXINUMBER_32)
		mp->m_flags |= XFS_MOUNT_32BITINODES;
	else
		mp->m_flags &= ~XFS_MOUNT_32BITINODES;
E
Eric Sandeen 已提交
651

652
	for (index = 0; index < agcount; index++) {
653
		struct xfs_perag	*pag;
654

655
		ino = XFS_AGINO_TO_INO(mp, index, agino);
656 657 658

		pag = xfs_perag_get(mp, index);

659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674
		if (mp->m_flags & XFS_MOUNT_32BITINODES) {
			if (ino > XFS_MAXINUMBER_32) {
				pag->pagi_inodeok = 0;
				pag->pagf_metadata = 0;
			} else {
				pag->pagi_inodeok = 1;
				maxagi++;
				if (index < max_metadata)
					pag->pagf_metadata = 1;
				else
					pag->pagf_metadata = 0;
			}
		} else {
			pag->pagi_inodeok = 1;
			pag->pagf_metadata = 0;
		}
675 676 677 678

		xfs_perag_put(pag);
	}

679
	return (mp->m_flags & XFS_MOUNT_32BITINODES) ? maxagi : agcount;
680 681
}

H
Hannes Eder 已提交
682
STATIC int
L
Linus Torvalds 已提交
683 684 685 686 687 688 689
xfs_blkdev_get(
	xfs_mount_t		*mp,
	const char		*name,
	struct block_device	**bdevp)
{
	int			error = 0;

690 691
	*bdevp = blkdev_get_by_path(name, FMODE_READ|FMODE_WRITE|FMODE_EXCL,
				    mp);
L
Linus Torvalds 已提交
692 693
	if (IS_ERR(*bdevp)) {
		error = PTR_ERR(*bdevp);
694
		xfs_warn(mp, "Invalid device [%s], error=%d", name, error);
L
Linus Torvalds 已提交
695 696
	}

D
Dave Chinner 已提交
697
	return error;
L
Linus Torvalds 已提交
698 699
}

H
Hannes Eder 已提交
700
STATIC void
L
Linus Torvalds 已提交
701 702 703 704
xfs_blkdev_put(
	struct block_device	*bdev)
{
	if (bdev)
705
		blkdev_put(bdev, FMODE_READ|FMODE_WRITE|FMODE_EXCL);
L
Linus Torvalds 已提交
706 707
}

708 709 710 711
/*
 * Issue a flush to the block device backing @buftarg.  The result of the
 * flush request is not checked.
 */
void
xfs_blkdev_issue_flush(
	xfs_buftarg_t		*buftarg)
{
	struct block_device	*bdev = buftarg->bt_bdev;

	blkdev_issue_flush(bdev, GFP_NOFS, NULL);
}
L
Linus Torvalds 已提交
714

715 716 717 718
STATIC void
xfs_close_devices(
	struct xfs_mount	*mp)
{
719 720
	struct dax_device *dax_ddev = mp->m_ddev_targp->bt_daxdev;

721
	if (mp->m_logdev_targp && mp->m_logdev_targp != mp->m_ddev_targp) {
722
		struct block_device *logdev = mp->m_logdev_targp->bt_bdev;
723 724
		struct dax_device *dax_logdev = mp->m_logdev_targp->bt_daxdev;

725
		xfs_free_buftarg(mp->m_logdev_targp);
726
		xfs_blkdev_put(logdev);
727
		fs_put_dax(dax_logdev);
728 729
	}
	if (mp->m_rtdev_targp) {
730
		struct block_device *rtdev = mp->m_rtdev_targp->bt_bdev;
731 732
		struct dax_device *dax_rtdev = mp->m_rtdev_targp->bt_daxdev;

733
		xfs_free_buftarg(mp->m_rtdev_targp);
734
		xfs_blkdev_put(rtdev);
735
		fs_put_dax(dax_rtdev);
736
	}
737
	xfs_free_buftarg(mp->m_ddev_targp);
738
	fs_put_dax(dax_ddev);
739 740 741 742 743 744 745 746 747 748 749 750 751 752
}

/*
 * The file system configurations are:
 *	(1) device (partition) with data and internal log
 *	(2) logical volume with data and log subvolumes.
 *	(3) logical volume with data, log, and realtime subvolumes.
 *
 * We only have to handle opening the log and realtime volumes here if
 * they are present.  The data subvolume has already been opened by
 * get_sb_bdev() and is stored in sb->s_bdev.
 */
STATIC int
xfs_open_devices(
753
	struct xfs_mount	*mp)
754 755
{
	struct block_device	*ddev = mp->m_super->s_bdev;
756 757
	struct dax_device	*dax_ddev = fs_dax_get_by_bdev(ddev);
	struct dax_device	*dax_logdev = NULL, *dax_rtdev = NULL;
758 759 760 761 762 763
	struct block_device	*logdev = NULL, *rtdev = NULL;
	int			error;

	/*
	 * Open real time and log devices - order is important.
	 */
764 765
	if (mp->m_logname) {
		error = xfs_blkdev_get(mp, mp->m_logname, &logdev);
766 767
		if (error)
			goto out;
768
		dax_logdev = fs_dax_get_by_bdev(logdev);
769 770
	}

771 772
	if (mp->m_rtname) {
		error = xfs_blkdev_get(mp, mp->m_rtname, &rtdev);
773 774 775 776
		if (error)
			goto out_close_logdev;

		if (rtdev == ddev || rtdev == logdev) {
777 778
			xfs_warn(mp,
	"Cannot mount filesystem with identical rtdev and ddev/logdev.");
D
Dave Chinner 已提交
779
			error = -EINVAL;
780 781
			goto out_close_rtdev;
		}
782
		dax_rtdev = fs_dax_get_by_bdev(rtdev);
783 784 785 786 787
	}

	/*
	 * Setup xfs_mount buffer target pointers
	 */
D
Dave Chinner 已提交
788
	error = -ENOMEM;
789
	mp->m_ddev_targp = xfs_alloc_buftarg(mp, ddev, dax_ddev);
790 791 792 793
	if (!mp->m_ddev_targp)
		goto out_close_rtdev;

	if (rtdev) {
794
		mp->m_rtdev_targp = xfs_alloc_buftarg(mp, rtdev, dax_rtdev);
795 796 797 798 799
		if (!mp->m_rtdev_targp)
			goto out_free_ddev_targ;
	}

	if (logdev && logdev != ddev) {
800
		mp->m_logdev_targp = xfs_alloc_buftarg(mp, logdev, dax_logdev);
801 802 803 804 805 806 807 808 809 810
		if (!mp->m_logdev_targp)
			goto out_free_rtdev_targ;
	} else {
		mp->m_logdev_targp = mp->m_ddev_targp;
	}

	return 0;

 out_free_rtdev_targ:
	if (mp->m_rtdev_targp)
811
		xfs_free_buftarg(mp->m_rtdev_targp);
812
 out_free_ddev_targ:
813
	xfs_free_buftarg(mp->m_ddev_targp);
814
 out_close_rtdev:
815
	xfs_blkdev_put(rtdev);
816
	fs_put_dax(dax_rtdev);
817
 out_close_logdev:
818
	if (logdev && logdev != ddev) {
819
		xfs_blkdev_put(logdev);
820 821
		fs_put_dax(dax_logdev);
	}
822
 out:
823
	fs_put_dax(dax_ddev);
824 825 826
	return error;
}

827 828 829 830 831 832 833 834
/*
 * Setup xfs_mount buffer target pointers based on superblock
 */
STATIC int
xfs_setup_devices(
	struct xfs_mount	*mp)
{
	int			error;
835

836
	error = xfs_setsize_buftarg(mp->m_ddev_targp, mp->m_sb.sb_sectsize);
837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858
	if (error)
		return error;

	if (mp->m_logdev_targp && mp->m_logdev_targp != mp->m_ddev_targp) {
		unsigned int	log_sector_size = BBSIZE;

		if (xfs_sb_version_hassector(&mp->m_sb))
			log_sector_size = mp->m_sb.sb_logsectsize;
		error = xfs_setsize_buftarg(mp->m_logdev_targp,
					    log_sector_size);
		if (error)
			return error;
	}
	if (mp->m_rtdev_targp) {
		error = xfs_setsize_buftarg(mp->m_rtdev_targp,
					    mp->m_sb.sb_sectsize);
		if (error)
			return error;
	}

	return 0;
}
859

860 861 862 863
STATIC int
xfs_init_mount_workqueues(
	struct xfs_mount	*mp)
{
864
	mp->m_buf_workqueue = alloc_workqueue("xfs-buf/%s",
865
			WQ_MEM_RECLAIM|WQ_FREEZABLE, 1, mp->m_fsname);
866 867 868
	if (!mp->m_buf_workqueue)
		goto out;

869
	mp->m_data_workqueue = alloc_workqueue("xfs-data/%s",
870
			WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
871
	if (!mp->m_data_workqueue)
872
		goto out_destroy_buf;
873 874

	mp->m_unwritten_workqueue = alloc_workqueue("xfs-conv/%s",
875
			WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
876 877 878
	if (!mp->m_unwritten_workqueue)
		goto out_destroy_data_iodone_queue;

879
	mp->m_cil_workqueue = alloc_workqueue("xfs-cil/%s",
880
			WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
881 882
	if (!mp->m_cil_workqueue)
		goto out_destroy_unwritten;
D
Dave Chinner 已提交
883 884

	mp->m_reclaim_workqueue = alloc_workqueue("xfs-reclaim/%s",
885
			WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
D
Dave Chinner 已提交
886 887 888 889
	if (!mp->m_reclaim_workqueue)
		goto out_destroy_cil;

	mp->m_log_workqueue = alloc_workqueue("xfs-log/%s",
890 891
			WQ_MEM_RECLAIM|WQ_FREEZABLE|WQ_HIGHPRI, 0,
			mp->m_fsname);
D
Dave Chinner 已提交
892 893 894
	if (!mp->m_log_workqueue)
		goto out_destroy_reclaim;

895
	mp->m_eofblocks_workqueue = alloc_workqueue("xfs-eofblocks/%s",
896
			WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
897 898 899
	if (!mp->m_eofblocks_workqueue)
		goto out_destroy_log;

900 901 902 903 904
	mp->m_sync_workqueue = alloc_workqueue("xfs-sync/%s", WQ_FREEZABLE, 0,
					       mp->m_fsname);
	if (!mp->m_sync_workqueue)
		goto out_destroy_eofb;

905 906
	return 0;

907 908
out_destroy_eofb:
	destroy_workqueue(mp->m_eofblocks_workqueue);
909 910
out_destroy_log:
	destroy_workqueue(mp->m_log_workqueue);
D
Dave Chinner 已提交
911 912 913 914
out_destroy_reclaim:
	destroy_workqueue(mp->m_reclaim_workqueue);
out_destroy_cil:
	destroy_workqueue(mp->m_cil_workqueue);
915 916
out_destroy_unwritten:
	destroy_workqueue(mp->m_unwritten_workqueue);
917 918
out_destroy_data_iodone_queue:
	destroy_workqueue(mp->m_data_workqueue);
919 920
out_destroy_buf:
	destroy_workqueue(mp->m_buf_workqueue);
921 922 923 924 925 926 927 928
out:
	return -ENOMEM;
}

/*
 * Destroy all per-mount workqueues created by xfs_init_mount_workqueues().
 */
STATIC void
xfs_destroy_mount_workqueues(
	struct xfs_mount	*mp)
{
	/* Listed in the order in which they are destroyed. */
	struct workqueue_struct	*queues[] = {
		mp->m_sync_workqueue,
		mp->m_eofblocks_workqueue,
		mp->m_log_workqueue,
		mp->m_reclaim_workqueue,
		mp->m_cil_workqueue,
		mp->m_data_workqueue,
		mp->m_unwritten_workqueue,
		mp->m_buf_workqueue,
	};
	unsigned int		i;

	for (i = 0; i < ARRAY_SIZE(queues); i++)
		destroy_workqueue(queues[i]);
}

D
Dave Chinner 已提交
939 940 941 942 943 944 945 946 947 948 949 950 951
/*
 * Flush all dirty data to disk. Must not be called while holding an XFS_ILOCK
 * or a page lock. We use sync_inodes_sb() here to ensure we block while waiting
 * for IO to complete so that we effectively throttle multiple callers to the
 * rate at which IO is completing.
 *
 * If s_umount cannot be taken for reading without blocking, nothing is
 * flushed.
 */
void
xfs_flush_inodes(
	struct xfs_mount	*mp)
{
	struct super_block	*sb = mp->m_super;

	if (!down_read_trylock(&sb->s_umount))
		return;

	sync_inodes_sb(sb);
	up_read(&sb->s_umount);
}

957
/* Catch misguided souls that try to use this interface on XFS */
L
Linus Torvalds 已提交
958
STATIC struct inode *
959
xfs_fs_alloc_inode(
L
Linus Torvalds 已提交
960 961
	struct super_block	*sb)
{
962
	BUG();
963
	return NULL;
L
Linus Torvalds 已提交
964 965
}

966
/*
967
 * Now that the generic code is guaranteed not to be accessing
D
Dave Chinner 已提交
968
 * the linux inode, we can inactivate and reclaim the inode.
969
 */
L
Linus Torvalds 已提交
970
STATIC void
971
xfs_fs_destroy_inode(
C
Christoph Hellwig 已提交
972
	struct inode		*inode)
L
Linus Torvalds 已提交
973
{
C
Christoph Hellwig 已提交
974 975
	struct xfs_inode	*ip = XFS_I(inode);

C
Christoph Hellwig 已提交
976
	trace_xfs_destroy_inode(ip);
977

978
	ASSERT(!rwsem_is_locked(&inode->i_rwsem));
D
Dave Chinner 已提交
979 980 981 982
	XFS_STATS_INC(ip->i_mount, vn_rele);
	XFS_STATS_INC(ip->i_mount, vn_remove);

	xfs_inactive(ip);
C
Christoph Hellwig 已提交
983 984

	ASSERT(XFS_FORCED_SHUTDOWN(ip->i_mount) || ip->i_delayed_blks == 0);
D
Dave Chinner 已提交
985
	XFS_STATS_INC(ip->i_mount, vn_reclaim);
C
Christoph Hellwig 已提交
986 987 988 989 990 991 992 993

	/*
	 * We should never get here with one of the reclaim flags already set.
	 */
	ASSERT_ALWAYS(!xfs_iflags_test(ip, XFS_IRECLAIMABLE));
	ASSERT_ALWAYS(!xfs_iflags_test(ip, XFS_IRECLAIM));

	/*
994 995 996 997 998
	 * We always use background reclaim here because even if the
	 * inode is clean, it still may be under IO and hence we have
	 * to take the flush lock. The background reclaim path handles
	 * this more efficiently than we can here, so simply let background
	 * reclaim tear down all inodes.
C
Christoph Hellwig 已提交
999
	 */
1000
	xfs_inode_set_reclaim_tag(ip);
L
Linus Torvalds 已提交
1001 1002
}

1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024
/*
 * ->dirty_inode: log the inode timestamps in a transaction.
 *
 * Nothing is done unless the superblock has SB_LAZYTIME set, the
 * notification is exactly I_DIRTY_SYNC and the inode state carries
 * I_DIRTY_TIME.  If the transaction cannot be allocated the update is
 * skipped; the result of the commit is not checked.
 */
static void
xfs_fs_dirty_inode(
	struct inode			*inode,
	int				flag)
{
	struct xfs_inode		*ip;
	struct xfs_mount		*mp;
	struct xfs_trans		*tp;

	if (!(inode->i_sb->s_flags & SB_LAZYTIME) ||
	    flag != I_DIRTY_SYNC ||
	    !(inode->i_state & I_DIRTY_TIME))
		return;

	ip = XFS_I(inode);
	mp = ip->i_mount;

	if (xfs_trans_alloc(mp, &M_RES(mp)->tr_fsyncts, 0, 0, 0, &tp))
		return;

	/* Join the inode with its ILOCK flag and log only the timestamps. */
	xfs_ilock(ip, XFS_ILOCK_EXCL);
	xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL);
	xfs_trans_log_inode(tp, ip, XFS_ILOG_TIMESTAMP);
	xfs_trans_commit(tp);
}

1025 1026 1027 1028
/*
 * Slab object creation initialisation for the XFS inode.
 * This covers only the idempotent fields in the XFS inode;
 * all other fields need to be initialised on allocation
1029
 * from the slab. This avoids the need to repeatedly initialise
1030 1031 1032
 * fields in the xfs inode that left in the initialise state
 * when freeing the inode.
 */
1033 1034
STATIC void
xfs_fs_inode_init_once(
1035 1036 1037 1038 1039
	void			*inode)
{
	struct xfs_inode	*ip = inode;

	memset(ip, 0, sizeof(struct xfs_inode));
1040 1041 1042 1043 1044

	/* vfs inode */
	inode_init_once(VFS_I(ip));

	/* xfs inode */
1045 1046 1047
	atomic_set(&ip->i_pincount, 0);
	spin_lock_init(&ip->i_flags_lock);

D
Dave Chinner 已提交
1048 1049
	mrlock_init(&ip->i_mmaplock, MRLOCK_ALLOW_EQUAL_PRI|MRLOCK_BARRIER,
		     "xfsino", ip->i_ino);
1050 1051 1052 1053
	mrlock_init(&ip->i_lock, MRLOCK_ALLOW_EQUAL_PRI|MRLOCK_BARRIER,
		     "xfsino", ip->i_ino);
}

1054 1055 1056 1057 1058 1059 1060 1061 1062 1063 1064 1065 1066
/*
 * We do an unlocked check for XFS_IDONTCACHE here because we are already
 * serialised against cache hits here via the inode->i_lock and igrab() in
 * xfs_iget_cache_hit(). Hence a lookup that might clear this flag will not be
 * racing with us, and it avoids needing to grab a spinlock here for every inode
 * we drop the final reference on.
 */
STATIC int
xfs_fs_drop_inode(
	struct inode		*inode)
{
	struct xfs_inode	*ip = XFS_I(inode);

1067 1068 1069 1070 1071 1072 1073 1074 1075 1076
	/*
	 * If this unlinked inode is in the middle of recovery, don't
	 * drop the inode just yet; log recovery will take care of
	 * that.  See the comment for this inode flag.
	 */
	if (ip->i_flags & XFS_IRECOVERY) {
		ASSERT(ip->i_mount->m_log->l_flags & XLOG_RECOVERY_NEEDED);
		return 0;
	}

1077 1078 1079
	return generic_drop_inode(inode) || (ip->i_flags & XFS_IDONTCACHE);
}

1080 1081 1082 1083 1084 1085 1086 1087 1088
/*
 * Release the three name strings hanging off the mount structure
 * (m_fsname, m_rtname and m_logname).  The pointers themselves are left
 * untouched.
 */
STATIC void
xfs_free_fsname(
	struct xfs_mount	*mp)
{
	kfree(mp->m_fsname);
	kfree(mp->m_rtname);
	kfree(mp->m_logname);
}

L
Linus Torvalds 已提交
1089
STATIC int
C
Christoph Hellwig 已提交
1090
xfs_fs_sync_fs(
L
Linus Torvalds 已提交
1091 1092 1093
	struct super_block	*sb,
	int			wait)
{
1094
	struct xfs_mount	*mp = XFS_M(sb);
L
Linus Torvalds 已提交
1095

1096
	/*
C
Christoph Hellwig 已提交
1097
	 * Doing anything during the async pass would be counterproductive.
1098
	 */
C
Christoph Hellwig 已提交
1099
	if (!wait)
C
Christoph Hellwig 已提交
1100 1101
		return 0;

D
Dave Chinner 已提交
1102
	xfs_log_force(mp, XFS_LOG_SYNC);
C
Christoph Hellwig 已提交
1103
	if (laptop_mode) {
L
Linus Torvalds 已提交
1104 1105
		/*
		 * The disk must be active because we're syncing.
1106
		 * We schedule log work now (now that the disk is
L
Linus Torvalds 已提交
1107 1108
		 * active) instead of later (when it might not be).
		 */
1109
		flush_delayed_work(&mp->m_log->l_work);
L
Linus Torvalds 已提交
1110 1111
	}

C
Christoph Hellwig 已提交
1112
	return 0;
L
Linus Torvalds 已提交
1113 1114 1115
}

STATIC int
1116
xfs_fs_statfs(
1117
	struct dentry		*dentry,
L
Linus Torvalds 已提交
1118 1119
	struct kstatfs		*statp)
{
C
Christoph Hellwig 已提交
1120 1121
	struct xfs_mount	*mp = XFS_M(dentry->d_sb);
	xfs_sb_t		*sbp = &mp->m_sb;
1122
	struct xfs_inode	*ip = XFS_I(d_inode(dentry));
1123 1124 1125 1126
	uint64_t		fakeinos, id;
	uint64_t		icount;
	uint64_t		ifree;
	uint64_t		fdblocks;
C
Christoph Hellwig 已提交
1127
	xfs_extlen_t		lsize;
1128
	int64_t			ffree;
C
Christoph Hellwig 已提交
1129 1130 1131 1132 1133 1134 1135 1136

	statp->f_type = XFS_SB_MAGIC;
	statp->f_namelen = MAXNAMELEN - 1;

	id = huge_encode_dev(mp->m_ddev_targp->bt_dev);
	statp->f_fsid.val[0] = (u32)id;
	statp->f_fsid.val[1] = (u32)(id >> 32);

1137
	icount = percpu_counter_sum(&mp->m_icount);
1138
	ifree = percpu_counter_sum(&mp->m_ifree);
1139
	fdblocks = percpu_counter_sum(&mp->m_fdblocks);
C
Christoph Hellwig 已提交
1140 1141 1142 1143 1144

	spin_lock(&mp->m_sb_lock);
	statp->f_bsize = sbp->sb_blocksize;
	lsize = sbp->sb_logstart ? sbp->sb_logblocks : 0;
	statp->f_blocks = sbp->sb_dblocks - lsize;
1145 1146
	spin_unlock(&mp->m_sb_lock);

1147
	statp->f_bfree = fdblocks - mp->m_alloc_set_aside;
1148 1149
	statp->f_bavail = statp->f_bfree;

C
Christoph Hellwig 已提交
1150
	fakeinos = statp->f_bfree << sbp->sb_inopblog;
1151
	statp->f_files = MIN(icount + fakeinos, (uint64_t)XFS_MAXINUMBER);
C
Christoph Hellwig 已提交
1152
	if (mp->m_maxicount)
C
Christoph Hellwig 已提交
1153 1154 1155
		statp->f_files = min_t(typeof(statp->f_files),
					statp->f_files,
					mp->m_maxicount);
1156

1157 1158 1159 1160 1161
	/* If sb_icount overshot maxicount, report actual allocation */
	statp->f_files = max_t(typeof(statp->f_files),
					statp->f_files,
					sbp->sb_icount);

1162
	/* make sure statp->f_ffree does not underflow */
1163
	ffree = statp->f_files - (icount - ifree);
1164
	statp->f_ffree = max_t(int64_t, ffree, 0);
1165

C
Christoph Hellwig 已提交
1166

1167
	if ((ip->i_d.di_flags & XFS_DIFLAG_PROJINHERIT) &&
1168 1169
	    ((mp->m_qflags & (XFS_PQUOTA_ACCT|XFS_PQUOTA_ENFD))) ==
			      (XFS_PQUOTA_ACCT|XFS_PQUOTA_ENFD))
C
Christoph Hellwig 已提交
1170
		xfs_qm_statvfs(ip, statp);
1171 1172 1173 1174 1175 1176 1177 1178

	if (XFS_IS_REALTIME_MOUNT(mp) &&
	    (ip->i_d.di_flags & (XFS_DIFLAG_RTINHERIT | XFS_DIFLAG_REALTIME))) {
		statp->f_blocks = sbp->sb_rblocks;
		statp->f_bavail = statp->f_bfree =
			sbp->sb_frextents * sbp->sb_rextsize;
	}

C
Christoph Hellwig 已提交
1179
	return 0;
L
Linus Torvalds 已提交
1180 1181
}

E
Eric Sandeen 已提交
1182 1183 1184
STATIC void
xfs_save_resvblks(struct xfs_mount *mp)
{
1185
	uint64_t resblks = 0;
E
Eric Sandeen 已提交
1186 1187 1188 1189 1190 1191 1192 1193

	mp->m_resblks_save = mp->m_resblks;
	xfs_reserve_blocks(mp, &resblks, NULL);
}

STATIC void
xfs_restore_resvblks(struct xfs_mount *mp)
{
1194
	uint64_t resblks;
E
Eric Sandeen 已提交
1195 1196 1197 1198 1199 1200 1201 1202 1203 1204

	if (mp->m_resblks_save) {
		resblks = mp->m_resblks_save;
		mp->m_resblks_save = 0;
	} else
		resblks = xfs_default_resblks(mp);

	xfs_reserve_blocks(mp, &resblks, NULL);
}

1205 1206 1207 1208 1209
/*
 * Trigger writeback of all the dirty metadata in the file system.
 *
 * This ensures that the metadata is written to their location on disk rather
 * than just existing in transactions in the log. This means after a quiesce
1210 1211
 * there is no log replay required to write the inodes to disk - this is the
 * primary difference between a sync and a quiesce.
1212
 *
1213 1214
 * Note: xfs_log_quiesce() stops background log work - the callers must ensure
 * it is started again when appropriate.
1215
 */
1216
void
1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238
xfs_quiesce_attr(
	struct xfs_mount	*mp)
{
	int	error = 0;

	/* wait for all modifications to complete */
	while (atomic_read(&mp->m_active_trans) > 0)
		delay(100);

	/* force the log to unpin objects from the now complete transactions */
	xfs_log_force(mp, XFS_LOG_SYNC);

	/* reclaim inodes to do any IO before the freeze completes */
	xfs_reclaim_inodes(mp, 0);
	xfs_reclaim_inodes(mp, SYNC_WAIT);

	/* Push the superblock and write an unmount record */
	error = xfs_log_sbcount(mp);
	if (error)
		xfs_warn(mp, "xfs_attr_quiesce: failed to log sb changes. "
				"Frozen image may not be consistent.");
	/*
1239 1240
	 * Just warn here till VFS can correctly support
	 * read-only remount without racing.
1241
	 */
1242
	WARN_ON(atomic_read(&mp->m_active_trans) != 0);
1243

1244
	xfs_log_quiesce(mp);
1245 1246
}

E
Eric Sandeen 已提交
1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261
STATIC int
xfs_test_remount_options(
	struct super_block	*sb,
	char			*options)
{
	int			error = 0;
	struct xfs_mount	*tmp_mp;

	tmp_mp = kmem_zalloc(sizeof(*tmp_mp), KM_MAYFAIL);
	if (!tmp_mp)
		return -ENOMEM;

	tmp_mp->m_super = sb;
	error = xfs_parseargs(tmp_mp, options);
	xfs_free_fsname(tmp_mp);
1262
	kmem_free(tmp_mp);
E
Eric Sandeen 已提交
1263 1264 1265 1266

	return error;
}

L
Linus Torvalds 已提交
1267
STATIC int
1268
xfs_fs_remount(
L
Linus Torvalds 已提交
1269 1270 1271 1272
	struct super_block	*sb,
	int			*flags,
	char			*options)
{
1273
	struct xfs_mount	*mp = XFS_M(sb);
1274
	xfs_sb_t		*sbp = &mp->m_sb;
1275 1276
	substring_t		args[MAX_OPT_ARGS];
	char			*p;
1277
	int			error;
L
Linus Torvalds 已提交
1278

E
Eric Sandeen 已提交
1279
	/* First, check for complete junk; i.e. invalid options */
1280
	error = xfs_test_remount_options(sb, options);
E
Eric Sandeen 已提交
1281 1282 1283
	if (error)
		return error;

1284
	sync_filesystem(sb);
1285 1286
	while ((p = strsep(&options, ",")) != NULL) {
		int token;
1287

1288 1289
		if (!*p)
			continue;
1290

1291 1292 1293
		token = match_token(p, tokens, args);
		switch (token) {
		case Opt_barrier:
1294
			xfs_warn(mp, "%s option is deprecated, ignoring.", p);
1295
			mp->m_flags |= XFS_MOUNT_BARRIER;
1296 1297
			break;
		case Opt_nobarrier:
1298
			xfs_warn(mp, "%s option is deprecated, ignoring.", p);
1299
			mp->m_flags &= ~XFS_MOUNT_BARRIER;
1300
			break;
1301
		case Opt_inode64:
1302 1303
			mp->m_flags &= ~XFS_MOUNT_SMALL_INUMS;
			mp->m_maxagi = xfs_set_inode_alloc(mp, sbp->sb_agcount);
1304
			break;
1305
		case Opt_inode32:
1306 1307
			mp->m_flags |= XFS_MOUNT_SMALL_INUMS;
			mp->m_maxagi = xfs_set_inode_alloc(mp, sbp->sb_agcount);
1308
			break;
1309
		default:
1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326
			/*
			 * Logically we would return an error here to prevent
			 * users from believing they might have changed
			 * mount options using remount which can't be changed.
			 *
			 * But unfortunately mount(8) adds all options from
			 * mtab and fstab to the mount arguments in some cases
			 * so we can't blindly reject options, but have to
			 * check for each specified option if it actually
			 * differs from the currently set option and only
			 * reject it if that's the case.
			 *
			 * Until that is implemented we return success for
			 * every remount request, and silently ignore all
			 * options that we can't actually change.
			 */
#if 0
1327
			xfs_info(mp,
1328
		"mount option \"%s\" not supported for remount", p);
1329
			return -EINVAL;
1330
#else
1331
			break;
1332
#endif
1333
		}
1334 1335
	}

1336
	/* ro -> rw */
1337
	if ((mp->m_flags & XFS_MOUNT_RDONLY) && !(*flags & SB_RDONLY)) {
1338 1339 1340 1341 1342 1343
		if (mp->m_flags & XFS_MOUNT_NORECOVERY) {
			xfs_warn(mp,
		"ro->rw transition prohibited on norecovery mount");
			return -EINVAL;
		}

1344 1345 1346 1347 1348 1349 1350 1351 1352 1353
		if (XFS_SB_VERSION_NUM(sbp) == XFS_SB_VERSION_5 &&
		    xfs_sb_has_ro_compat_feature(sbp,
					XFS_SB_FEAT_RO_COMPAT_UNKNOWN)) {
			xfs_warn(mp,
"ro->rw transition prohibited on unknown (0x%x) ro-compat filesystem",
				(sbp->sb_features_ro_compat &
					XFS_SB_FEAT_RO_COMPAT_UNKNOWN));
			return -EINVAL;
		}

1354
		mp->m_flags &= ~XFS_MOUNT_RDONLY;
1355 1356 1357 1358 1359

		/*
		 * If this is the first remount to writeable state we
		 * might have some superblock changes to update.
		 */
1360 1361
		if (mp->m_update_sb) {
			error = xfs_sync_sb(mp, false);
1362
			if (error) {
1363
				xfs_warn(mp, "failed to write sb changes");
1364 1365
				return error;
			}
1366
			mp->m_update_sb = false;
1367
		}
1368 1369 1370 1371 1372

		/*
		 * Fill out the reserve pool if it is empty. Use the stashed
		 * value if it is non-zero, otherwise go with the default.
		 */
E
Eric Sandeen 已提交
1373
		xfs_restore_resvblks(mp);
1374
		xfs_log_work_queue(mp);
1375 1376 1377 1378 1379 1380 1381 1382 1383

		/* Recover any CoW blocks that never got remapped. */
		error = xfs_reflink_recover_cow(mp);
		if (error) {
			xfs_err(mp,
	"Error %d recovering leftover CoW allocations.", error);
			xfs_force_shutdown(mp, SHUTDOWN_CORRUPT_INCORE);
			return error;
		}
1384
		xfs_icache_enable_reclaim(mp);
1385 1386 1387 1388 1389

		/* Create the per-AG metadata reservation pool .*/
		error = xfs_fs_reserve_ag_blocks(mp);
		if (error && error != -ENOSPC)
			return error;
1390 1391 1392
	}

	/* rw -> ro */
1393
	if (!(mp->m_flags & XFS_MOUNT_RDONLY) && (*flags & SB_RDONLY)) {
1394 1395 1396 1397 1398 1399
		/*
		 * Cancel background eofb scanning so it cannot race with the
		 * final log force+buftarg wait and deadlock the remount.
		 */
		xfs_icache_disable_reclaim(mp);

1400 1401 1402 1403 1404 1405 1406
		/* Get rid of any leftover CoW reservations... */
		error = xfs_icache_free_cowblocks(mp, NULL);
		if (error) {
			xfs_force_shutdown(mp, SHUTDOWN_CORRUPT_INCORE);
			return error;
		}

1407 1408 1409 1410 1411 1412 1413
		/* Free the per-AG metadata reservation pool. */
		error = xfs_fs_unreserve_ag_blocks(mp);
		if (error) {
			xfs_force_shutdown(mp, SHUTDOWN_CORRUPT_INCORE);
			return error;
		}

1414
		/*
D
Dave Chinner 已提交
1415 1416 1417 1418 1419
		 * Before we sync the metadata, we need to free up the reserve
		 * block pool so that the used block count in the superblock on
		 * disk is correct at the end of the remount. Stash the current
		 * reserve pool size so that if we get remounted rw, we can
		 * return it to the same size.
1420
		 */
E
Eric Sandeen 已提交
1421
		xfs_save_resvblks(mp);
1422

D
David Chinner 已提交
1423
		xfs_quiesce_attr(mp);
1424 1425 1426
		mp->m_flags |= XFS_MOUNT_RDONLY;
	}

1427
	return 0;
L
Linus Torvalds 已提交
1428 1429
}

C
Christoph Hellwig 已提交
1430 1431
/*
 * Second stage of a freeze. The data is already frozen so we only
1432 1433 1434
 * need to take care of the metadata. Once that's done sync the superblock
 * to the log to dirty it in case of a crash while frozen. This ensures that we
 * will recover the unlinked inode lists on the next mount.
C
Christoph Hellwig 已提交
1435
 */
1436 1437
STATIC int
xfs_fs_freeze(
L
Linus Torvalds 已提交
1438 1439
	struct super_block	*sb)
{
C
Christoph Hellwig 已提交
1440 1441
	struct xfs_mount	*mp = XFS_M(sb);

1442
	xfs_icache_disable_reclaim(mp);
E
Eric Sandeen 已提交
1443
	xfs_save_resvblks(mp);
D
David Chinner 已提交
1444
	xfs_quiesce_attr(mp);
1445
	return xfs_sync_sb(mp, true);
L
Linus Torvalds 已提交
1446 1447
}

E
Eric Sandeen 已提交
1448 1449 1450 1451 1452 1453 1454
/*
 * ->unfreeze_fs: bring back the reserve pool, requeue the log work and
 * re-enable inode cache reclaim.  Always returns 0.
 */
STATIC int
xfs_fs_unfreeze(
	struct super_block	*sb)
{
	struct xfs_mount	*mp = XFS_M(sb);

	xfs_restore_resvblks(mp);
	xfs_log_work_queue(mp);
	xfs_icache_enable_reclaim(mp);

	return 0;
}

L
Linus Torvalds 已提交
1460
STATIC int
1461
xfs_fs_show_options(
L
Linus Torvalds 已提交
1462
	struct seq_file		*m,
1463
	struct dentry		*root)
L
Linus Torvalds 已提交
1464
{
D
Dave Chinner 已提交
1465
	return xfs_showargs(XFS_M(root->d_sb), m);
L
Linus Torvalds 已提交
1466 1467
}

1468 1469 1470 1471 1472 1473 1474 1475 1476 1477
/*
 * This function fills in xfs_mount_t fields based on mount args.
 * Note: the superblock _has_ now been read in.
 */
STATIC int
xfs_finish_flags(
	struct xfs_mount	*mp)
{
	int			ronly = (mp->m_flags & XFS_MOUNT_RDONLY);

1478
	/* Fail a mount where the logbuf is smaller than the log stripe */
1479
	if (xfs_sb_version_haslogv2(&mp->m_sb)) {
1480 1481
		if (mp->m_logbsize <= 0 &&
		    mp->m_sb.sb_logsunit > XLOG_BIG_RECORD_BSIZE) {
1482
			mp->m_logbsize = mp->m_sb.sb_logsunit;
1483 1484
		} else if (mp->m_logbsize > 0 &&
			   mp->m_logbsize < mp->m_sb.sb_logsunit) {
1485 1486
			xfs_warn(mp,
		"logbuf size must be greater than or equal to log stripe size");
D
Dave Chinner 已提交
1487
			return -EINVAL;
1488 1489 1490
		}
	} else {
		/* Fail a mount if the logbuf is larger than 32K */
1491
		if (mp->m_logbsize > XLOG_BIG_RECORD_BSIZE) {
1492 1493
			xfs_warn(mp,
		"logbuf size for version 1 logs must be 16K or 32K");
D
Dave Chinner 已提交
1494
			return -EINVAL;
1495 1496 1497
		}
	}

1498 1499 1500 1501 1502
	/*
	 * V5 filesystems always use attr2 format for attributes.
	 */
	if (xfs_sb_version_hascrc(&mp->m_sb) &&
	    (mp->m_flags & XFS_MOUNT_NOATTR2)) {
1503 1504
		xfs_warn(mp, "Cannot mount a V5 filesystem as noattr2. "
			     "attr2 is always enabled for V5 filesystems.");
D
Dave Chinner 已提交
1505
		return -EINVAL;
1506 1507
	}

1508 1509 1510 1511 1512
	/*
	 * mkfs'ed attr2 will turn on attr2 mount unless explicitly
	 * told by noattr2 to turn it off
	 */
	if (xfs_sb_version_hasattr2(&mp->m_sb) &&
1513
	    !(mp->m_flags & XFS_MOUNT_NOATTR2))
1514 1515 1516 1517 1518 1519
		mp->m_flags |= XFS_MOUNT_ATTR2;

	/*
	 * prohibit r/w mounts of read-only filesystems
	 */
	if ((mp->m_sb.sb_flags & XFS_SBF_READONLY) && !ronly) {
1520 1521
		xfs_warn(mp,
			"cannot mount a read-only filesystem as read-write");
D
Dave Chinner 已提交
1522
		return -EROFS;
1523 1524
	}

1525 1526 1527 1528 1529
	if ((mp->m_qflags & (XFS_GQUOTA_ACCT | XFS_GQUOTA_ACTIVE)) &&
	    (mp->m_qflags & (XFS_PQUOTA_ACCT | XFS_PQUOTA_ACTIVE)) &&
	    !xfs_sb_version_has_pquotino(&mp->m_sb)) {
		xfs_warn(mp,
		  "Super block does not support project and group quota together");
D
Dave Chinner 已提交
1530
		return -EINVAL;
1531 1532
	}

1533 1534 1535
	return 0;
}

D
Dave Chinner 已提交
1536 1537 1538 1539 1540 1541 1542 1543
/*
 * Set up the three per-cpu counters of the mount (m_icount, m_ifree and
 * m_fdblocks), each starting at zero.  Counters that were already
 * initialised are destroyed again if a later one fails.
 *
 * Returns 0 on success, -ENOMEM on any failure.
 */
static int
xfs_init_percpu_counters(
	struct xfs_mount	*mp)
{
	if (percpu_counter_init(&mp->m_icount, 0, GFP_KERNEL))
		return -ENOMEM;

	if (percpu_counter_init(&mp->m_ifree, 0, GFP_KERNEL))
		goto undo_icount;

	if (percpu_counter_init(&mp->m_fdblocks, 0, GFP_KERNEL))
		goto undo_ifree;

	return 0;

undo_ifree:
	percpu_counter_destroy(&mp->m_ifree);
undo_icount:
	percpu_counter_destroy(&mp->m_icount);
	return -ENOMEM;
}

void
xfs_reinit_percpu_counters(
	struct xfs_mount	*mp)
{
	percpu_counter_set(&mp->m_icount, mp->m_sb.sb_icount);
	percpu_counter_set(&mp->m_ifree, mp->m_sb.sb_ifree);
	percpu_counter_set(&mp->m_fdblocks, mp->m_sb.sb_fdblocks);
}

/*
 * Tear down the per-cpu counters created by xfs_init_percpu_counters().
 */
static void
xfs_destroy_percpu_counters(
	struct xfs_mount	*mp)
{
	percpu_counter_destroy(&mp->m_icount);
	percpu_counter_destroy(&mp->m_ifree);
	percpu_counter_destroy(&mp->m_fdblocks);
}

1581 1582 1583
static struct xfs_mount *
xfs_mount_alloc(
	struct super_block	*sb)
L
Linus Torvalds 已提交
1584
{
1585
	struct xfs_mount	*mp;
1586

C
Christoph Hellwig 已提交
1587 1588
	mp = kzalloc(sizeof(struct xfs_mount), GFP_KERNEL);
	if (!mp)
1589
		return NULL;
L
Linus Torvalds 已提交
1590

1591
	mp->m_super = sb;
C
Christoph Hellwig 已提交
1592
	spin_lock_init(&mp->m_sb_lock);
1593 1594 1595
	spin_lock_init(&mp->m_agirotor_lock);
	INIT_RADIX_TREE(&mp->m_perag_tree, GFP_ATOMIC);
	spin_lock_init(&mp->m_perag_lock);
C
Christoph Hellwig 已提交
1596 1597
	mutex_init(&mp->m_growlock);
	atomic_set(&mp->m_active_trans, 0);
D
Dave Chinner 已提交
1598
	INIT_DELAYED_WORK(&mp->m_reclaim_work, xfs_reclaim_worker);
1599
	INIT_DELAYED_WORK(&mp->m_eofblocks_work, xfs_eofblocks_worker);
1600
	INIT_DELAYED_WORK(&mp->m_cowblocks_work, xfs_cowblocks_worker);
D
Dave Chinner 已提交
1601
	mp->m_kobj.kobject.kset = xfs_kset;
1602 1603
	return mp;
}
1604

1605 1606 1607 1608 1609 1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622

STATIC int
xfs_fs_fill_super(
	struct super_block	*sb,
	void			*data,
	int			silent)
{
	struct inode		*root;
	struct xfs_mount	*mp = NULL;
	int			flags = 0, error = -ENOMEM;

	/*
	 * allocate mp and do all low-level struct initializations before we
	 * attach it to the super
	 */
	mp = xfs_mount_alloc(sb);
	if (!mp)
		goto out;
C
Christoph Hellwig 已提交
1623
	sb->s_fs_info = mp;
L
Linus Torvalds 已提交
1624

C
Christoph Hellwig 已提交
1625
	error = xfs_parseargs(mp, (char *)data);
1626
	if (error)
1627
		goto out_free_fsname;
L
Linus Torvalds 已提交
1628 1629

	sb_min_blocksize(sb, BBSIZE);
1630
	sb->s_xattr = xfs_xattr_handlers;
1631
	sb->s_export_op = &xfs_export_operations;
1632
#ifdef CONFIG_XFS_QUOTA
1633
	sb->s_qcop = &xfs_quotactl_operations;
J
Jan Kara 已提交
1634
	sb->s_quota_types = QTYPE_MASK_USR | QTYPE_MASK_GRP | QTYPE_MASK_PRJ;
1635
#endif
1636
	sb->s_op = &xfs_super_operations;
L
Linus Torvalds 已提交
1637

D
Dave Chinner 已提交
1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648
	/*
	 * Delay mount work if the debug hook is set. This is debug
	 * instrumention to coordinate simulation of xfs mount failures with
	 * VFS superblock operations
	 */
	if (xfs_globals.mount_delay) {
		xfs_notice(mp, "Delaying mount for %d seconds.",
			xfs_globals.mount_delay);
		msleep(xfs_globals.mount_delay * 1000);
	}

1649
	if (silent)
1650 1651
		flags |= XFS_MFSI_QUIET;

1652
	error = xfs_open_devices(mp);
1653
	if (error)
C
Christoph Hellwig 已提交
1654
		goto out_free_fsname;
1655

D
Dave Chinner 已提交
1656
	error = xfs_init_mount_workqueues(mp);
1657 1658
	if (error)
		goto out_close_devices;
C
Christoph Hellwig 已提交
1659

D
Dave Chinner 已提交
1660
	error = xfs_init_percpu_counters(mp);
1661 1662 1663
	if (error)
		goto out_destroy_workqueues;

1664 1665 1666
	/* Allocate stats memory before we do operations that might use it */
	mp->m_stats.xs_stats = alloc_percpu(struct xfsstats);
	if (!mp->m_stats.xs_stats) {
1667
		error = -ENOMEM;
1668 1669 1670
		goto out_destroy_counters;
	}

1671 1672
	error = xfs_readsb(mp, flags);
	if (error)
1673
		goto out_free_stats;
1674 1675

	error = xfs_finish_flags(mp);
1676
	if (error)
1677
		goto out_free_sb;
1678

1679
	error = xfs_setup_devices(mp);
1680
	if (error)
1681
		goto out_free_sb;
1682 1683 1684

	error = xfs_filestream_mount(mp);
	if (error)
1685
		goto out_free_sb;
1686

1687 1688 1689 1690
	/*
	 * we must configure the block size in the superblock before we run the
	 * full mount process as the mount process can lookup and cache inodes.
	 */
C
Christoph Hellwig 已提交
1691 1692 1693
	sb->s_magic = XFS_SB_MAGIC;
	sb->s_blocksize = mp->m_sb.sb_blocksize;
	sb->s_blocksize_bits = ffs(sb->s_blocksize) - 1;
L
Linus Torvalds 已提交
1694
	sb->s_maxbytes = xfs_max_file_offset(sb->s_blocksize_bits);
1695
	sb->s_max_links = XFS_MAXLINK;
L
Linus Torvalds 已提交
1696 1697 1698
	sb->s_time_gran = 1;
	set_posix_acl_flag(sb);

D
Dave Chinner 已提交
1699 1700
	/* version 5 superblocks support inode version counters. */
	if (XFS_SB_VERSION_NUM(&mp->m_sb) == XFS_SB_VERSION_5)
M
Matthew Garrett 已提交
1701
		sb->s_flags |= SB_I_VERSION;
D
Dave Chinner 已提交
1702

D
Dave Chinner 已提交
1703
	if (mp->m_flags & XFS_MOUNT_DAX) {
1704 1705
		int	error2 = 0;

D
Dave Chinner 已提交
1706
		xfs_warn(mp,
1707 1708
		"DAX enabled. Warning: EXPERIMENTAL, use at your own risk");

1709 1710 1711 1712 1713 1714
		error = bdev_dax_supported(mp->m_ddev_targp->bt_bdev,
				sb->s_blocksize);
		if (mp->m_rtdev_targp)
			error2 = bdev_dax_supported(mp->m_rtdev_targp->bt_bdev,
					sb->s_blocksize);
		if (error && error2) {
D
Dave Chinner 已提交
1715
			xfs_alert(mp,
1716
			"DAX unsupported by block device. Turning off DAX.");
D
Dave Chinner 已提交
1717 1718
			mp->m_flags &= ~XFS_MOUNT_DAX;
		}
1719
		if (xfs_sb_version_hasreflink(&mp->m_sb)) {
1720
			xfs_alert(mp,
1721
		"DAX and reflink cannot be used together!");
1722 1723 1724
			error = -EINVAL;
			goto out_filestream_unmount;
		}
D
Dave Chinner 已提交
1725 1726
	}

1727 1728 1729 1730 1731 1732 1733 1734 1735 1736
	if (mp->m_flags & XFS_MOUNT_DISCARD) {
		struct request_queue *q = bdev_get_queue(sb->s_bdev);

		if (!blk_queue_discard(q)) {
			xfs_warn(mp, "mounting with \"discard\" option, but "
					"the device does not support discard");
			mp->m_flags &= ~XFS_MOUNT_DISCARD;
		}
	}

1737 1738 1739 1740 1741 1742 1743
	if (xfs_sb_version_hasreflink(&mp->m_sb) && mp->m_sb.sb_rblocks) {
		xfs_alert(mp,
	"reflink not compatible with realtime device!");
		error = -EINVAL;
		goto out_filestream_unmount;
	}

1744
	if (xfs_sb_version_hasrmapbt(&mp->m_sb) && mp->m_sb.sb_rblocks) {
1745
		xfs_alert(mp,
1746 1747 1748
	"reverse mapping btree not compatible with realtime device!");
		error = -EINVAL;
		goto out_filestream_unmount;
1749
	}
1750

1751
	error = xfs_mountfs(mp);
1752
	if (error)
D
Dave Chinner 已提交
1753
		goto out_filestream_unmount;
1754

1755
	root = igrab(VFS_I(mp->m_rootip));
1756
	if (!root) {
D
Dave Chinner 已提交
1757
		error = -ENOENT;
1758
		goto out_unmount;
C
Christoph Hellwig 已提交
1759
	}
1760
	sb->s_root = d_make_root(root);
1761
	if (!sb->s_root) {
D
Dave Chinner 已提交
1762
		error = -ENOMEM;
1763
		goto out_unmount;
L
Linus Torvalds 已提交
1764
	}
1765

L
Linus Torvalds 已提交
1766
	return 0;
D
Dave Chinner 已提交
1767

D
Dave Chinner 已提交
1768
 out_filestream_unmount:
1769
	xfs_filestream_unmount(mp);
1770 1771
 out_free_sb:
	xfs_freesb(mp);
1772 1773
 out_free_stats:
	free_percpu(mp->m_stats.xs_stats);
1774
 out_destroy_counters:
D
Dave Chinner 已提交
1775
	xfs_destroy_percpu_counters(mp);
1776
 out_destroy_workqueues:
1777
	xfs_destroy_mount_workqueues(mp);
1778
 out_close_devices:
1779
	xfs_close_devices(mp);
1780
 out_free_fsname:
1781
	sb->s_fs_info = NULL;
1782
	xfs_free_fsname(mp);
C
Christoph Hellwig 已提交
1783
	kfree(mp);
1784
 out:
D
Dave Chinner 已提交
1785
	return error;
1786

1787
 out_unmount:
1788
	xfs_filestream_unmount(mp);
1789
	xfs_unmountfs(mp);
1790
	goto out_free_sb;
L
Linus Torvalds 已提交
1791 1792
}

D
Dave Chinner 已提交
1793 1794 1795 1796 1797 1798
STATIC void
xfs_fs_put_super(
	struct super_block	*sb)
{
	struct xfs_mount	*mp = XFS_M(sb);

1799 1800 1801 1802
	/* if ->fill_super failed, we have no mount to tear down */
	if (!sb->s_fs_info)
		return;

1803
	xfs_notice(mp, "Unmounting Filesystem");
D
Dave Chinner 已提交
1804 1805 1806 1807
	xfs_filestream_unmount(mp);
	xfs_unmountfs(mp);

	xfs_freesb(mp);
1808
	free_percpu(mp->m_stats.xs_stats);
D
Dave Chinner 已提交
1809 1810 1811
	xfs_destroy_percpu_counters(mp);
	xfs_destroy_mount_workqueues(mp);
	xfs_close_devices(mp);
1812 1813

	sb->s_fs_info = NULL;
D
Dave Chinner 已提交
1814 1815 1816 1817
	xfs_free_fsname(mp);
	kfree(mp);
}

A
Al Viro 已提交
1818 1819
STATIC struct dentry *
xfs_fs_mount(
L
Linus Torvalds 已提交
1820 1821 1822
	struct file_system_type	*fs_type,
	int			flags,
	const char		*dev_name,
A
Al Viro 已提交
1823
	void			*data)
L
Linus Torvalds 已提交
1824
{
A
Al Viro 已提交
1825
	return mount_bdev(fs_type, flags, dev_name, data, xfs_fs_fill_super);
1826 1827
}

1828
static long
1829
xfs_fs_nr_cached_objects(
1830
	struct super_block	*sb,
1831
	struct shrink_control	*sc)
1832
{
1833 1834 1835
	/* Paranoia: catch incorrect calls during mount setup or teardown */
	if (WARN_ON_ONCE(!sb->s_fs_info))
		return 0;
1836 1837 1838
	return xfs_reclaim_inodes_count(XFS_M(sb));
}

1839
static long
1840 1841
xfs_fs_free_cached_objects(
	struct super_block	*sb,
1842
	struct shrink_control	*sc)
1843
{
1844
	return xfs_reclaim_inodes_nr(XFS_M(sb), sc->nr_to_scan);
1845 1846
}

1847
static const struct super_operations xfs_super_operations = {
1848 1849
	.alloc_inode		= xfs_fs_alloc_inode,
	.destroy_inode		= xfs_fs_destroy_inode,
1850
	.dirty_inode		= xfs_fs_dirty_inode,
1851
	.drop_inode		= xfs_fs_drop_inode,
1852
	.put_super		= xfs_fs_put_super,
C
Christoph Hellwig 已提交
1853
	.sync_fs		= xfs_fs_sync_fs,
1854
	.freeze_fs		= xfs_fs_freeze,
E
Eric Sandeen 已提交
1855
	.unfreeze_fs		= xfs_fs_unfreeze,
1856 1857 1858
	.statfs			= xfs_fs_statfs,
	.remount_fs		= xfs_fs_remount,
	.show_options		= xfs_fs_show_options,
1859 1860
	.nr_cached_objects	= xfs_fs_nr_cached_objects,
	.free_cached_objects	= xfs_fs_free_cached_objects,
L
Linus Torvalds 已提交
1861 1862
};

A
Andrew Morton 已提交
1863
static struct file_system_type xfs_fs_type = {
L
Linus Torvalds 已提交
1864 1865
	.owner			= THIS_MODULE,
	.name			= "xfs",
A
Al Viro 已提交
1866
	.mount			= xfs_fs_mount,
L
Linus Torvalds 已提交
1867 1868 1869
	.kill_sb		= kill_block_super,
	.fs_flags		= FS_REQUIRES_DEV,
};
1870
MODULE_ALIAS_FS("xfs");
L
Linus Torvalds 已提交
1871

1872 1873 1874
/*
 * Create the ioend bioset and every slab zone used by XFS.
 *
 * Returns 0 once all of them exist.  If any single creation fails, the
 * objects created before it are released in reverse order of creation via
 * the chain of labels at the bottom, and -ENOMEM is returned.
 */
STATIC int __init
xfs_init_zones(void)
{
	xfs_ioend_bioset = bioset_create(4 * MAX_BUF_PER_PAGE,
			offsetof(struct xfs_ioend, io_inline_bio),
			BIOSET_NEED_BVECS);
	if (!xfs_ioend_bioset)
		goto out;

	xfs_log_ticket_zone = kmem_zone_init(sizeof(xlog_ticket_t),
						"xfs_log_ticket");
	if (!xfs_log_ticket_zone)
		goto out_free_ioend_bioset;

	xfs_bmap_free_item_zone = kmem_zone_init(
			sizeof(struct xfs_extent_free_item),
			"xfs_bmap_free_item");
	if (!xfs_bmap_free_item_zone)
		goto out_destroy_log_ticket_zone;

	xfs_btree_cur_zone = kmem_zone_init(sizeof(xfs_btree_cur_t),
						"xfs_btree_cur");
	if (!xfs_btree_cur_zone)
		goto out_destroy_bmap_free_item_zone;

	xfs_da_state_zone = kmem_zone_init(sizeof(xfs_da_state_t),
						"xfs_da_state");
	if (!xfs_da_state_zone)
		goto out_destroy_btree_cur_zone;

	xfs_ifork_zone = kmem_zone_init(sizeof(xfs_ifork_t), "xfs_ifork");
	if (!xfs_ifork_zone)
		goto out_destroy_da_state_zone;

	xfs_trans_zone = kmem_zone_init(sizeof(xfs_trans_t), "xfs_trans");
	if (!xfs_trans_zone)
		goto out_destroy_ifork_zone;

	/*
	 * The size of the zone allocated buf log item is the maximum
	 * size possible under XFS.  This wastes a little bit of memory,
	 * but it is much faster.
	 */
	xfs_buf_item_zone = kmem_zone_init(sizeof(struct xfs_buf_log_item),
					   "xfs_buf_item");
	if (!xfs_buf_item_zone)
		goto out_destroy_trans_zone;

	/* EFD/EFI items are sized for the log item plus the fast extents. */
	xfs_efd_zone = kmem_zone_init((sizeof(xfs_efd_log_item_t) +
			((XFS_EFD_MAX_FAST_EXTENTS - 1) *
				 sizeof(xfs_extent_t))), "xfs_efd_item");
	if (!xfs_efd_zone)
		goto out_destroy_buf_item_zone;

	xfs_efi_zone = kmem_zone_init((sizeof(xfs_efi_log_item_t) +
			((XFS_EFI_MAX_FAST_EXTENTS - 1) *
				sizeof(xfs_extent_t))), "xfs_efi_item");
	if (!xfs_efi_zone)
		goto out_destroy_efd_zone;

	xfs_inode_zone =
		kmem_zone_init_flags(sizeof(xfs_inode_t), "xfs_inode",
			KM_ZONE_HWALIGN | KM_ZONE_RECLAIM | KM_ZONE_SPREAD |
			KM_ZONE_ACCOUNT, xfs_fs_inode_init_once);
	if (!xfs_inode_zone)
		goto out_destroy_efi_zone;

	xfs_ili_zone =
		kmem_zone_init_flags(sizeof(xfs_inode_log_item_t), "xfs_ili",
					KM_ZONE_SPREAD, NULL);
	if (!xfs_ili_zone)
		goto out_destroy_inode_zone;

	xfs_icreate_zone = kmem_zone_init(sizeof(struct xfs_icreate_item),
					"xfs_icr");
	if (!xfs_icreate_zone)
		goto out_destroy_ili_zone;

	xfs_rud_zone = kmem_zone_init(sizeof(struct xfs_rud_log_item),
			"xfs_rud_item");
	if (!xfs_rud_zone)
		goto out_destroy_icreate_zone;

	xfs_rui_zone = kmem_zone_init(
			xfs_rui_log_item_sizeof(XFS_RUI_MAX_FAST_EXTENTS),
			"xfs_rui_item");
	if (!xfs_rui_zone)
		goto out_destroy_rud_zone;

	xfs_cud_zone = kmem_zone_init(sizeof(struct xfs_cud_log_item),
			"xfs_cud_item");
	if (!xfs_cud_zone)
		goto out_destroy_rui_zone;

	xfs_cui_zone = kmem_zone_init(
			xfs_cui_log_item_sizeof(XFS_CUI_MAX_FAST_EXTENTS),
			"xfs_cui_item");
	if (!xfs_cui_zone)
		goto out_destroy_cud_zone;

	xfs_bud_zone = kmem_zone_init(sizeof(struct xfs_bud_log_item),
			"xfs_bud_item");
	if (!xfs_bud_zone)
		goto out_destroy_cui_zone;

	xfs_bui_zone = kmem_zone_init(
			xfs_bui_log_item_sizeof(XFS_BUI_MAX_FAST_EXTENTS),
			"xfs_bui_item");
	if (!xfs_bui_zone)
		goto out_destroy_bud_zone;

	return 0;

	/* Unwind: each label falls through to release everything older. */
 out_destroy_bud_zone:
	kmem_zone_destroy(xfs_bud_zone);
 out_destroy_cui_zone:
	kmem_zone_destroy(xfs_cui_zone);
 out_destroy_cud_zone:
	kmem_zone_destroy(xfs_cud_zone);
 out_destroy_rui_zone:
	kmem_zone_destroy(xfs_rui_zone);
 out_destroy_rud_zone:
	kmem_zone_destroy(xfs_rud_zone);
 out_destroy_icreate_zone:
	kmem_zone_destroy(xfs_icreate_zone);
 out_destroy_ili_zone:
	kmem_zone_destroy(xfs_ili_zone);
 out_destroy_inode_zone:
	kmem_zone_destroy(xfs_inode_zone);
 out_destroy_efi_zone:
	kmem_zone_destroy(xfs_efi_zone);
 out_destroy_efd_zone:
	kmem_zone_destroy(xfs_efd_zone);
 out_destroy_buf_item_zone:
	kmem_zone_destroy(xfs_buf_item_zone);
 out_destroy_trans_zone:
	kmem_zone_destroy(xfs_trans_zone);
 out_destroy_ifork_zone:
	kmem_zone_destroy(xfs_ifork_zone);
 out_destroy_da_state_zone:
	kmem_zone_destroy(xfs_da_state_zone);
 out_destroy_btree_cur_zone:
	kmem_zone_destroy(xfs_btree_cur_zone);
 out_destroy_bmap_free_item_zone:
	kmem_zone_destroy(xfs_bmap_free_item_zone);
 out_destroy_log_ticket_zone:
	kmem_zone_destroy(xfs_log_ticket_zone);
 out_free_ioend_bioset:
	bioset_free(xfs_ioend_bioset);
 out:
	return -ENOMEM;
}

STATIC void
xfs_destroy_zones(void)
{
2028 2029 2030 2031 2032
	/*
	 * Make sure all delayed rcu free are flushed before we
	 * destroy caches.
	 */
	rcu_barrier();
2033 2034
	kmem_zone_destroy(xfs_bui_zone);
	kmem_zone_destroy(xfs_bud_zone);
2035 2036
	kmem_zone_destroy(xfs_cui_zone);
	kmem_zone_destroy(xfs_cud_zone);
2037 2038
	kmem_zone_destroy(xfs_rui_zone);
	kmem_zone_destroy(xfs_rud_zone);
D
Dave Chinner 已提交
2039
	kmem_zone_destroy(xfs_icreate_zone);
2040 2041 2042 2043 2044 2045 2046 2047 2048 2049 2050
	kmem_zone_destroy(xfs_ili_zone);
	kmem_zone_destroy(xfs_inode_zone);
	kmem_zone_destroy(xfs_efi_zone);
	kmem_zone_destroy(xfs_efd_zone);
	kmem_zone_destroy(xfs_buf_item_zone);
	kmem_zone_destroy(xfs_trans_zone);
	kmem_zone_destroy(xfs_ifork_zone);
	kmem_zone_destroy(xfs_da_state_zone);
	kmem_zone_destroy(xfs_btree_cur_zone);
	kmem_zone_destroy(xfs_bmap_free_item_zone);
	kmem_zone_destroy(xfs_log_ticket_zone);
2051
	bioset_free(xfs_ioend_bioset);
2052
}
L
Linus Torvalds 已提交
2053

2054 2055 2056
/*
 * Create the "xfsalloc" and "xfsdiscard" workqueues.
 *
 * Returns 0 when both exist.  Returns -ENOMEM if either allocation fails;
 * if the second one fails, the first is destroyed before returning.
 */
STATIC int __init
xfs_init_workqueues(void)
{
	/*
	 * The allocation workqueue can be used in memory reclaim situations
	 * (writepage path), and parallelism is only limited by the number of
	 * AGs in all the filesystems mounted. Hence use the default large
	 * max_active value for this workqueue.
	 */
	xfs_alloc_wq = alloc_workqueue("xfsalloc",
			WQ_MEM_RECLAIM|WQ_FREEZABLE, 0);
	if (!xfs_alloc_wq)
		return -ENOMEM;

	xfs_discard_wq = alloc_workqueue("xfsdiscard", WQ_UNBOUND, 0);
	if (!xfs_discard_wq)
		goto out_free_alloc_wq;

	return 0;
out_free_alloc_wq:
	destroy_workqueue(xfs_alloc_wq);
	return -ENOMEM;
}

2078
STATIC void
2079 2080
xfs_destroy_workqueues(void)
{
2081
	destroy_workqueue(xfs_discard_wq);
2082
	destroy_workqueue(xfs_alloc_wq);
2083 2084
}

L
Linus Torvalds 已提交
2085
STATIC int __init
2086
init_xfs_fs(void)
L
Linus Torvalds 已提交
2087 2088 2089
{
	int			error;

2090 2091
	xfs_check_ondisk_structs();

2092 2093
	printk(KERN_INFO XFS_VERSION_STRING " with "
			 XFS_BUILD_OPTIONS " enabled\n");
L
Linus Torvalds 已提交
2094

2095
	xfs_extent_free_init_defer_op();
2096
	xfs_rmap_update_init_defer_op();
2097
	xfs_refcount_update_init_defer_op();
2098
	xfs_bmap_update_init_defer_op();
2099

2100
	xfs_dir_startup();
L
Linus Torvalds 已提交
2101

2102
	error = xfs_init_zones();
2103 2104 2105
	if (error)
		goto out;

2106
	error = xfs_init_workqueues();
2107
	if (error)
C
Christoph Hellwig 已提交
2108
		goto out_destroy_zones;
2109

2110 2111 2112 2113
	error = xfs_mru_cache_init();
	if (error)
		goto out_destroy_wq;

2114
	error = xfs_buf_init();
2115
	if (error)
2116
		goto out_mru_cache_uninit;
2117 2118 2119 2120 2121 2122 2123 2124

	error = xfs_init_procfs();
	if (error)
		goto out_buf_terminate;

	error = xfs_sysctl_register();
	if (error)
		goto out_cleanup_procfs;
L
Linus Torvalds 已提交
2125

B
Brian Foster 已提交
2126 2127 2128
	xfs_kset = kset_create_and_add("xfs", NULL, fs_kobj);
	if (!xfs_kset) {
		error = -ENOMEM;
2129
		goto out_sysctl_unregister;
B
Brian Foster 已提交
2130 2131
	}

2132 2133 2134 2135 2136 2137 2138 2139 2140
	xfsstats.xs_kobj.kobject.kset = xfs_kset;

	xfsstats.xs_stats = alloc_percpu(struct xfsstats);
	if (!xfsstats.xs_stats) {
		error = -ENOMEM;
		goto out_kset_unregister;
	}

	error = xfs_sysfs_init(&xfsstats.xs_kobj, &xfs_stats_ktype, NULL,
2141 2142
			       "stats");
	if (error)
2143
		goto out_free_stats;
2144

2145 2146 2147
#ifdef DEBUG
	xfs_dbg_kobj.kobject.kset = xfs_kset;
	error = xfs_sysfs_init(&xfs_dbg_kobj, &xfs_dbg_ktype, NULL, "debug");
2148
	if (error)
2149
		goto out_remove_stats_kobj;
2150 2151 2152 2153
#endif

	error = xfs_qm_init();
	if (error)
2154
		goto out_remove_dbg_kobj;
L
Linus Torvalds 已提交
2155 2156 2157

	error = register_filesystem(&xfs_fs_type);
	if (error)
2158
		goto out_qm_exit;
L
Linus Torvalds 已提交
2159 2160
	return 0;

2161 2162
 out_qm_exit:
	xfs_qm_exit();
2163
 out_remove_dbg_kobj:
2164 2165
#ifdef DEBUG
	xfs_sysfs_del(&xfs_dbg_kobj);
2166
 out_remove_stats_kobj:
2167
#endif
2168 2169 2170
	xfs_sysfs_del(&xfsstats.xs_kobj);
 out_free_stats:
	free_percpu(xfsstats.xs_stats);
2171
 out_kset_unregister:
B
Brian Foster 已提交
2172
	kset_unregister(xfs_kset);
2173 2174 2175 2176 2177
 out_sysctl_unregister:
	xfs_sysctl_unregister();
 out_cleanup_procfs:
	xfs_cleanup_procfs();
 out_buf_terminate:
2178
	xfs_buf_terminate();
2179 2180
 out_mru_cache_uninit:
	xfs_mru_cache_uninit();
2181 2182
 out_destroy_wq:
	xfs_destroy_workqueues();
2183
 out_destroy_zones:
2184
	xfs_destroy_zones();
2185
 out:
L
Linus Torvalds 已提交
2186 2187 2188 2189
	return error;
}

STATIC void __exit
2190
exit_xfs_fs(void)
L
Linus Torvalds 已提交
2191
{
2192
	xfs_qm_exit();
L
Linus Torvalds 已提交
2193
	unregister_filesystem(&xfs_fs_type);
2194 2195 2196
#ifdef DEBUG
	xfs_sysfs_del(&xfs_dbg_kobj);
#endif
2197 2198
	xfs_sysfs_del(&xfsstats.xs_kobj);
	free_percpu(xfsstats.xs_stats);
B
Brian Foster 已提交
2199
	kset_unregister(xfs_kset);
2200 2201
	xfs_sysctl_unregister();
	xfs_cleanup_procfs();
2202
	xfs_buf_terminate();
2203
	xfs_mru_cache_uninit();
2204
	xfs_destroy_workqueues();
2205
	xfs_destroy_zones();
2206
	xfs_uuid_table_free();
L
Linus Torvalds 已提交
2207 2208 2209 2210 2211 2212 2213 2214
}

/* Hook the load/unload entry points into the module loader. */
module_init(init_xfs_fs);
module_exit(exit_xfs_fs);

/* Module metadata; the description reuses the banner text printed at load. */
MODULE_AUTHOR("Silicon Graphics, Inc.");
MODULE_DESCRIPTION(XFS_VERSION_STRING " with " XFS_BUILD_OPTIONS " enabled");
MODULE_LICENSE("GPL");