dir.c 21.4 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10
/*
 * dir.c - Operations for sysfs directories.
 */

#undef DEBUG

#include <linux/fs.h>
#include <linux/mount.h>
#include <linux/module.h>
#include <linux/kobject.h>
11
#include <linux/namei.h>
12
#include <linux/idr.h>
13
#include <linux/completion.h>
14
#include <asm/semaphore.h>
L
Linus Torvalds 已提交
15 16 17
#include "sysfs.h"

DECLARE_RWSEM(sysfs_rename_sem);
T
Tejun Heo 已提交
18
spinlock_t sysfs_assoc_lock = SPIN_LOCK_UNLOCKED;
L
Linus Torvalds 已提交
19

20 21 22
static spinlock_t sysfs_ino_lock = SPIN_LOCK_UNLOCKED;
static DEFINE_IDA(sysfs_ino_ida);

23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64
/**
 *	sysfs_link_sibling - push a sysfs_dirent onto its parent's child list
 *	@sd: sysfs_dirent to link; sd->s_parent must already be set
 *
 *	Insert @sd at the head of the singly linked list rooted at
 *	sd->s_parent->s_children.  @sd must not be on a sibling list
 *	already, i.e. sd->s_sibling has to be NULL.
 *
 *	Locking:
 *	mutex_lock(sd->s_parent->dentry->d_inode->i_mutex)
 */
static void sysfs_link_sibling(struct sysfs_dirent *sd)
{
	struct sysfs_dirent **head = &sd->s_parent->s_children;

	BUG_ON(sd->s_sibling);

	sd->s_sibling = *head;
	*head = sd;
}

/**
 *	sysfs_unlink_sibling - take a sysfs_dirent off its parent's child list
 *	@sd: sysfs_dirent to unlink
 *
 *	Search the list rooted at sd->s_parent->s_children for @sd and,
 *	if it is there, splice it out and clear sd->s_sibling.  Nothing
 *	happens when @sd is not on the list.
 *
 *	Locking:
 *	mutex_lock(sd->s_parent->dentry->d_inode->i_mutex)
 */
static void sysfs_unlink_sibling(struct sysfs_dirent *sd)
{
	struct sysfs_dirent **link = &sd->s_parent->s_children;

	/* Walk the links rather than the nodes so that the list head
	 * needs no special casing.
	 */
	while (*link && *link != sd)
		link = &(*link)->s_sibling;

	if (*link) {
		*link = sd->s_sibling;
		sd->s_sibling = NULL;
	}
}

65 66 67 68 69 70 71 72 73 74 75 76
/**
 *	sysfs_get_active - try to take an active reference on a sysfs_dirent
 *	@sd: sysfs_dirent to reference, may be NULL
 *
 *	Increment sd->s_active with a compare-and-exchange loop.  The
 *	attempt is refused as soon as the counter is observed to be
 *	negative, which is the state sysfs_deactivate() leaves behind
 *	by adding SD_DEACTIVATED_BIAS.
 *
 *	RETURNS:
 *	@sd if the reference was taken, NULL if @sd is NULL or the
 *	counter was negative.
 */
struct sysfs_dirent *sysfs_get_active(struct sysfs_dirent *sd)
{
	int cur, prev;

	if (unlikely(!sd))
		return NULL;

	for (;;) {
		cur = atomic_read(&sd->s_active);
		if (unlikely(cur < 0))
			break;

		prev = atomic_cmpxchg(&sd->s_active, cur, cur + 1);
		if (likely(prev == cur))
			return sd;
		/* lost the race; give up if the winner deactivated @sd */
		if (prev < 0)
			break;

		cpu_relax();
	}

	return NULL;
}

/**
 *	sysfs_put_active - drop an active reference on a sysfs_dirent
 *	@sd: sysfs_dirent whose active reference is dropped, may be NULL
 *
 *	Decrement sd->s_active.  If the result equals
 *	SD_DEACTIVATED_BIAS, signal the completion that
 *	sysfs_deactivate() parked in sd->s_sibling.
 */
void sysfs_put_active(struct sysfs_dirent *sd)
{
	if (unlikely(!sd))
		return;

	if (unlikely(atomic_dec_return(&sd->s_active) ==
		     SD_DEACTIVATED_BIAS)) {
		/* atomic_dec_return() is a mb(), so the sd->s_sibling
		 * value stored by sysfs_deactivate() is visible here.
		 */
		complete((struct completion *)sd->s_sibling);
	}
}

/**
 *	sysfs_get_active_two - take active references on a dirent and its parent
 *	@sd: sysfs_dirent of interest, may be NULL
 *
 *	The parent (if there is one) is referenced first, then @sd.  If
 *	@sd refuses, the parent's reference is dropped again so that the
 *	call either takes both references or none.
 *
 *	RETURNS:
 *	@sd on success, NULL if @sd is NULL or either reference could
 *	not be taken.
 */
struct sysfs_dirent *sysfs_get_active_two(struct sysfs_dirent *sd)
{
	if (!sd)
		return NULL;

	if (sd->s_parent && unlikely(!sysfs_get_active(sd->s_parent)))
		return NULL;

	if (likely(sysfs_get_active(sd)))
		return sd;

	/* @sd refused the reference, undo the parent's */
	sysfs_put_active(sd->s_parent);
	return NULL;
}

/**
 *	sysfs_put_active_two - drop active references on a dirent and its parent
 *	@sd: sysfs_dirent of interest, may be NULL
 *
 *	Counterpart of sysfs_get_active_two(): @sd is released first,
 *	then sd->s_parent.  sysfs_put_active() ignores a NULL parent.
 */
void sysfs_put_active_two(struct sysfs_dirent *sd)
{
	if (!sd)
		return;

	sysfs_put_active(sd);
	sysfs_put_active(sd->s_parent);
}

/**
 *	sysfs_deactivate - deactivate sysfs_dirent
 *	@sd: sysfs_dirent to deactivate
 *
166
 *	Deny new active references and drain existing ones.
167 168 169
 */
void sysfs_deactivate(struct sysfs_dirent *sd)
{
170 171
	DECLARE_COMPLETION_ONSTACK(wait);
	int v;
172

173
	BUG_ON(sd->s_sibling || !(sd->s_flags & SYSFS_FLAG_REMOVED));
174
	sd->s_sibling = (void *)&wait;
175 176

	/* atomic_add_return() is a mb(), put_active() will always see
177
	 * the updated sd->s_sibling.
178
	 */
179 180 181 182 183
	v = atomic_add_return(SD_DEACTIVATED_BIAS, &sd->s_active);

	if (v != SD_DEACTIVATED_BIAS)
		wait_for_completion(&wait);

184
	sd->s_sibling = NULL;
185 186
}

T
Tejun Heo 已提交
187
/**
 *	sysfs_alloc_ino - allocate an inode number from sysfs_ino_ida
 *	@pino: where to store the allocated number
 *
 *	Ask the ida for an id starting from 2.  Whenever the ida
 *	reports -EAGAIN, preload it with ida_pre_get() (GFP_KERNEL, so
 *	this may sleep) and try again; a failed preload is reported as
 *	-ENOMEM.
 *
 *	RETURNS:
 *	0 on success with the number stored in *@pino, -errno on
 *	failure, in which case *@pino is left untouched.
 */
static int sysfs_alloc_ino(ino_t *pino)
{
	int ino, rc;

	do {
		spin_lock(&sysfs_ino_lock);
		rc = ida_get_new_above(&sysfs_ino_ida, 2, &ino);
		spin_unlock(&sysfs_ino_lock);
	} while (rc == -EAGAIN && ida_pre_get(&sysfs_ino_ida, GFP_KERNEL));

	/* still -EAGAIN means the preload itself failed */
	if (rc == -EAGAIN)
		rc = -ENOMEM;

	/* ino is only meaningful on success; never hand back garbage */
	if (rc)
		return rc;

	*pino = ino;
	return 0;
}

/* Give inode number @ino back to sysfs_ino_ida, under sysfs_ino_lock. */
static void sysfs_free_ino(ino_t ino)
{
	spin_lock(&sysfs_ino_lock);
	ida_remove(&sysfs_ino_ida, ino);
	spin_unlock(&sysfs_ino_lock);
}

213 214
void release_sysfs_dirent(struct sysfs_dirent * sd)
{
T
Tejun Heo 已提交
215 216 217 218 219
	struct sysfs_dirent *parent_sd;

 repeat:
	parent_sd = sd->s_parent;

220
	if (sysfs_type(sd) == SYSFS_KOBJ_LINK)
221
		sysfs_put(sd->s_elem.symlink.target_sd);
222
	if (sysfs_type(sd) & SYSFS_COPY_NAME)
T
Tejun Heo 已提交
223
		kfree(sd->s_name);
224
	kfree(sd->s_iattr);
225
	sysfs_free_ino(sd->s_ino);
226
	kmem_cache_free(sysfs_dir_cachep, sd);
T
Tejun Heo 已提交
227 228 229 230

	sd = parent_sd;
	if (sd && atomic_dec_and_test(&sd->s_count))
		goto repeat;
231 232
}

L
Linus Torvalds 已提交
233 234 235 236 237
static void sysfs_d_iput(struct dentry * dentry, struct inode * inode)
{
	struct sysfs_dirent * sd = dentry->d_fsdata;

	if (sd) {
T
Tejun Heo 已提交
238 239
		/* sd->s_dentry is protected with sysfs_assoc_lock.
		 * This allows sysfs_drop_dentry() to dereference it.
240
		 */
T
Tejun Heo 已提交
241
		spin_lock(&sysfs_assoc_lock);
242 243 244 245 246 247 248 249

		/* The dentry might have been deleted or another
		 * lookup could have happened updating sd->s_dentry to
		 * point the new dentry.  Ignore if it isn't pointing
		 * to this dentry.
		 */
		if (sd->s_dentry == dentry)
			sd->s_dentry = NULL;
T
Tejun Heo 已提交
250
		spin_unlock(&sysfs_assoc_lock);
L
Linus Torvalds 已提交
251 252 253 254 255 256 257 258 259
		sysfs_put(sd);
	}
	iput(inode);
}

/* dentry operations installed on sysfs dentries by sysfs_attach_dentry() */
static struct dentry_operations sysfs_dentry_ops = {
	.d_iput		= sysfs_d_iput,
};

260
/**
 *	sysfs_new_dirent - allocate and initialize a sysfs_dirent
 *	@name: name of the new entry
 *	@mode: value for sd->s_mode
 *	@type: value for sd->s_flags; if SYSFS_COPY_NAME is set in it,
 *	       @name is duplicated and the copy is owned by the dirent
 *
 *	The new dirent starts with s_count 1, s_active 0 and s_event 1
 *	and has a freshly allocated inode number.  It is not linked to
 *	a parent or a dentry yet.  Allocations use GFP_KERNEL.
 *
 *	RETURNS:
 *	Pointer to the new sysfs_dirent, NULL on allocation failure.
 */
struct sysfs_dirent *sysfs_new_dirent(const char *name, umode_t mode, int type)
{
	char *dup_name = NULL;
	struct sysfs_dirent *sd;

	if (type & SYSFS_COPY_NAME) {
		name = dup_name = kstrdup(name, GFP_KERNEL);
		if (!name)
			return NULL;
	}

	sd = kmem_cache_zalloc(sysfs_dir_cachep, GFP_KERNEL);
	if (!sd)
		goto err_free_name;

	if (sysfs_alloc_ino(&sd->s_ino))
		goto err_free_sd;

	atomic_set(&sd->s_count, 1);
	atomic_set(&sd->s_active, 0);
	atomic_set(&sd->s_event, 1);

	sd->s_name = name;
	sd->s_mode = mode;
	sd->s_flags = type;

	return sd;

	/* Unwind in reverse order of allocation.  The labels are split
	 * so that kmem_cache_free() is never reached with a NULL @sd.
	 */
 err_free_sd:
	kmem_cache_free(sysfs_dir_cachep, sd);
 err_free_name:
	kfree(dup_name);
	return NULL;
}

294 295 296 297 298 299
static void sysfs_attach_dentry(struct sysfs_dirent *sd, struct dentry *dentry)
{
	dentry->d_op = &sysfs_dentry_ops;
	dentry->d_fsdata = sysfs_get(sd);

	/* protect sd->s_dentry against sysfs_d_iput */
T
Tejun Heo 已提交
300
	spin_lock(&sysfs_assoc_lock);
301
	sd->s_dentry = dentry;
T
Tejun Heo 已提交
302
	spin_unlock(&sysfs_assoc_lock);
303 304 305 306

	d_rehash(dentry);
}

307 308
void sysfs_attach_dirent(struct sysfs_dirent *sd,
			 struct sysfs_dirent *parent_sd, struct dentry *dentry)
309
{
310 311
	if (dentry)
		sysfs_attach_dentry(sd, dentry);
312

T
Tejun Heo 已提交
313 314
	if (parent_sd) {
		sd->s_parent = sysfs_get(parent_sd);
315
		sysfs_link_sibling(sd);
T
Tejun Heo 已提交
316
	}
317 318
}

319 320 321 322 323 324
/**
 *	sysfs_find_dirent - find sysfs_dirent with the given name
 *	@parent_sd: sysfs_dirent to search under
 *	@name: name to look for
 *
 *	Look for sysfs_dirent with name @name under @parent_sd.
325
 *
326 327
 *	LOCKING:
 *	mutex_lock(parent->i_mutex)
328
 *
329 330
 *	RETURNS:
 *	Pointer to sysfs_dirent if found, NULL if not.
331
 */
332 333
struct sysfs_dirent *sysfs_find_dirent(struct sysfs_dirent *parent_sd,
				       const unsigned char *name)
334
{
335 336 337 338 339 340 341
	struct sysfs_dirent *sd;

	for (sd = parent_sd->s_children; sd; sd = sd->s_sibling)
		if (sysfs_type(sd) && !strcmp(sd->s_name, name))
			return sd;
	return NULL;
}
342

343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367
/**
 *	sysfs_get_dirent - look up a child sysfs_dirent by name and get it
 *	@parent_sd: sysfs_dirent whose children are searched
 *	@name: name to look for
 *
 *	Locked variant of sysfs_find_dirent(): takes the i_mutex of the
 *	parent's inode around the search and calls sysfs_get() on the
 *	result before the mutex is released.
 *
 *	LOCKING:
 *	Kernel thread context (may sleep)
 *
 *	RETURNS:
 *	Pointer to sysfs_dirent if found, NULL if not.
 */
struct sysfs_dirent *sysfs_get_dirent(struct sysfs_dirent *parent_sd,
				      const unsigned char *name)
{
	struct sysfs_dirent *found;

	mutex_lock(&parent_sd->s_dentry->d_inode->i_mutex);

	found = sysfs_find_dirent(parent_sd, name);
	sysfs_get(found);

	mutex_unlock(&parent_sd->s_dentry->d_inode->i_mutex);

	return found;
}

370 371
static int create_dir(struct kobject *kobj, struct sysfs_dirent *parent_sd,
		      const char *name, struct sysfs_dirent **p_sd)
L
Linus Torvalds 已提交
372
{
373
	struct dentry *parent = parent_sd->s_dentry;
L
Linus Torvalds 已提交
374 375
	int error;
	umode_t mode = S_IFDIR| S_IRWXU | S_IRUGO | S_IXUGO;
376
	struct dentry *dentry;
377
	struct inode *inode;
378
	struct sysfs_dirent *sd;
L
Linus Torvalds 已提交
379

380 381
	mutex_lock(&parent->d_inode->i_mutex);

382
	/* allocate */
383 384 385 386 387 388 389
	dentry = lookup_one_len(name, parent, strlen(name));
	if (IS_ERR(dentry)) {
		error = PTR_ERR(dentry);
		goto out_unlock;
	}

	error = -EEXIST;
390
	if (dentry->d_inode)
391 392
		goto out_dput;

393
	error = -ENOMEM;
394
	sd = sysfs_new_dirent(name, mode, SYSFS_DIR);
395
	if (!sd)
396
		goto out_drop;
397
	sd->s_elem.dir.kobj = kobj;
398

399
	inode = sysfs_get_inode(sd);
400
	if (!inode)
401 402
		goto out_sput;

403 404 405 406 407 408
	if (inode->i_state & I_NEW) {
		inode->i_op = &sysfs_dir_inode_operations;
		inode->i_fop = &sysfs_dir_operations;
		/* directory inodes start off with i_nlink == 2 (for ".") */
		inc_nlink(inode);
	}
409 410 411

	/* link in */
	error = -EEXIST;
412
	if (sysfs_find_dirent(parent_sd, name))
413 414 415
		goto out_iput;

	sysfs_instantiate(dentry, inode);
416
	inc_nlink(parent->d_inode);
417
	sysfs_attach_dirent(sd, parent_sd, dentry);
418

419
	*p_sd = sd;
420
	error = 0;
421
	goto out_unlock;	/* pin directory dentry in core */
422

423 424
 out_iput:
	iput(inode);
425 426 427 428 429 430 431 432
 out_sput:
	sysfs_put(sd);
 out_drop:
	d_drop(dentry);
 out_dput:
	dput(dentry);
 out_unlock:
	mutex_unlock(&parent->d_inode->i_mutex);
L
Linus Torvalds 已提交
433 434 435
	return error;
}

436 437
int sysfs_create_subdir(struct kobject *kobj, const char *name,
			struct sysfs_dirent **p_sd)
L
Linus Torvalds 已提交
438
{
439
	return create_dir(kobj, kobj->sd, name, p_sd);
L
Linus Torvalds 已提交
440 441 442 443 444
}

/**
 *	sysfs_create_dir - create a directory for an object.
 *	@kobj:		object we're creating directory for. 
445
 *	@shadow_parent:	parent object.
L
Linus Torvalds 已提交
446
 */
447 448
int sysfs_create_dir(struct kobject *kobj,
		     struct sysfs_dirent *shadow_parent_sd)
L
Linus Torvalds 已提交
449
{
450
	struct sysfs_dirent *parent_sd, *sd;
L
Linus Torvalds 已提交
451 452 453 454
	int error = 0;

	BUG_ON(!kobj);

455 456
	if (shadow_parent_sd)
		parent_sd = shadow_parent_sd;
457
	else if (kobj->parent)
458
		parent_sd = kobj->parent->sd;
L
Linus Torvalds 已提交
459
	else if (sysfs_mount && sysfs_mount->mnt_sb)
460
		parent_sd = sysfs_mount->mnt_sb->s_root->d_fsdata;
L
Linus Torvalds 已提交
461 462 463
	else
		return -EFAULT;

464
	error = create_dir(kobj, parent_sd, kobject_name(kobj), &sd);
L
Linus Torvalds 已提交
465
	if (!error)
466
		kobj->sd = sd;
L
Linus Torvalds 已提交
467 468 469 470 471 472 473 474
	return error;
}

static struct dentry * sysfs_lookup(struct inode *dir, struct dentry *dentry,
				struct nameidata *nd)
{
	struct sysfs_dirent * parent_sd = dentry->d_parent->d_fsdata;
	struct sysfs_dirent * sd;
475
	struct bin_attribute *bin_attr;
476 477
	struct inode *inode;
	int found = 0;
L
Linus Torvalds 已提交
478

479
	for (sd = parent_sd->s_children; sd; sd = sd->s_sibling) {
480
		if ((sysfs_type(sd) & SYSFS_NOT_PINNED) &&
481 482
		    !strcmp(sd->s_name, dentry->d_name.name)) {
			found = 1;
L
Linus Torvalds 已提交
483 484 485 486
			break;
		}
	}

487 488 489 490 491
	/* no such entry */
	if (!found)
		return NULL;

	/* attach dentry and inode */
492
	inode = sysfs_get_inode(sd);
493 494 495
	if (!inode)
		return ERR_PTR(-ENOMEM);

496 497
	if (inode->i_state & I_NEW) {
		/* initialize inode according to type */
498 499
		switch (sysfs_type(sd)) {
		case SYSFS_KOBJ_ATTR:
500 501
			inode->i_size = PAGE_SIZE;
			inode->i_fop = &sysfs_file_operations;
502 503 504
			break;
		case SYSFS_KOBJ_BIN_ATTR:
			bin_attr = sd->s_elem.bin_attr.bin_attr;
505 506
			inode->i_size = bin_attr->size;
			inode->i_fop = &bin_fops;
507 508
			break;
		case SYSFS_KOBJ_LINK:
509
			inode->i_op = &sysfs_symlink_inode_operations;
510 511 512 513
			break;
		default:
			BUG();
		}
514
	}
515 516 517 518 519

	sysfs_instantiate(dentry, inode);
	sysfs_attach_dentry(sd, dentry);

	return NULL;
L
Linus Torvalds 已提交
520 521
}

522
const struct inode_operations sysfs_dir_inode_operations = {
L
Linus Torvalds 已提交
523
	.lookup		= sysfs_lookup,
524
	.setattr	= sysfs_setattr,
L
Linus Torvalds 已提交
525 526
};

527
static void remove_dir(struct sysfs_dirent *sd)
L
Linus Torvalds 已提交
528
{
529
	struct dentry *parent = sd->s_parent->s_dentry;
L
Linus Torvalds 已提交
530

531
	mutex_lock(&parent->d_inode->i_mutex);
532

533
	sysfs_unlink_sibling(sd);
534
	sd->s_flags |= SYSFS_FLAG_REMOVED;
L
Linus Torvalds 已提交
535

536
	pr_debug(" o %s removing done\n", sd->s_name);
L
Linus Torvalds 已提交
537

538
	mutex_unlock(&parent->d_inode->i_mutex);
539

540
	sysfs_drop_dentry(sd);
541 542
	sysfs_deactivate(sd);
	sysfs_put(sd);
L
Linus Torvalds 已提交
543 544
}

545
/**
 *	sysfs_remove_subdir - remove a subdirectory
 *	@sd: sysfs_dirent of the subdirectory to remove
 *
 *	Exported wrapper around remove_dir(); children of @sd are not
 *	touched.
 */
void sysfs_remove_subdir(struct sysfs_dirent *sd)
{
	remove_dir(sd);
}


551
static void __sysfs_remove_dir(struct sysfs_dirent *dir_sd)
L
Linus Torvalds 已提交
552
{
553 554
	struct sysfs_dirent *removed = NULL;
	struct sysfs_dirent **pos;
555
	struct dentry *dir;
L
Linus Torvalds 已提交
556

557
	if (!dir_sd)
L
Linus Torvalds 已提交
558 559
		return;

560 561 562 563 564
	dir = dir_sd->s_dentry;

	pr_debug("sysfs %s: removing dir\n", dir_sd->s_name);
	mutex_lock(&dir->d_inode->i_mutex);
	pos = &dir_sd->s_children;
565 566 567
	while (*pos) {
		struct sysfs_dirent *sd = *pos;

568
		if (sysfs_type(sd) && (sysfs_type(sd) & SYSFS_NOT_PINNED)) {
569
			sd->s_flags |= SYSFS_FLAG_REMOVED;
570 571 572 573 574
			*pos = sd->s_sibling;
			sd->s_sibling = removed;
			removed = sd;
		} else
			pos = &(*pos)->s_sibling;
L
Linus Torvalds 已提交
575
	}
576
	mutex_unlock(&dir->d_inode->i_mutex);
L
Linus Torvalds 已提交
577

578 579 580 581 582 583
	while (removed) {
		struct sysfs_dirent *sd = removed;

		removed = sd->s_sibling;
		sd->s_sibling = NULL;

584
		sysfs_drop_dentry(sd);
585 586 587 588
		sysfs_deactivate(sd);
		sysfs_put(sd);
	}

589
	remove_dir(dir_sd);
590 591 592 593 594 595 596 597 598 599 600 601 602
}

/**
 *	sysfs_remove_dir - remove an object's directory.
 *	@kobj:	object.
 *
 *	The only thing special about this is that we remove any files in
 *	the directory before we remove the directory, and we've inlined
 *	what used to be sysfs_rmdir() below, instead of calling separately.
 */

void sysfs_remove_dir(struct kobject * kobj)
{
603
	struct sysfs_dirent *sd = kobj->sd;
604

T
Tejun Heo 已提交
605
	spin_lock(&sysfs_assoc_lock);
606
	kobj->sd = NULL;
T
Tejun Heo 已提交
607
	spin_unlock(&sysfs_assoc_lock);
608

609
	__sysfs_remove_dir(sd);
L
Linus Torvalds 已提交
610 611
}

612
int sysfs_rename_dir(struct kobject *kobj, struct sysfs_dirent *new_parent_sd,
613
		     const char *new_name)
L
Linus Torvalds 已提交
614
{
615 616
	struct sysfs_dirent *sd = kobj->sd;
	struct dentry *new_parent = new_parent_sd->s_dentry;
T
Tejun Heo 已提交
617 618
	struct dentry *new_dentry;
	char *dup_name;
619
	int error;
L
Linus Torvalds 已提交
620

621
	if (!new_parent_sd)
622
		return -EFAULT;
L
Linus Torvalds 已提交
623 624

	down_write(&sysfs_rename_sem);
625
	mutex_lock(&new_parent->d_inode->i_mutex);
L
Linus Torvalds 已提交
626

627
	new_dentry = lookup_one_len(new_name, new_parent, strlen(new_name));
628 629 630
	if (IS_ERR(new_dentry)) {
		error = PTR_ERR(new_dentry);
		goto out_unlock;
L
Linus Torvalds 已提交
631
	}
632 633 634 635 636 637

	/* By allowing two different directories with the same
	 * d_parent we allow this routine to move between different
	 * shadows of the same directory
	 */
	error = -EINVAL;
638
	if (sd->s_parent->s_dentry->d_inode != new_parent->d_inode ||
639
	    new_dentry->d_parent->d_inode != new_parent->d_inode ||
640
	    new_dentry == sd->s_dentry)
641 642 643 644 645 646
		goto out_dput;

	error = -EEXIST;
	if (new_dentry->d_inode)
		goto out_dput;

T
Tejun Heo 已提交
647 648 649 650 651 652
	/* rename kobject and sysfs_dirent */
	error = -ENOMEM;
	new_name = dup_name = kstrdup(new_name, GFP_KERNEL);
	if (!new_name)
		goto out_drop;

653 654
	error = kobject_set_name(kobj, "%s", new_name);
	if (error)
T
Tejun Heo 已提交
655
		goto out_free;
656

T
Tejun Heo 已提交
657 658 659 660
	kfree(sd->s_name);
	sd->s_name = new_name;

	/* move under the new parent */
661
	d_add(new_dentry, NULL);
662
	d_move(sd->s_dentry, new_dentry);
663

664
	sysfs_unlink_sibling(sd);
665
	sysfs_get(new_parent_sd);
666
	sysfs_put(sd->s_parent);
667
	sd->s_parent = new_parent_sd;
668
	sysfs_link_sibling(sd);
669 670 671 672

	error = 0;
	goto out_unlock;

T
Tejun Heo 已提交
673 674
 out_free:
	kfree(dup_name);
675 676 677 678 679
 out_drop:
	d_drop(new_dentry);
 out_dput:
	dput(new_dentry);
 out_unlock:
680
	mutex_unlock(&new_parent->d_inode->i_mutex);
L
Linus Torvalds 已提交
681 682 683 684
	up_write(&sysfs_rename_sem);
	return error;
}

685 686 687 688 689 690 691
int sysfs_move_dir(struct kobject *kobj, struct kobject *new_parent)
{
	struct dentry *old_parent_dentry, *new_parent_dentry, *new_dentry;
	struct sysfs_dirent *new_parent_sd, *sd;
	int error;

	old_parent_dentry = kobj->parent ?
692
		kobj->parent->sd->s_dentry : sysfs_mount->mnt_sb->s_root;
693
	new_parent_dentry = new_parent ?
694
		new_parent->sd->s_dentry : sysfs_mount->mnt_sb->s_root;
695

M
Mark Lord 已提交
696 697
	if (old_parent_dentry->d_inode == new_parent_dentry->d_inode)
		return 0;	/* nothing to move */
698 699 700 701 702 703 704 705
again:
	mutex_lock(&old_parent_dentry->d_inode->i_mutex);
	if (!mutex_trylock(&new_parent_dentry->d_inode->i_mutex)) {
		mutex_unlock(&old_parent_dentry->d_inode->i_mutex);
		goto again;
	}

	new_parent_sd = new_parent_dentry->d_fsdata;
706
	sd = kobj->sd;
707 708 709 710 711 712 713 714 715

	new_dentry = lookup_one_len(kobj->name, new_parent_dentry,
				    strlen(kobj->name));
	if (IS_ERR(new_dentry)) {
		error = PTR_ERR(new_dentry);
		goto out;
	} else
		error = 0;
	d_add(new_dentry, NULL);
716
	d_move(sd->s_dentry, new_dentry);
717 718 719
	dput(new_dentry);

	/* Remove from old parent's list and insert into new parent's list. */
720
	sysfs_unlink_sibling(sd);
721 722 723
	sysfs_get(new_parent_sd);
	sysfs_put(sd->s_parent);
	sd->s_parent = new_parent_sd;
724
	sysfs_link_sibling(sd);
725 726 727 728 729 730 731 732

out:
	mutex_unlock(&new_parent_dentry->d_inode->i_mutex);
	mutex_unlock(&old_parent_dentry->d_inode->i_mutex);

	return error;
}

L
Linus Torvalds 已提交
733 734
static int sysfs_dir_open(struct inode *inode, struct file *file)
{
735
	struct dentry * dentry = file->f_path.dentry;
L
Linus Torvalds 已提交
736
	struct sysfs_dirent * parent_sd = dentry->d_fsdata;
737
	struct sysfs_dirent * sd;
L
Linus Torvalds 已提交
738

739
	mutex_lock(&dentry->d_inode->i_mutex);
740
	sd = sysfs_new_dirent("_DIR_", 0, 0);
741 742
	if (sd)
		sysfs_attach_dirent(sd, parent_sd, NULL);
743
	mutex_unlock(&dentry->d_inode->i_mutex);
L
Linus Torvalds 已提交
744

745 746
	file->private_data = sd;
	return sd ? 0 : -ENOMEM;
L
Linus Torvalds 已提交
747 748 749 750
}

static int sysfs_dir_close(struct inode *inode, struct file *file)
{
751
	struct dentry * dentry = file->f_path.dentry;
L
Linus Torvalds 已提交
752 753
	struct sysfs_dirent * cursor = file->private_data;

754
	mutex_lock(&dentry->d_inode->i_mutex);
755
	sysfs_unlink_sibling(cursor);
756
	mutex_unlock(&dentry->d_inode->i_mutex);
L
Linus Torvalds 已提交
757 758 759 760 761 762 763 764 765 766 767 768 769 770

	release_sysfs_dirent(cursor);

	return 0;
}

/* Relationship between s_mode and the DT_xxx types: the DT_xxx value
 * handed to filldir is bits 12-15 of s_mode.
 */
static inline unsigned char dt_type(struct sysfs_dirent *sd)
{
	return (sd->s_mode >> 12) & 0xf;
}

/**
 *	sysfs_readdir - emit the entries of a sysfs directory
 *	@filp: open directory; filp->private_data is its cursor dirent
 *	@dirent: opaque buffer passed through to @filldir
 *	@filldir: callback storing one entry; a negative return stops
 *		  the listing
 *
 *	Positions 0 and 1 produce "." and "..".  From position 2 on the
 *	cursor linked into the child list marks where to resume: it is
 *	unlinked, the entries behind it (or all entries when f_pos is
 *	exactly 2) are emitted, and it is linked back in front of the
 *	first entry that was not emitted.  Entries with sysfs_type() 0
 *	are skipped.
 *
 *	NOTE(review): the child list is walked without taking i_mutex
 *	here - presumably the caller holds it; confirm.
 *
 *	RETURNS:
 *	Always 0.
 */
static int sysfs_readdir(struct file * filp, void * dirent, filldir_t filldir)
{
	struct dentry *dentry = filp->f_path.dentry;
	struct sysfs_dirent *parent_sd = dentry->d_fsdata;
	struct sysfs_dirent *cursor = filp->private_data;
	struct sysfs_dirent **pos;
	ino_t ino;
	int i = filp->f_pos;

	switch (i) {
	case 0:
		ino = parent_sd->s_ino;
		if (filldir(dirent, ".", 1, i, ino, DT_DIR) < 0)
			break;
		filp->f_pos++;
		i++;
		/* fallthrough */
	case 1:
		/* the root has no parent and reports itself as ".." */
		if (parent_sd->s_parent)
			ino = parent_sd->s_parent->s_ino;
		else
			ino = parent_sd->s_ino;
		if (filldir(dirent, "..", 2, i, ino, DT_DIR) < 0)
			break;
		filp->f_pos++;
		i++;
		/* fallthrough */
	default:
		/* locate the link that points at the cursor */
		pos = &parent_sd->s_children;
		while (*pos != cursor)
			pos = &(*pos)->s_sibling;

		/* unlink cursor */
		*pos = cursor->s_sibling;

		/* a fresh listing starts at the head of the list */
		if (filp->f_pos == 2)
			pos = &parent_sd->s_children;

		for ( ; *pos; pos = &(*pos)->s_sibling) {
			struct sysfs_dirent *next = *pos;
			const char *name;
			int len;

			if (!sysfs_type(next))
				continue;

			name = next->s_name;
			len = strlen(name);
			ino = next->s_ino;

			if (filldir(dirent, name, len, filp->f_pos, ino,
				    dt_type(next)) < 0)
				break;

			filp->f_pos++;
		}

		/* put cursor back in */
		cursor->s_sibling = *pos;
		*pos = cursor;
	}
	return 0;
}

/**
 *	sysfs_dir_lseek - llseek for sysfs directories
 *	@file: open directory; file->private_data is its cursor dirent
 *	@offset: requested offset
 *	@origin: 0 for an absolute offset, 1 for one relative to f_pos
 *
 *	Update file->f_pos and, for positions of 2 and beyond, move the
 *	cursor in the child list so that it sits behind the first
 *	(f_pos - 2) entries with a non-zero sysfs_type(), or at the end
 *	of the list if there are fewer.  Runs under the directory
 *	inode's i_mutex.
 *
 *	RETURNS:
 *	The new position, or -EINVAL for any other @origin or a
 *	negative resulting offset.
 */
static loff_t sysfs_dir_lseek(struct file * file, loff_t offset, int origin)
{
	struct dentry *dentry = file->f_path.dentry;
	struct sysfs_dirent *sd, *cursor;
	struct sysfs_dirent **pos;
	loff_t n;

	mutex_lock(&dentry->d_inode->i_mutex);

	switch (origin) {
	case 1:
		offset += file->f_pos;
		/* fallthrough */
	case 0:
		if (offset >= 0)
			break;
		/* fallthrough */
	default:
		mutex_unlock(&dentry->d_inode->i_mutex);
		return -EINVAL;
	}

	if (offset == file->f_pos)
		goto out;

	file->f_pos = offset;
	if (file->f_pos < 2)
		goto out;

	sd = dentry->d_fsdata;
	cursor = file->private_data;
	n = file->f_pos - 2;

	sysfs_unlink_sibling(cursor);

	/* step over n countable entries, or to the end of the list */
	for (pos = &sd->s_children; n && *pos; pos = &(*pos)->s_sibling)
		if (sysfs_type(*pos))
			n--;

	cursor->s_sibling = *pos;
	*pos = cursor;

 out:
	mutex_unlock(&dentry->d_inode->i_mutex);
	return offset;
}

874 875 876 877 878 879 880 881 882 883 884 885

/**
 *	sysfs_make_shadowed_dir - Setup so a directory can be shadowed
 *	@kobj:	object we're creating shadow of.
 */

int sysfs_make_shadowed_dir(struct kobject *kobj,
	void * (*follow_link)(struct dentry *, struct nameidata *))
{
	struct inode *inode;
	struct inode_operations *i_op;

886
	inode = kobj->sd->s_dentry->d_inode;
887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912
	if (inode->i_op != &sysfs_dir_inode_operations)
		return -EINVAL;

	i_op = kmalloc(sizeof(*i_op), GFP_KERNEL);
	if (!i_op)
		return -ENOMEM;

	memcpy(i_op, &sysfs_dir_inode_operations, sizeof(*i_op));
	i_op->follow_link = follow_link;

	/* Locking of inode->i_op?
	 * Since setting i_op is a single word write and they
	 * are atomic we should be ok here.
	 */
	inode->i_op = i_op;
	return 0;
}

/**
 *	sysfs_create_shadow_dir - create a shadow directory for an object.
 *	@kobj:	object we're creating directory for.
 *
 *	sysfs_make_shadowed_dir must already have been called on this
 *	directory.
 */

913
struct sysfs_dirent *sysfs_create_shadow_dir(struct kobject *kobj)
914
{
915
	struct dentry *dir = kobj->sd->s_dentry;
T
Tejun Heo 已提交
916 917 918 919
	struct inode *inode = dir->d_inode;
	struct dentry *parent = dir->d_parent;
	struct sysfs_dirent *parent_sd = parent->d_fsdata;
	struct dentry *shadow;
920 921
	struct sysfs_dirent *sd;

922
	sd = ERR_PTR(-EINVAL);
923 924 925 926 927 928 929
	if (!sysfs_is_shadowed_inode(inode))
		goto out;

	shadow = d_alloc(parent, &dir->d_name);
	if (!shadow)
		goto nomem;

930
	sd = sysfs_new_dirent("_SHADOW_", inode->i_mode, SYSFS_DIR);
931 932
	if (!sd)
		goto nomem;
933
	sd->s_elem.dir.kobj = kobj;
T
Tejun Heo 已提交
934 935
	/* point to parent_sd but don't attach to it */
	sd->s_parent = sysfs_get(parent_sd);
936
	sysfs_attach_dirent(sd, NULL, shadow);
937 938 939 940 941 942 943 944

	d_instantiate(shadow, igrab(inode));
	inc_nlink(inode);
	inc_nlink(parent->d_inode);

	dget(shadow);		/* Extra count - pin the dentry in core */

out:
945
	return sd;
946 947
nomem:
	dput(shadow);
948
	sd = ERR_PTR(-ENOMEM);
949 950 951 952 953
	goto out;
}

/**
 *	sysfs_remove_shadow_dir - remove a shadow directory.
 *	@shadow_sd: sysfs_dirent of shadow directory
 *
 *	Hand @shadow_sd to __sysfs_remove_dir(), which removes the
 *	files in the directory before removing the directory itself.
 */

void sysfs_remove_shadow_dir(struct sysfs_dirent *shadow_sd)
{
	__sysfs_remove_dir(shadow_sd);
}

966
const struct file_operations sysfs_dir_operations = {
L
Linus Torvalds 已提交
967 968 969 970 971 972
	.open		= sysfs_dir_open,
	.release	= sysfs_dir_close,
	.llseek		= sysfs_dir_lseek,
	.read		= generic_read_dir,
	.readdir	= sysfs_readdir,
};