commoncap.c 18.7 KB
Newer Older
1
/* Common capabilities, needed by capability.o and root_plug.o
L
Linus Torvalds 已提交
2 3 4 5 6 7 8 9
 *
 *	This program is free software; you can redistribute it and/or modify
 *	it under the terms of the GNU General Public License as published by
 *	the Free Software Foundation; either version 2 of the License, or
 *	(at your option) any later version.
 *
 */

10
#include <linux/capability.h>
11
#include <linux/audit.h>
L
Linus Torvalds 已提交
12 13 14 15 16 17 18 19 20 21 22 23 24 25
#include <linux/module.h>
#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/security.h>
#include <linux/file.h>
#include <linux/mm.h>
#include <linux/mman.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/skbuff.h>
#include <linux/netlink.h>
#include <linux/ptrace.h>
#include <linux/xattr.h>
#include <linux/hugetlb.h>
26
#include <linux/mount.h>
27
#include <linux/sched.h>
28 29
#include <linux/prctl.h>
#include <linux/securebits.h>
30

L
Linus Torvalds 已提交
31 32
int cap_netlink_send(struct sock *sk, struct sk_buff *skb)
{
33
	NETLINK_CB(skb).eff_cap = current_cap();
L
Linus Torvalds 已提交
34 35 36
	return 0;
}

37
int cap_netlink_recv(struct sk_buff *skb, int cap)
L
Linus Torvalds 已提交
38
{
39
	if (!cap_raised(NETLINK_CB(skb).eff_cap, cap))
L
Linus Torvalds 已提交
40 41 42 43 44 45
		return -EPERM;
	return 0;
}

EXPORT_SYMBOL(cap_netlink_recv);

46 47 48 49 50 51
/*
 * NOTE WELL: cap_capable() cannot be used like the kernel's capable()
 * function.  That is, it has the reverse semantics: cap_capable()
 * returns 0 when a task has a capability, but the kernel's capable()
 * returns 1 for this case.
 */
52
int cap_capable(struct task_struct *tsk, int cap, int audit)
L
Linus Torvalds 已提交
53
{
54 55
	__u32 cap_raised;

L
Linus Torvalds 已提交
56
	/* Derived from include/linux/sched.h:capable. */
57 58 59 60
	rcu_read_lock();
	cap_raised = cap_raised(__task_cred(tsk)->cap_effective, cap);
	rcu_read_unlock();
	return cap_raised ? 0 : -EPERM;
L
Linus Torvalds 已提交
61 62 63 64 65 66 67 68 69
}

int cap_settime(struct timespec *ts, struct timezone *tz)
{
	if (!capable(CAP_SYS_TIME))
		return -EPERM;
	return 0;
}

70
int cap_ptrace_may_access(struct task_struct *child, unsigned int mode)
L
Linus Torvalds 已提交
71
{
72 73 74
	int ret = 0;

	rcu_read_lock();
D
David Howells 已提交
75 76
	if (!cap_issubset(__task_cred(child)->cap_permitted,
			  current_cred()->cap_permitted) &&
77 78 79 80
	    !capable(CAP_SYS_PTRACE))
		ret = -EPERM;
	rcu_read_unlock();
	return ret;
81 82 83 84
}

int cap_ptrace_traceme(struct task_struct *parent)
{
85 86 87
	int ret = 0;

	rcu_read_lock();
D
David Howells 已提交
88 89
	if (!cap_issubset(current_cred()->cap_permitted,
			  __task_cred(parent)->cap_permitted) &&
90 91 92 93
	    !has_capability(parent, CAP_SYS_PTRACE))
		ret = -EPERM;
	rcu_read_unlock();
	return ret;
L
Linus Torvalds 已提交
94 95 96 97 98
}

int cap_capget (struct task_struct *target, kernel_cap_t *effective,
		kernel_cap_t *inheritable, kernel_cap_t *permitted)
{
99
	const struct cred *cred;
100

L
Linus Torvalds 已提交
101
	/* Derived from kernel/capability.c:sys_capget. */
102 103
	rcu_read_lock();
	cred = __task_cred(target);
104 105 106
	*effective   = cred->cap_effective;
	*inheritable = cred->cap_inheritable;
	*permitted   = cred->cap_permitted;
107
	rcu_read_unlock();
L
Linus Torvalds 已提交
108 109 110
	return 0;
}

111 112 113 114 115
#ifdef CONFIG_SECURITY_FILE_CAPABILITIES

static inline int cap_inh_is_capped(void)
{
	/*
116 117 118
	 * Return 1 if changes to the inheritable set are limited
	 * to the old permitted set. That is, if the current task
	 * does *not* possess the CAP_SETPCAP capability.
119
	 */
D
David Howells 已提交
120
	return cap_capable(current, CAP_SETPCAP, SECURITY_CAP_AUDIT) != 0;
121 122
}

123 124
static inline int cap_limit_ptraced_target(void) { return 1; }

125 126 127
#else /* ie., ndef CONFIG_SECURITY_FILE_CAPABILITIES */

static inline int cap_inh_is_capped(void) { return 1; }
128 129 130 131
static inline int cap_limit_ptraced_target(void)
{
	return !capable(CAP_SETPCAP);
}
132 133 134

#endif /* def CONFIG_SECURITY_FILE_CAPABILITIES */

D
David Howells 已提交
135 136 137 138 139
int cap_capset(struct cred *new,
	       const struct cred *old,
	       const kernel_cap_t *effective,
	       const kernel_cap_t *inheritable,
	       const kernel_cap_t *permitted)
L
Linus Torvalds 已提交
140
{
D
David Howells 已提交
141 142 143 144
	if (cap_inh_is_capped() &&
	    !cap_issubset(*inheritable,
			  cap_combine(old->cap_inheritable,
				      old->cap_permitted)))
145
		/* incapable of using this inheritable set */
L
Linus Torvalds 已提交
146
		return -EPERM;
D
David Howells 已提交
147

148
	if (!cap_issubset(*inheritable,
D
David Howells 已提交
149 150
			  cap_combine(old->cap_inheritable,
				      old->cap_bset)))
151 152
		/* no new pI capabilities outside bounding set */
		return -EPERM;
L
Linus Torvalds 已提交
153 154

	/* verify restrictions on target's new Permitted set */
D
David Howells 已提交
155
	if (!cap_issubset(*permitted, old->cap_permitted))
L
Linus Torvalds 已提交
156 157 158
		return -EPERM;

	/* verify the _new_Effective_ is a subset of the _new_Permitted_ */
D
David Howells 已提交
159
	if (!cap_issubset(*effective, *permitted))
L
Linus Torvalds 已提交
160 161
		return -EPERM;

D
David Howells 已提交
162 163 164
	new->cap_effective   = *effective;
	new->cap_inheritable = *inheritable;
	new->cap_permitted   = *permitted;
L
Linus Torvalds 已提交
165 166 167
	return 0;
}

168 169
static inline void bprm_clear_caps(struct linux_binprm *bprm)
{
170
	cap_clear(bprm->cred->cap_permitted);
171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199
	bprm->cap_effective = false;
}

#ifdef CONFIG_SECURITY_FILE_CAPABILITIES

int cap_inode_need_killpriv(struct dentry *dentry)
{
	struct inode *inode = dentry->d_inode;
	int error;

	if (!inode->i_op || !inode->i_op->getxattr)
	       return 0;

	error = inode->i_op->getxattr(dentry, XATTR_NAME_CAPS, NULL, 0);
	if (error <= 0)
		return 0;
	return 1;
}

int cap_inode_killpriv(struct dentry *dentry)
{
	struct inode *inode = dentry->d_inode;

	if (!inode->i_op || !inode->i_op->removexattr)
	       return 0;

	return inode->i_op->removexattr(dentry, XATTR_NAME_CAPS);
}

200
static inline int bprm_caps_from_vfs_caps(struct cpu_vfs_cap_data *caps,
201 202
					  struct linux_binprm *bprm,
					  bool *effective)
203
{
204
	struct cred *new = bprm->cred;
205 206 207 208
	unsigned i;
	int ret = 0;

	if (caps->magic_etc & VFS_CAP_FLAGS_EFFECTIVE)
209
		*effective = true;
210 211 212 213 214 215 216 217

	CAP_FOR_EACH_U32(i) {
		__u32 permitted = caps->permitted.cap[i];
		__u32 inheritable = caps->inheritable.cap[i];

		/*
		 * pP' = (X & fP) | (pI & fI)
		 */
218 219 220
		new->cap_permitted.cap[i] =
			(new->cap_bset.cap[i] & permitted) |
			(new->cap_inheritable.cap[i] & inheritable);
221

222 223
		if (permitted & ~new->cap_permitted.cap[i])
			/* insufficient to execute correctly */
224 225 226 227 228 229 230 231
			ret = -EPERM;
	}

	/*
	 * For legacy apps, with no internal support for recognizing they
	 * do not have enough capabilities, we return an error if they are
	 * missing some "forced" (aka file-permitted) capabilities.
	 */
232
	return *effective ? ret : 0;
233 234 235 236 237
}

int get_vfs_caps_from_disk(const struct dentry *dentry, struct cpu_vfs_cap_data *cpu_caps)
{
	struct inode *inode = dentry->d_inode;
238
	__u32 magic_etc;
239
	unsigned tocopy, i;
240 241 242 243 244 245 246 247 248 249
	int size;
	struct vfs_cap_data caps;

	memset(cpu_caps, 0, sizeof(struct cpu_vfs_cap_data));

	if (!inode || !inode->i_op || !inode->i_op->getxattr)
		return -ENODATA;

	size = inode->i_op->getxattr((struct dentry *)dentry, XATTR_NAME_CAPS, &caps,
				   XATTR_CAPS_SZ);
250
	if (size == -ENODATA || size == -EOPNOTSUPP)
251 252 253 254
		/* no data, that's ok */
		return -ENODATA;
	if (size < 0)
		return size;
255

256
	if (size < sizeof(magic_etc))
257 258
		return -EINVAL;

259
	cpu_caps->magic_etc = magic_etc = le32_to_cpu(caps.magic_etc);
260

261
	switch (magic_etc & VFS_CAP_REVISION_MASK) {
262 263 264 265 266 267 268 269 270 271
	case VFS_CAP_REVISION_1:
		if (size != XATTR_CAPS_SZ_1)
			return -EINVAL;
		tocopy = VFS_CAP_U32_1;
		break;
	case VFS_CAP_REVISION_2:
		if (size != XATTR_CAPS_SZ_2)
			return -EINVAL;
		tocopy = VFS_CAP_U32_2;
		break;
272 273 274
	default:
		return -EINVAL;
	}
275

276
	CAP_FOR_EACH_U32(i) {
277 278 279 280
		if (i >= tocopy)
			break;
		cpu_caps->permitted.cap[i] = le32_to_cpu(caps.data[i].permitted);
		cpu_caps->inheritable.cap[i] = le32_to_cpu(caps.data[i].inheritable);
281
	}
282

283
	return 0;
284 285 286
}

/* Locate any VFS capabilities: */
287
static int get_file_caps(struct linux_binprm *bprm, bool *effective)
288 289 290
{
	struct dentry *dentry;
	int rc = 0;
291
	struct cpu_vfs_cap_data vcaps;
292

293 294
	bprm_clear_caps(bprm);

295 296 297
	if (!file_caps_enabled)
		return 0;

298
	if (bprm->file->f_vfsmnt->mnt_flags & MNT_NOSUID)
299 300 301 302
		return 0;

	dentry = dget(bprm->file->f_dentry);

303 304 305 306 307 308 309
	rc = get_vfs_caps_from_disk(dentry, &vcaps);
	if (rc < 0) {
		if (rc == -EINVAL)
			printk(KERN_NOTICE "%s: get_vfs_caps_from_disk returned %d for %s\n",
				__func__, rc, bprm->filename);
		else if (rc == -ENODATA)
			rc = 0;
310 311 312
		goto out;
	}

313 314 315 316
	rc = bprm_caps_from_vfs_caps(&vcaps, bprm, effective);
	if (rc == -EINVAL)
		printk(KERN_NOTICE "%s: cap_from_disk returned %d for %s\n",
		       __func__, rc, bprm->filename);
317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336

out:
	dput(dentry);
	if (rc)
		bprm_clear_caps(bprm);

	return rc;
}

#else
int cap_inode_need_killpriv(struct dentry *dentry)
{
	return 0;
}

int cap_inode_killpriv(struct dentry *dentry)
{
	return 0;
}

337
static inline int get_file_caps(struct linux_binprm *bprm, bool *effective)
338 339 340 341 342 343
{
	bprm_clear_caps(bprm);
	return 0;
}
#endif

344 345 346 347
/*
 * set up the new credentials for an exec'd task
 */
int cap_bprm_set_creds(struct linux_binprm *bprm)
L
Linus Torvalds 已提交
348
{
349 350 351
	const struct cred *old = current_cred();
	struct cred *new = bprm->cred;
	bool effective;
352
	int ret;
L
Linus Torvalds 已提交
353

354 355 356 357
	effective = false;
	ret = get_file_caps(bprm, &effective);
	if (ret < 0)
		return ret;
L
Linus Torvalds 已提交
358

359 360 361 362 363 364
	if (!issecure(SECURE_NOROOT)) {
		/*
		 * To support inheritance of root-permissions and suid-root
		 * executables under compatibility mode, we override the
		 * capability sets for the file.
		 *
365
		 * If only the real uid is 0, we do not set the effective bit.
366
		 */
367
		if (new->euid == 0 || new->uid == 0) {
368
			/* pP' = (cap_bset & ~0) | (pI & ~0) */
369 370
			new->cap_permitted = cap_combine(old->cap_bset,
							 old->cap_inheritable);
L
Linus Torvalds 已提交
371
		}
372 373
		if (new->euid == 0)
			effective = true;
L
Linus Torvalds 已提交
374
	}
375

376 377 378 379 380 381 382 383 384 385 386
	/* Don't let someone trace a set[ug]id/setpcap binary with the revised
	 * credentials unless they have the appropriate permit
	 */
	if ((new->euid != old->uid ||
	     new->egid != old->gid ||
	     !cap_issubset(new->cap_permitted, old->cap_permitted)) &&
	    bprm->unsafe & ~LSM_UNSAFE_PTRACE_CAP) {
		/* downgrade; they get no more than they had, and maybe less */
		if (!capable(CAP_SETUID)) {
			new->euid = new->uid;
			new->egid = new->gid;
L
Linus Torvalds 已提交
387
		}
388 389 390
		if (cap_limit_ptraced_target())
			new->cap_permitted = cap_intersect(new->cap_permitted,
							   old->cap_permitted);
L
Linus Torvalds 已提交
391 392
	}

393 394
	new->suid = new->fsuid = new->euid;
	new->sgid = new->fsgid = new->egid;
L
Linus Torvalds 已提交
395

396 397 398
	/* For init, we want to retain the capabilities set in the initial
	 * task.  Thus we skip the usual capability rules
	 */
399
	if (!is_global_init(current)) {
400 401
		if (effective)
			new->cap_effective = new->cap_permitted;
402
		else
D
David Howells 已提交
403
			cap_clear(new->cap_effective);
L
Linus Torvalds 已提交
404
	}
405
	bprm->cap_effective = effective;
L
Linus Torvalds 已提交
406

407 408 409 410 411 412 413 414 415 416 417 418
	/*
	 * Audit candidate if current->cap_effective is set
	 *
	 * We do not bother to audit if 3 things are true:
	 *   1) cap_effective has all caps
	 *   2) we are root
	 *   3) root is supposed to have all caps (SECURE_NOROOT)
	 * Since this is just a normal root execing a process.
	 *
	 * Number 1 above might fail if you don't have a full bset, but I think
	 * that is interesting information to audit.
	 */
D
David Howells 已提交
419 420
	if (!cap_isclear(new->cap_effective)) {
		if (!cap_issubset(CAP_FULL_SET, new->cap_effective) ||
421 422 423 424 425 426
		    new->euid != 0 || new->uid != 0 ||
		    issecure(SECURE_NOROOT)) {
			ret = audit_log_bprm_fcaps(bprm, new, old);
			if (ret < 0)
				return ret;
		}
427
	}
L
Linus Torvalds 已提交
428

D
David Howells 已提交
429
	new->securebits &= ~issecure_mask(SECURE_KEEP_CAPS);
430
	return 0;
L
Linus Torvalds 已提交
431 432
}

433 434 435 436 437 438
/*
 * determine whether a secure execution is required
 * - the creds have been committed at this point, and are no longer available
 *   through bprm
 */
int cap_bprm_secureexec(struct linux_binprm *bprm)
L
Linus Torvalds 已提交
439
{
440
	const struct cred *cred = current_cred();
441 442

	if (cred->uid != 0) {
443 444
		if (bprm->cap_effective)
			return 1;
445
		if (!cap_isclear(cred->cap_permitted))
446 447 448
			return 1;
	}

449 450
	return (cred->euid != cred->uid ||
		cred->egid != cred->gid);
L
Linus Torvalds 已提交
451 452
}

453 454
int cap_inode_setxattr(struct dentry *dentry, const char *name,
		       const void *value, size_t size, int flags)
L
Linus Torvalds 已提交
455
{
456 457 458 459 460
	if (!strcmp(name, XATTR_NAME_CAPS)) {
		if (!capable(CAP_SETFCAP))
			return -EPERM;
		return 0;
	} else if (!strncmp(name, XATTR_SECURITY_PREFIX,
L
Linus Torvalds 已提交
461 462 463 464 465 466
		     sizeof(XATTR_SECURITY_PREFIX) - 1)  &&
	    !capable(CAP_SYS_ADMIN))
		return -EPERM;
	return 0;
}

467
int cap_inode_removexattr(struct dentry *dentry, const char *name)
L
Linus Torvalds 已提交
468
{
469 470 471 472 473
	if (!strcmp(name, XATTR_NAME_CAPS)) {
		if (!capable(CAP_SETFCAP))
			return -EPERM;
		return 0;
	} else if (!strncmp(name, XATTR_SECURITY_PREFIX,
L
Linus Torvalds 已提交
474 475 476 477 478 479 480
		     sizeof(XATTR_SECURITY_PREFIX) - 1)  &&
	    !capable(CAP_SYS_ADMIN))
		return -EPERM;
	return 0;
}

/* moved from kernel/sys.c. */
481
/*
L
Linus Torvalds 已提交
482 483 484 485 486 487 488 489 490 491 492 493 494
 * cap_emulate_setxuid() fixes the effective / permitted capabilities of
 * a process after a call to setuid, setreuid, or setresuid.
 *
 *  1) When set*uiding _from_ one of {r,e,s}uid == 0 _to_ all of
 *  {r,e,s}uid != 0, the permitted and effective capabilities are
 *  cleared.
 *
 *  2) When set*uiding _from_ euid == 0 _to_ euid != 0, the effective
 *  capabilities of the process are cleared.
 *
 *  3) When set*uiding _from_ euid != 0 _to_ euid == 0, the effective
 *  capabilities are set to the permitted capabilities.
 *
495
 *  fsuid is handled elsewhere. fsuid == 0 and {r,e,s}uid!= 0 should
L
Linus Torvalds 已提交
496 497
 *  never happen.
 *
498
 *  -astor
L
Linus Torvalds 已提交
499 500 501 502 503 504 505 506 507 508 509
 *
 * cevans - New behaviour, Oct '99
 * A process may, via prctl(), elect to keep its capabilities when it
 * calls setuid() and switches away from uid==0. Both permitted and
 * effective sets will be retained.
 * Without this change, it was impossible for a daemon to drop only some
 * of its privilege. The call to setuid(!=0) would drop all privileges!
 * Keeping uid 0 is not an option because uid 0 owns too many vital
 * files..
 * Thanks to Olaf Kirch and Peter Benie for spotting this.
 */
D
David Howells 已提交
510
static inline void cap_emulate_setxuid(struct cred *new, const struct cred *old)
L
Linus Torvalds 已提交
511
{
D
David Howells 已提交
512 513
	if ((old->uid == 0 || old->euid == 0 || old->suid == 0) &&
	    (new->uid != 0 && new->euid != 0 && new->suid != 0) &&
514
	    !issecure(SECURE_KEEP_CAPS)) {
D
David Howells 已提交
515 516
		cap_clear(new->cap_permitted);
		cap_clear(new->cap_effective);
L
Linus Torvalds 已提交
517
	}
D
David Howells 已提交
518 519 520 521
	if (old->euid == 0 && new->euid != 0)
		cap_clear(new->cap_effective);
	if (old->euid != 0 && new->euid == 0)
		new->cap_effective = new->cap_permitted;
L
Linus Torvalds 已提交
522 523
}

D
David Howells 已提交
524
int cap_task_fix_setuid(struct cred *new, const struct cred *old, int flags)
L
Linus Torvalds 已提交
525 526 527 528 529 530
{
	switch (flags) {
	case LSM_SETID_RE:
	case LSM_SETID_ID:
	case LSM_SETID_RES:
		/* Copied from kernel/sys.c:setreuid/setuid/setresuid. */
D
David Howells 已提交
531 532
		if (!issecure(SECURE_NO_SETUID_FIXUP))
			cap_emulate_setxuid(new, old);
L
Linus Torvalds 已提交
533 534
		break;
	case LSM_SETID_FS:
D
David Howells 已提交
535
		/* Copied from kernel/sys.c:setfsuid. */
L
Linus Torvalds 已提交
536

D
David Howells 已提交
537 538 539 540 541 542 543 544 545 546 547 548 549
		/*
		 * FIXME - is fsuser used for all CAP_FS_MASK capabilities?
		 *          if not, we might be a bit too harsh here.
		 */
		if (!issecure(SECURE_NO_SETUID_FIXUP)) {
			if (old->fsuid == 0 && new->fsuid != 0) {
				new->cap_effective =
					cap_drop_fs_set(new->cap_effective);
			}
			if (old->fsuid != 0 && new->fsuid == 0) {
				new->cap_effective =
					cap_raise_fs_set(new->cap_effective,
							 new->cap_permitted);
L
Linus Torvalds 已提交
550 551
			}
		}
D
David Howells 已提交
552
		break;
L
Linus Torvalds 已提交
553 554 555 556 557 558 559
	default:
		return -EINVAL;
	}

	return 0;
}

560 561 562 563 564 565 566 567 568 569 570
#ifdef CONFIG_SECURITY_FILE_CAPABILITIES
/*
 * Rationale: code calling task_setscheduler, task_setioprio, and
 * task_setnice, assumes that
 *   . if capable(cap_sys_nice), then those actions should be allowed
 *   . if not capable(cap_sys_nice), but acting on your own processes,
 *   	then those actions should be allowed
 * This is insufficient now since you can call code without suid, but
 * yet with increased caps.
 * So we check for increased caps on the target process.
 */
571
static int cap_safe_nice(struct task_struct *p)
572
{
573 574 575 576 577 578 579 580
	int is_subset;

	rcu_read_lock();
	is_subset = cap_issubset(__task_cred(p)->cap_permitted,
				 current_cred()->cap_permitted);
	rcu_read_unlock();

	if (!is_subset && !capable(CAP_SYS_NICE))
581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600
		return -EPERM;
	return 0;
}

int cap_task_setscheduler (struct task_struct *p, int policy,
			   struct sched_param *lp)
{
	return cap_safe_nice(p);
}

int cap_task_setioprio (struct task_struct *p, int ioprio)
{
	return cap_safe_nice(p);
}

int cap_task_setnice (struct task_struct *p, int nice)
{
	return cap_safe_nice(p);
}

601 602 603 604 605 606 607
/*
 * called from kernel/sys.c for prctl(PR_CABSET_DROP)
 * done without task_capability_lock() because it introduces
 * no new races - i.e. only another task doing capget() on
 * this task could get inconsistent info.  There can be no
 * racing writer bc a task can only change its own caps.
 */
D
David Howells 已提交
608
static long cap_prctl_drop(struct cred *new, unsigned long cap)
609 610 611 612 613
{
	if (!capable(CAP_SETPCAP))
		return -EPERM;
	if (!cap_valid(cap))
		return -EINVAL;
D
David Howells 已提交
614 615

	cap_lower(new->cap_bset, cap);
616 617
	return 0;
}
618

619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634
#else
int cap_task_setscheduler (struct task_struct *p, int policy,
			   struct sched_param *lp)
{
	return 0;
}
int cap_task_setioprio (struct task_struct *p, int ioprio)
{
	return 0;
}
int cap_task_setnice (struct task_struct *p, int nice)
{
	return 0;
}
#endif

635
int cap_task_prctl(int option, unsigned long arg2, unsigned long arg3,
D
David Howells 已提交
636
		   unsigned long arg4, unsigned long arg5)
637
{
D
David Howells 已提交
638
	struct cred *new;
639 640
	long error = 0;

D
David Howells 已提交
641 642 643 644
	new = prepare_creds();
	if (!new)
		return -ENOMEM;

645 646
	switch (option) {
	case PR_CAPBSET_READ:
D
David Howells 已提交
647
		error = -EINVAL;
648
		if (!cap_valid(arg2))
D
David Howells 已提交
649 650 651 652
			goto error;
		error = !!cap_raised(new->cap_bset, arg2);
		goto no_change;

653 654
#ifdef CONFIG_SECURITY_FILE_CAPABILITIES
	case PR_CAPBSET_DROP:
D
David Howells 已提交
655 656 657 658
		error = cap_prctl_drop(new, arg2);
		if (error < 0)
			goto error;
		goto changed;
659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679

	/*
	 * The next four prctl's remain to assist with transitioning a
	 * system from legacy UID=0 based privilege (when filesystem
	 * capabilities are not in use) to a system using filesystem
	 * capabilities only - as the POSIX.1e draft intended.
	 *
	 * Note:
	 *
	 *  PR_SET_SECUREBITS =
	 *      issecure_mask(SECURE_KEEP_CAPS_LOCKED)
	 *    | issecure_mask(SECURE_NOROOT)
	 *    | issecure_mask(SECURE_NOROOT_LOCKED)
	 *    | issecure_mask(SECURE_NO_SETUID_FIXUP)
	 *    | issecure_mask(SECURE_NO_SETUID_FIXUP_LOCKED)
	 *
	 * will ensure that the current process and all of its
	 * children will be locked into a pure
	 * capability-based-privilege environment.
	 */
	case PR_SET_SECUREBITS:
D
David Howells 已提交
680 681 682 683 684 685
		error = -EPERM;
		if ((((new->securebits & SECURE_ALL_LOCKS) >> 1)
		     & (new->securebits ^ arg2))			/*[1]*/
		    || ((new->securebits & SECURE_ALL_LOCKS & ~arg2))	/*[2]*/
		    || (arg2 & ~(SECURE_ALL_LOCKS | SECURE_ALL_BITS))	/*[3]*/
		    || (cap_capable(current, CAP_SETPCAP, SECURITY_CAP_AUDIT) != 0) /*[4]*/
686 687 688 689 690 691 692
			/*
			 * [1] no changing of bits that are locked
			 * [2] no unlocking of locks
			 * [3] no setting of unsupported bits
			 * [4] doing anything requires privilege (go read about
			 *     the "sendmail capabilities bug")
			 */
D
David Howells 已提交
693 694 695 696 697 698
		    )
			/* cannot change a locked bit */
			goto error;
		new->securebits = arg2;
		goto changed;

699
	case PR_GET_SECUREBITS:
D
David Howells 已提交
700 701
		error = new->securebits;
		goto no_change;
702 703 704 705 706 707

#endif /* def CONFIG_SECURITY_FILE_CAPABILITIES */

	case PR_GET_KEEPCAPS:
		if (issecure(SECURE_KEEP_CAPS))
			error = 1;
D
David Howells 已提交
708 709
		goto no_change;

710
	case PR_SET_KEEPCAPS:
D
David Howells 已提交
711
		error = -EINVAL;
712
		if (arg2 > 1) /* Note, we rely on arg2 being unsigned here */
D
David Howells 已提交
713 714 715 716 717 718
			goto error;
		error = -EPERM;
		if (issecure(SECURE_KEEP_CAPS_LOCKED))
			goto error;
		if (arg2)
			new->securebits |= issecure_mask(SECURE_KEEP_CAPS);
719
		else
D
David Howells 已提交
720 721
			new->securebits &= ~issecure_mask(SECURE_KEEP_CAPS);
		goto changed;
722 723 724

	default:
		/* No functionality available - continue with default */
D
David Howells 已提交
725 726
		error = -ENOSYS;
		goto error;
727 728 729
	}

	/* Functionality provided */
D
David Howells 已提交
730 731 732 733 734 735 736 737
changed:
	return commit_creds(new);

no_change:
	error = 0;
error:
	abort_creds(new);
	return error;
L
Linus Torvalds 已提交
738 739 740 741 742 743 744 745 746
}

int cap_syslog (int type)
{
	if ((type != 3 && type != 10) && !capable(CAP_SYS_ADMIN))
		return -EPERM;
	return 0;
}

747
int cap_vm_enough_memory(struct mm_struct *mm, long pages)
L
Linus Torvalds 已提交
748 749 750
{
	int cap_sys_admin = 0;

751
	if (cap_capable(current, CAP_SYS_ADMIN, SECURITY_CAP_NOAUDIT) == 0)
L
Linus Torvalds 已提交
752
		cap_sys_admin = 1;
753
	return __vm_enough_memory(mm, pages, cap_sys_admin);
L
Linus Torvalds 已提交
754
}