kthread.c 17.0 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3
/* Kernel thread helper functions.
 *   Copyright (C) 2004 IBM Corporation, Rusty Russell.
 *
 * Creation is done via kthreadd, so that we get a clean environment
 * even if we're invoked from userspace (think modprobe, hotplug cpu,
 * etc.).
 */
#include <linux/sched.h>
#include <linux/kthread.h>
#include <linux/completion.h>
#include <linux/err.h>
12
#include <linux/cpuset.h>
L
Linus Torvalds 已提交
13 14
#include <linux/unistd.h>
#include <linux/file.h>
15
#include <linux/export.h>
A
Arjan van de Ven 已提交
16
#include <linux/mutex.h>
T
Tejun Heo 已提交
17 18
#include <linux/slab.h>
#include <linux/freezer.h>
19
#include <linux/ptrace.h>
20
#include <trace/events/sched.h>
L
Linus Torvalds 已提交
21

22 23 24
/* Taken around every add to / removal from kthread_create_list. */
static DEFINE_SPINLOCK(kthread_create_lock);
/*
 * Pending creation requests: kthread_create_on_node() appends entries and
 * kthreadd() removes them one at a time.
 */
static LIST_HEAD(kthread_create_list);
/*
 * Task woken by kthread_create_on_node() after queueing a request.
 * NOTE(review): it is not assigned in this file - presumably the task
 * running kthreadd(); confirm against the boot code.
 */
struct task_struct *kthreadd_task;
L
Linus Torvalds 已提交
25 26 27

struct kthread_create_info
{
28
	/* Information passed to kthread() from kthreadd. */
L
Linus Torvalds 已提交
29 30
	int (*threadfn)(void *data);
	void *data;
31
	int node;
L
Linus Torvalds 已提交
32

33
	/* Result passed back to kthread_create() from kthreadd. */
L
Linus Torvalds 已提交
34 35
	struct task_struct *result;
	struct completion done;
36

37
	struct list_head list;
L
Linus Torvalds 已提交
38 39
};

O
Oleg Nesterov 已提交
40
struct kthread {
41 42
	unsigned long flags;
	unsigned int cpu;
T
Tejun Heo 已提交
43
	void *data;
44
	struct completion parked;
O
Oleg Nesterov 已提交
45
	struct completion exited;
L
Linus Torvalds 已提交
46 47
};

48 49 50 51 52 53 54
/* Bit numbers used with the bitops on struct kthread's flags word. */
enum KTHREAD_BITS {
	/* set by kthread_create_on_cpu(); makes unpark rebind the thread */
	KTHREAD_IS_PER_CPU	= 0,
	/* set by kthread_stop(); reported by kthread_should_stop() */
	KTHREAD_SHOULD_STOP	= 1,
	/* set by kthread_park(); cleared by __kthread_unpark() */
	KTHREAD_SHOULD_PARK	= 2,
	/* set by the thread itself in __kthread_parkme() */
	KTHREAD_IS_PARKED	= 3,
};

55 56 57 58 59 60 61 62 63 64 65 66 67 68 69
/*
 * Recover the enclosing struct kthread from a pointer to its 'exited'
 * completion.  No NULL check is performed on the argument.
 */
#define __to_kthread(done)	\
	container_of(done, struct kthread, exited)

/*
 * Map task @k to its struct kthread via k->vfork_done.  The pointer is
 * used as-is, without a NULL check; to_live_kthread() is the checked
 * variant.
 */
static inline struct kthread *to_kthread(struct task_struct *k)
{
	struct completion *done = k->vfork_done;

	return __to_kthread(done);
}

/*
 * Checked variant of to_kthread(): takes a single snapshot of
 * k->vfork_done and returns the matching struct kthread, or NULL when the
 * snapshot is NULL.
 */
static struct kthread *to_live_kthread(struct task_struct *k)
{
	struct completion *done = ACCESS_ONCE(k->vfork_done);

	if (unlikely(!done))
		return NULL;
	return __to_kthread(done);
}
L
Linus Torvalds 已提交
70

71 72 73
/**
 * kthread_should_stop - should this kthread return now?
 *
74
 * When someone calls kthread_stop() on your kthread, it will be woken
75 76 77
 * and this will return true.  You should then return, and your return
 * value will be passed through to kthread_stop().
 */
78
bool kthread_should_stop(void)
L
Linus Torvalds 已提交
79
{
80
	return test_bit(KTHREAD_SHOULD_STOP, &to_kthread(current)->flags);
L
Linus Torvalds 已提交
81 82 83
}
EXPORT_SYMBOL(kthread_should_stop);

84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99
/**
 * kthread_should_park - should this kthread park now?
 *
 * When someone calls kthread_park() on your kthread, it will be woken
 * and this will return true.  You should then do the necessary
 * cleanup and call kthread_parkme()
 *
 * Similar to kthread_should_stop(), but this keeps the thread alive
 * and in a park position. kthread_unpark() "restarts" the thread and
 * calls the thread function again.
 */
bool kthread_should_park(void)
{
	return test_bit(KTHREAD_SHOULD_PARK, &to_kthread(current)->flags);
}

100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124
/**
 * kthread_freezable_should_stop - kthread_should_stop() for freezable kthreads
 * @was_frozen: optional out parameter; when non-NULL it receives whether
 *		%current went through the refrigerator during this call
 *
 * If a freeze of %current is in progress the thread enters the
 * refrigerator first, then the stop request is evaluated.  Freezable
 * kthreads should use this helper instead of calling try_to_freeze()
 * directly, as it is safe against the kthread_stop() / freezer deadlock.
 *
 * May sleep.
 *
 * Return: the value of kthread_should_stop().
 */
bool kthread_freezable_should_stop(bool *was_frozen)
{
	bool did_freeze;

	might_sleep();

	if (unlikely(freezing(current)))
		did_freeze = __refrigerator(true);
	else
		did_freeze = false;

	if (was_frozen != NULL)
		*was_frozen = did_freeze;

	return kthread_should_stop();
}
EXPORT_SYMBOL_GPL(kthread_freezable_should_stop);

T
Tejun Heo 已提交
125 126 127 128 129 130 131 132 133 134 135 136 137
/**
 * kthread_data - return data value specified on kthread creation
 * @task: kthread task in question
 *
 * Return the data value specified when kthread @task was created.
 * The caller is responsible for ensuring the validity of @task when
 * calling this function.
 */
void *kthread_data(struct task_struct *task)
{
	return to_kthread(task)->data;
}

138 139
static void __kthread_parkme(struct kthread *self)
{
140
	__set_current_state(TASK_PARKED);
141 142 143 144
	while (test_bit(KTHREAD_SHOULD_PARK, &self->flags)) {
		if (!test_and_set_bit(KTHREAD_IS_PARKED, &self->flags))
			complete(&self->parked);
		schedule();
145
		__set_current_state(TASK_PARKED);
146 147 148 149 150 151 152 153 154 155
	}
	clear_bit(KTHREAD_IS_PARKED, &self->flags);
	__set_current_state(TASK_RUNNING);
}

/*
 * Park the calling kthread: sleeps in __kthread_parkme() for as long as a
 * park request is pending on %current.
 */
void kthread_parkme(void)
{
	struct kthread *self = to_kthread(current);

	__kthread_parkme(self);
}

L
Linus Torvalds 已提交
156 157
static int kthread(void *_create)
{
O
Oleg Nesterov 已提交
158
	/* Copy data: it's on kthread's stack */
L
Linus Torvalds 已提交
159
	struct kthread_create_info *create = _create;
O
Oleg Nesterov 已提交
160 161 162 163
	int (*threadfn)(void *data) = create->threadfn;
	void *data = create->data;
	struct kthread self;
	int ret;
L
Linus Torvalds 已提交
164

165
	self.flags = 0;
T
Tejun Heo 已提交
166
	self.data = data;
O
Oleg Nesterov 已提交
167
	init_completion(&self.exited);
168
	init_completion(&self.parked);
O
Oleg Nesterov 已提交
169
	current->vfork_done = &self.exited;
L
Linus Torvalds 已提交
170 171

	/* OK, tell user we're spawned, wait for stop or wakeup */
172
	__set_current_state(TASK_UNINTERRUPTIBLE);
173
	create->result = current;
174
	complete(&create->done);
L
Linus Torvalds 已提交
175 176
	schedule();

O
Oleg Nesterov 已提交
177
	ret = -EINTR;
L
Linus Torvalds 已提交
178

179 180 181 182
	if (!test_bit(KTHREAD_SHOULD_STOP, &self.flags)) {
		__kthread_parkme(&self);
		ret = threadfn(data);
	}
O
Oleg Nesterov 已提交
183 184
	/* we can't just return, we must preserve "self" on stack */
	do_exit(ret);
L
Linus Torvalds 已提交
185 186
}

187 188 189 190 191 192 193 194 195 196
/*
 * Called from do_fork() to pick the node for the task about to be created.
 * With CONFIG_NUMA, a fork performed by kthreadd uses the node recorded in
 * its pref_node_fork field; every other case uses numa_node_id().
 */
int tsk_fork_get_node(struct task_struct *tsk)
{
#ifdef CONFIG_NUMA
	if (tsk != kthreadd_task)
		return numa_node_id();
	return tsk->pref_node_fork;
#else
	return numa_node_id();
#endif
}

197
static void create_kthread(struct kthread_create_info *create)
L
Linus Torvalds 已提交
198 199 200
{
	int pid;

201 202 203
#ifdef CONFIG_NUMA
	current->pref_node_fork = create->node;
#endif
L
Linus Torvalds 已提交
204 205
	/* We want our own signal handler (we take no signals by default). */
	pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
206
	if (pid < 0) {
L
Linus Torvalds 已提交
207
		create->result = ERR_PTR(pid);
208 209
		complete(&create->done);
	}
L
Linus Torvalds 已提交
210 211
}

212
/**
213
 * kthread_create_on_node - create a kthread.
214 215
 * @threadfn: the function to run until signal_pending(current).
 * @data: data ptr for @threadfn.
216
 * @node: memory node number.
217 218 219 220
 * @namefmt: printf-style name for the thread.
 *
 * Description: This helper function creates and names a kernel
 * thread.  The thread will be stopped: use wake_up_process() to start
221
 * it.  See also kthread_run().
222
 *
223 224
 * If thread is going to be bound on a particular cpu, give its node
 * in @node, to get NUMA affinity for kthread stack, or else give -1.
225
 * When woken, the thread will run @threadfn() with @data as its
226
 * argument. @threadfn() can either call do_exit() directly if it is a
L
Lucas De Marchi 已提交
227
 * standalone thread for which no one will call kthread_stop(), or
228 229 230 231 232 233
 * return when 'kthread_should_stop()' is true (which means
 * kthread_stop() has been called).  The return value should be zero
 * or a negative error number; it will be passed to kthread_stop().
 *
 * Returns a task_struct or ERR_PTR(-ENOMEM).
 */
234
struct task_struct *kthread_create_on_node(int (*threadfn)(void *data),
235
					   void *data, int node,
236 237
					   const char namefmt[],
					   ...)
L
Linus Torvalds 已提交
238 239 240 241 242
{
	struct kthread_create_info create;

	create.threadfn = threadfn;
	create.data = data;
243
	create.node = node;
L
Linus Torvalds 已提交
244
	init_completion(&create.done);
245 246 247 248 249

	spin_lock(&kthread_create_lock);
	list_add_tail(&create.list, &kthread_create_list);
	spin_unlock(&kthread_create_lock);

250
	wake_up_process(kthreadd_task);
251 252
	wait_for_completion(&create.done);

L
Linus Torvalds 已提交
253
	if (!IS_ERR(create.result)) {
254
		static const struct sched_param param = { .sched_priority = 0 };
L
Linus Torvalds 已提交
255
		va_list args;
256

L
Linus Torvalds 已提交
257 258 259 260
		va_start(args, namefmt);
		vsnprintf(create.result->comm, sizeof(create.result->comm),
			  namefmt, args);
		va_end(args);
261 262 263 264 265 266
		/*
		 * root may have changed our (kthreadd's) priority or CPU mask.
		 * The kernel thread should not inherit these properties.
		 */
		sched_setscheduler_nocheck(create.result, SCHED_NORMAL, &param);
		set_cpus_allowed_ptr(create.result, cpu_all_mask);
L
Linus Torvalds 已提交
267 268 269
	}
	return create.result;
}
270
EXPORT_SYMBOL(kthread_create_on_node);
L
Linus Torvalds 已提交
271

272
static void __kthread_bind(struct task_struct *p, unsigned int cpu, long state)
273
{
274 275 276 277 278
	/* Must have done schedule() in kthread() before we set_task_cpu */
	if (!wait_task_inactive(p, state)) {
		WARN_ON(1);
		return;
	}
279 280
	/* It's safe because the task is inactive. */
	do_set_cpus_allowed(p, cpumask_of(cpu));
281
	p->flags |= PF_NO_SETAFFINITY;
282 283
}

284 285 286 287 288 289 290 291 292 293 294
/**
 * kthread_bind - bind a just-created kthread to a cpu.
 * @p: thread created by kthread_create().
 * @cpu: cpu (might not be online, must be possible) for @k to run on.
 *
 * Description: This function is equivalent to set_cpus_allowed(),
 * except that @cpu doesn't need to be online, and the thread must be
 * stopped (i.e., just returned from kthread_create()).
 */
void kthread_bind(struct task_struct *p, unsigned int cpu)
{
295
	__kthread_bind(p, cpu, TASK_UNINTERRUPTIBLE);
296 297 298
}
EXPORT_SYMBOL(kthread_bind);

299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326
/**
 * kthread_create_on_cpu - Create a cpu bound kthread
 * @threadfn: the function to run until signal_pending(current).
 * @data: data ptr for @threadfn.
 * @cpu: The cpu on which the thread should be bound,
 * @namefmt: printf-style name for the thread. Format is restricted
 *	     to "name.*%u". Code fills in cpu number.
 *
 * Description: This helper function creates and names a kernel thread
 * The thread will be woken and put into park mode.
 */
struct task_struct *kthread_create_on_cpu(int (*threadfn)(void *data),
					  void *data, unsigned int cpu,
					  const char *namefmt)
{
	struct task_struct *p;

	p = kthread_create_on_node(threadfn, data, cpu_to_node(cpu), namefmt,
				   cpu);
	if (IS_ERR(p))
		return p;
	set_bit(KTHREAD_IS_PER_CPU, &to_kthread(p)->flags);
	to_kthread(p)->cpu = cpu;
	/* Park the thread to get it out of TASK_UNINTERRUPTIBLE state */
	kthread_park(p);
	return p;
}

327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342
/*
 * Withdraw the park request on @k (whose bookkeeping is @kthread) and, if
 * the thread had actually parked, rebind it when it is a per-cpu thread
 * and wake it out of TASK_PARKED.
 */
static void __kthread_unpark(struct task_struct *k, struct kthread *kthread)
{
	clear_bit(KTHREAD_SHOULD_PARK, &kthread->flags);

	/*
	 * IS_PARKED is cleared on this side too, because nobody waits for
	 * the task to leave the park code.  Otherwise a park request issued
	 * before it got there could observe a stale IS_PARKED bit that is
	 * just about to be cleared.
	 */
	if (!test_and_clear_bit(KTHREAD_IS_PARKED, &kthread->flags))
		return;

	if (test_bit(KTHREAD_IS_PER_CPU, &kthread->flags))
		__kthread_bind(k, kthread->cpu, TASK_PARKED);
	wake_up_state(k, TASK_PARKED);
}

343 344 345 346 347 348 349 350 351 352
/**
 * kthread_unpark - unpark a thread created by kthread_create().
 * @k:		thread created by kthread_create().
 *
 * Sets kthread_should_park() for @k to return false and, if @k was
 * parked, wakes it.  If the thread is marked percpu then it is bound to
 * its cpu again before the wakeup.  This function does not wait for the
 * thread to leave the park code.
 *
 * Does nothing if @k has no live kthread (its vfork_done pointer is NULL).
 */
void kthread_unpark(struct task_struct *k)
{
	struct kthread *kthread = to_live_kthread(k);

	if (kthread)
		__kthread_unpark(k, kthread);
}

/**
 * kthread_park - park a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_park() for @k to return true, wakes it, and
 * waits for it to return. This can also be called after kthread_create()
 * instead of calling wake_up_process(): the thread will park without
 * calling threadfn().
 *
 * Returns 0 if the thread is parked, -ENOSYS if the thread exited.
 * If called by the kthread itself just the park bit is set.
 */
int kthread_park(struct task_struct *k)
{
373
	struct kthread *kthread = to_live_kthread(k);
374 375 376 377 378 379 380 381 382 383 384 385 386 387 388
	int ret = -ENOSYS;

	if (kthread) {
		if (!test_bit(KTHREAD_IS_PARKED, &kthread->flags)) {
			set_bit(KTHREAD_SHOULD_PARK, &kthread->flags);
			if (k != current) {
				wake_up_process(k);
				wait_for_completion(&kthread->parked);
			}
		}
		ret = 0;
	}
	return ret;
}

389 390 391 392 393
/**
 * kthread_stop - stop a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_stop() for @k to return true, wakes it, and
394 395 396 397 398 399
 * waits for it to exit. This can also be called after kthread_create()
 * instead of calling wake_up_process(): the thread will exit without
 * calling threadfn().
 *
 * If threadfn() may call do_exit() itself, the caller must ensure
 * task_struct can't go away.
400 401 402 403
 *
 * Returns the result of threadfn(), or %-EINTR if wake_up_process()
 * was never called.
 */
L
Linus Torvalds 已提交
404 405
int kthread_stop(struct task_struct *k)
{
406
	struct kthread *kthread;
L
Linus Torvalds 已提交
407 408
	int ret;

409
	trace_sched_kthread_stop(k);
410 411 412

	get_task_struct(k);
	kthread = to_live_kthread(k);
413 414
	if (kthread) {
		set_bit(KTHREAD_SHOULD_STOP, &kthread->flags);
415
		__kthread_unpark(k, kthread);
O
Oleg Nesterov 已提交
416 417 418 419
		wake_up_process(k);
		wait_for_completion(&kthread->exited);
	}
	ret = k->exit_code;
L
Linus Torvalds 已提交
420
	put_task_struct(k);
421

422
	trace_sched_kthread_stop_ret(ret);
L
Linus Torvalds 已提交
423 424
	return ret;
}
425
EXPORT_SYMBOL(kthread_stop);
L
Linus Torvalds 已提交
426

427
int kthreadd(void *unused)
L
Linus Torvalds 已提交
428
{
429
	struct task_struct *tsk = current;
L
Linus Torvalds 已提交
430

431
	/* Setup a clean context for our children to inherit. */
432
	set_task_comm(tsk, "kthreadd");
433
	ignore_signals(tsk);
434
	set_cpus_allowed_ptr(tsk, cpu_all_mask);
435
	set_mems_allowed(node_states[N_MEMORY]);
436

437
	current->flags |= PF_NOFREEZE;
438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462

	for (;;) {
		set_current_state(TASK_INTERRUPTIBLE);
		if (list_empty(&kthread_create_list))
			schedule();
		__set_current_state(TASK_RUNNING);

		spin_lock(&kthread_create_lock);
		while (!list_empty(&kthread_create_list)) {
			struct kthread_create_info *create;

			create = list_entry(kthread_create_list.next,
					    struct kthread_create_info, list);
			list_del_init(&create->list);
			spin_unlock(&kthread_create_lock);

			create_kthread(create);

			spin_lock(&kthread_create_lock);
		}
		spin_unlock(&kthread_create_lock);
	}

	return 0;
}
T
Tejun Heo 已提交
463

Y
Yong Zhang 已提交
464 465 466 467 468 469 470 471 472 473 474
/*
 * Initialise @worker: no task attached, empty work list, and a spinlock
 * whose lockdep class and name are taken from @key and @name.
 */
void __init_kthread_worker(struct kthread_worker *worker,
				const char *name,
				struct lock_class_key *key)
{
	worker->task = NULL;
	INIT_LIST_HEAD(&worker->work_list);

	spin_lock_init(&worker->lock);
	lockdep_set_class_and_name(&worker->lock, key, name);
}
EXPORT_SYMBOL_GPL(__init_kthread_worker);

T
Tejun Heo 已提交
475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514
/**
 * kthread_worker_fn - kthread function to process kthread_worker
 * @worker_ptr: pointer to initialized kthread_worker
 *
 * This function can be used as @threadfn to kthread_create() or
 * kthread_run() with @worker_ptr argument pointing to an initialized
 * kthread_worker.  The started kthread will process work_list until
 * it is stopped with kthread_stop().  A kthread can also call
 * this function directly after extra initialization.
 *
 * Different kthreads can be used for the same kthread_worker as long
 * as there's only one kthread attached to it at any given time.  A
 * kthread_worker without an attached kthread simply collects queued
 * kthread_works.
 *
 * Returns 0 once kthread_should_stop() is true; the worker is detached
 * (worker->task set to NULL) before returning.
 */
int kthread_worker_fn(void *worker_ptr)
{
	struct kthread_worker *worker = worker_ptr;
	struct kthread_work *work;

	/* Only one kthread may be attached to a worker at a time. */
	WARN_ON(worker->task);
	worker->task = current;
repeat:
	set_current_state(TASK_INTERRUPTIBLE);	/* mb paired w/ kthread_stop */

	if (kthread_should_stop()) {
		__set_current_state(TASK_RUNNING);
		spin_lock_irq(&worker->lock);
		worker->task = NULL;
		spin_unlock_irq(&worker->lock);
		return 0;
	}

	/* Dequeue the first pending work, if any, under the worker lock. */
	work = NULL;
	spin_lock_irq(&worker->lock);
	if (!list_empty(&worker->work_list)) {
		work = list_first_entry(&worker->work_list,
					struct kthread_work, node);
		list_del_init(&work->node);
	}
	/* Recorded so flush_kthread_work() can tell what is executing. */
	worker->current_work = work;
	spin_unlock_irq(&worker->lock);

	if (work) {
		__set_current_state(TASK_RUNNING);
		work->func(work);
	} else if (!freezing(current))
		schedule();

	try_to_freeze();
	goto repeat;
}
EXPORT_SYMBOL_GPL(kthread_worker_fn);

529 530 531 532 533 534 535 536
/*
 * insert @work before @pos in @worker
 *
 * The caller must hold worker->lock.  @work is tagged with @worker and the
 * attached kthread, if there is one, is woken.
 */
static void insert_kthread_work(struct kthread_worker *worker,
			       struct kthread_work *work,
			       struct list_head *pos)
{
	lockdep_assert_held(&worker->lock);

	list_add_tail(&work->node, pos);
	work->worker = worker;
	if (likely(worker->task))
		wake_up_process(worker->task);
}

T
Tejun Heo 已提交
542 543 544 545 546 547 548 549 550 551 552 553 554 555 556 557 558
/**
 * queue_kthread_work - queue a kthread_work
 * @worker: target kthread_worker
 * @work: kthread_work to queue
 *
 * Queue @work to work processor @task for async execution.  @task
 * must have been created with kthread_worker_create().  Returns %true
 * if @work was successfully queued, %false if it was already pending.
 */
bool queue_kthread_work(struct kthread_worker *worker,
			struct kthread_work *work)
{
	bool ret = false;
	unsigned long flags;

	spin_lock_irqsave(&worker->lock, flags);
	if (list_empty(&work->node)) {
559
		insert_kthread_work(worker, work, &worker->work_list);
T
Tejun Heo 已提交
560 561 562 563 564 565 566
		ret = true;
	}
	spin_unlock_irqrestore(&worker->lock, flags);
	return ret;
}
EXPORT_SYMBOL_GPL(queue_kthread_work);

567 568 569 570 571 572 573 574 575 576 577 578
/*
 * Marker work item used by the flush helpers: @work is queued on a worker
 * and, when it runs, kthread_flush_work_fn() completes @done.
 *
 * The field order must not change: the flush helpers initialise this
 * struct positionally.
 */
struct kthread_flush_work {
	struct kthread_work	work;	/* the queued item; func is kthread_flush_work_fn */
	struct completion	done;	/* completed when @work executes */
};

/*
 * Work function of a flush marker: @work is embedded in a
 * struct kthread_flush_work whose completion is signalled here.
 */
static void kthread_flush_work_fn(struct kthread_work *work)
{
	complete(&container_of(work, struct kthread_flush_work, work)->done);
}

T
Tejun Heo 已提交
579 580 581 582 583 584 585 586
/**
 * flush_kthread_work - flush a kthread_work
 * @work: work to flush
 *
 * If @work is queued or executing, wait for it to finish execution.
 */
void flush_kthread_work(struct kthread_work *work)
{
587 588 589 590 591 592 593 594 595 596 597
	struct kthread_flush_work fwork = {
		KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
		COMPLETION_INITIALIZER_ONSTACK(fwork.done),
	};
	struct kthread_worker *worker;
	bool noop = false;

retry:
	worker = work->worker;
	if (!worker)
		return;
T
Tejun Heo 已提交
598

599 600 601 602 603
	spin_lock_irq(&worker->lock);
	if (work->worker != worker) {
		spin_unlock_irq(&worker->lock);
		goto retry;
	}
T
Tejun Heo 已提交
604

605 606 607 608 609 610
	if (!list_empty(&work->node))
		insert_kthread_work(worker, &fwork.work, work->node.next);
	else if (worker->current_work == work)
		insert_kthread_work(worker, &fwork.work, worker->work_list.next);
	else
		noop = true;
T
Tejun Heo 已提交
611

612
	spin_unlock_irq(&worker->lock);
T
Tejun Heo 已提交
613

614 615
	if (!noop)
		wait_for_completion(&fwork.done);
T
Tejun Heo 已提交
616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636
}
EXPORT_SYMBOL_GPL(flush_kthread_work);

/**
 * flush_kthread_worker - flush all current works on a kthread_worker
 * @worker: worker to flush
 *
 * Wait until all currently executing or pending works on @worker are
 * finished.
 */
void flush_kthread_worker(struct kthread_worker *worker)
{
	struct kthread_flush_work fwork = {
		KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
		COMPLETION_INITIALIZER_ONSTACK(fwork.done),
	};

	queue_kthread_work(worker, &fwork.work);
	wait_for_completion(&fwork.done);
}
EXPORT_SYMBOL_GPL(flush_kthread_worker);