blob: b6d216a92639fdeea3049a47b361660e7e44fa09 [file] [log] [blame]
/* Kernel thread helper functions.
 *   Copyright (C) 2004 IBM Corporation, Rusty Russell.
 *
 * Creation is done via kthreadd, so that we get a clean environment
 * even if we're invoked from userspace (think modprobe, hotplug cpu,
 * etc.).
 */
8#include <linux/sched.h>
9#include <linux/kthread.h>
10#include <linux/completion.h>
11#include <linux/err.h>
Miao Xie58568d22009-06-16 15:31:49 -070012#include <linux/cpuset.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <linux/unistd.h>
14#include <linux/file.h>
Paul Gortmaker9984de12011-05-23 14:51:41 -040015#include <linux/export.h>
Arjan van de Ven97d1f152006-03-23 03:00:24 -080016#include <linux/mutex.h>
Tejun Heob56c0d82010-06-29 10:07:09 +020017#include <linux/slab.h>
18#include <linux/freezer.h>
Steven Rostedtad8d75f2009-04-14 19:39:12 -040019#include <trace/events/sched.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020
/* Protects kthread_create_list. */
static DEFINE_SPINLOCK(kthread_create_lock);
/*
 * Pending creation requests: kthread_create_on_node() appends to this
 * list and kthreadd() drains it.
 */
static LIST_HEAD(kthread_create_list);
/*
 * Task woken by kthread_create_on_node() after a request is queued.
 * It is not assigned anywhere in this file.
 */
struct task_struct *kthreadd_task;
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
25struct kthread_create_info
26{
Eric W. Biederman73c27992007-05-09 02:34:32 -070027 /* Information passed to kthread() from kthreadd. */
Linus Torvalds1da177e2005-04-16 15:20:36 -070028 int (*threadfn)(void *data);
29 void *data;
Eric Dumazet207205a2011-03-22 16:30:44 -070030 int node;
Linus Torvalds1da177e2005-04-16 15:20:36 -070031
Eric W. Biederman73c27992007-05-09 02:34:32 -070032 /* Result passed back to kthread_create() from kthreadd. */
Linus Torvalds1da177e2005-04-16 15:20:36 -070033 struct task_struct *result;
34 struct completion done;
David Howells65f27f32006-11-22 14:55:48 +000035
Eric W. Biederman73c27992007-05-09 02:34:32 -070036 struct list_head list;
Linus Torvalds1da177e2005-04-16 15:20:36 -070037};
38
Oleg Nesterov63706172009-06-17 16:27:45 -070039struct kthread {
40 int should_stop;
Tejun Heo82805ab2010-06-29 10:07:09 +020041 void *data;
Oleg Nesterov63706172009-06-17 16:27:45 -070042 struct completion exited;
Linus Torvalds1da177e2005-04-16 15:20:36 -070043};
44
/*
 * Map a task back to its struct kthread through ->vfork_done, which
 * kthread() points at the embedded 'exited' completion.  Only meaningful
 * for tasks that were started through kthread().
 */
#define to_kthread(tsk)	container_of((tsk)->vfork_done, struct kthread, exited)
Linus Torvalds1da177e2005-04-16 15:20:36 -070047
Randy Dunlap9e37bd32006-06-25 05:49:19 -070048/**
49 * kthread_should_stop - should this kthread return now?
50 *
Robert P. J. Day72fd4a32007-02-10 01:45:59 -080051 * When someone calls kthread_stop() on your kthread, it will be woken
Randy Dunlap9e37bd32006-06-25 05:49:19 -070052 * and this will return true. You should then return, and your return
53 * value will be passed through to kthread_stop().
54 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070055int kthread_should_stop(void)
56{
Oleg Nesterov63706172009-06-17 16:27:45 -070057 return to_kthread(current)->should_stop;
Linus Torvalds1da177e2005-04-16 15:20:36 -070058}
59EXPORT_SYMBOL(kthread_should_stop);
60
Tejun Heo82805ab2010-06-29 10:07:09 +020061/**
62 * kthread_data - return data value specified on kthread creation
63 * @task: kthread task in question
64 *
65 * Return the data value specified when kthread @task was created.
66 * The caller is responsible for ensuring the validity of @task when
67 * calling this function.
68 */
69void *kthread_data(struct task_struct *task)
70{
71 return to_kthread(task)->data;
72}
73
Linus Torvalds1da177e2005-04-16 15:20:36 -070074static int kthread(void *_create)
75{
Eric W. Biederman73c27992007-05-09 02:34:32 -070076 /* Copy data: it's on kthread's stack */
Oleg Nesterov63706172009-06-17 16:27:45 -070077 struct kthread_create_info *create = _create;
78 int (*threadfn)(void *data) = create->threadfn;
79 void *data = create->data;
80 struct kthread self;
81 int ret;
82
83 self.should_stop = 0;
Tejun Heo82805ab2010-06-29 10:07:09 +020084 self.data = data;
Oleg Nesterov63706172009-06-17 16:27:45 -070085 init_completion(&self.exited);
86 current->vfork_done = &self.exited;
Linus Torvalds1da177e2005-04-16 15:20:36 -070087
Linus Torvalds1da177e2005-04-16 15:20:36 -070088 /* OK, tell user we're spawned, wait for stop or wakeup */
Oleg Nesterova076e4b2007-05-23 13:57:27 -070089 __set_current_state(TASK_UNINTERRUPTIBLE);
Vitaliy Gusev3217ab92009-04-09 09:50:35 -060090 create->result = current;
Oleg Nesterovcdd140b2009-06-17 16:27:43 -070091 complete(&create->done);
Linus Torvalds1da177e2005-04-16 15:20:36 -070092 schedule();
93
Oleg Nesterov63706172009-06-17 16:27:45 -070094 ret = -EINTR;
95 if (!self.should_stop)
Linus Torvalds1da177e2005-04-16 15:20:36 -070096 ret = threadfn(data);
97
Oleg Nesterov63706172009-06-17 16:27:45 -070098 /* we can't just return, we must preserve "self" on stack */
99 do_exit(ret);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100}
101
/*
 * Called from do_fork() to pick the memory node for a task that is
 * about to be created by @tsk.
 *
 * With CONFIG_NUMA, kthreadd reports the node stashed in its
 * pref_node_fork field (see create_kthread()); every other caller, and
 * every !CONFIG_NUMA build, gets numa_node_id().
 */
int tsk_fork_get_node(struct task_struct *tsk)
{
#ifdef CONFIG_NUMA
	if (tsk != kthreadd_task)
		return numa_node_id();
	return tsk->pref_node_fork;
#else
	return numa_node_id();
#endif
}
111
Eric W. Biederman73c27992007-05-09 02:34:32 -0700112static void create_kthread(struct kthread_create_info *create)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 int pid;
115
Eric Dumazet207205a2011-03-22 16:30:44 -0700116#ifdef CONFIG_NUMA
117 current->pref_node_fork = create->node;
118#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119 /* We want our own signal handler (we take no signals by default). */
120 pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
Oleg Nesterovcdd140b2009-06-17 16:27:43 -0700121 if (pid < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700122 create->result = ERR_PTR(pid);
Oleg Nesterovcdd140b2009-06-17 16:27:43 -0700123 complete(&create->done);
124 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125}
126
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700127/**
Eric Dumazet207205a2011-03-22 16:30:44 -0700128 * kthread_create_on_node - create a kthread.
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700129 * @threadfn: the function to run until signal_pending(current).
130 * @data: data ptr for @threadfn.
Eric Dumazet207205a2011-03-22 16:30:44 -0700131 * @node: memory node number.
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700132 * @namefmt: printf-style name for the thread.
133 *
134 * Description: This helper function creates and names a kernel
135 * thread. The thread will be stopped: use wake_up_process() to start
Anton Blanchard301ba042010-02-09 15:07:40 +1100136 * it. See also kthread_run().
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700137 *
Eric Dumazet207205a2011-03-22 16:30:44 -0700138 * If thread is going to be bound on a particular cpu, give its node
139 * in @node, to get NUMA affinity for kthread stack, or else give -1.
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700140 * When woken, the thread will run @threadfn() with @data as its
Robert P. J. Day72fd4a32007-02-10 01:45:59 -0800141 * argument. @threadfn() can either call do_exit() directly if it is a
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300142 * standalone thread for which no one will call kthread_stop(), or
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700143 * return when 'kthread_should_stop()' is true (which means
144 * kthread_stop() has been called). The return value should be zero
145 * or a negative error number; it will be passed to kthread_stop().
146 *
147 * Returns a task_struct or ERR_PTR(-ENOMEM).
148 */
Eric Dumazet207205a2011-03-22 16:30:44 -0700149struct task_struct *kthread_create_on_node(int (*threadfn)(void *data),
150 void *data,
151 int node,
152 const char namefmt[],
153 ...)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700154{
155 struct kthread_create_info create;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700156
157 create.threadfn = threadfn;
158 create.data = data;
Eric Dumazet207205a2011-03-22 16:30:44 -0700159 create.node = node;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160 init_completion(&create.done);
161
Eric W. Biederman73c27992007-05-09 02:34:32 -0700162 spin_lock(&kthread_create_lock);
163 list_add_tail(&create.list, &kthread_create_list);
Eric W. Biederman73c27992007-05-09 02:34:32 -0700164 spin_unlock(&kthread_create_lock);
165
Dmitry Adamushkocbd9b672008-04-29 00:59:23 -0700166 wake_up_process(kthreadd_task);
Eric W. Biederman73c27992007-05-09 02:34:32 -0700167 wait_for_completion(&create.done);
168
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169 if (!IS_ERR(create.result)) {
Peter Zijlstrac9b5f502011-01-07 13:41:40 +0100170 static const struct sched_param param = { .sched_priority = 0 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171 va_list args;
Oleg Nesterov1c993152009-04-09 09:50:36 -0600172
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 va_start(args, namefmt);
174 vsnprintf(create.result->comm, sizeof(create.result->comm),
175 namefmt, args);
176 va_end(args);
Oleg Nesterov1c993152009-04-09 09:50:36 -0600177 /*
178 * root may have changed our (kthreadd's) priority or CPU mask.
179 * The kernel thread should not inherit these properties.
180 */
181 sched_setscheduler_nocheck(create.result, SCHED_NORMAL, &param);
Oleg Nesterov1c993152009-04-09 09:50:36 -0600182 set_cpus_allowed_ptr(create.result, cpu_all_mask);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184 return create.result;
185}
Eric Dumazet207205a2011-03-22 16:30:44 -0700186EXPORT_SYMBOL(kthread_create_on_node);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700188/**
Peter Zijlstra881232b2009-12-16 18:04:39 +0100189 * kthread_bind - bind a just-created kthread to a cpu.
190 * @p: thread created by kthread_create().
191 * @cpu: cpu (might not be online, must be possible) for @k to run on.
192 *
193 * Description: This function is equivalent to set_cpus_allowed(),
194 * except that @cpu doesn't need to be online, and the thread must be
195 * stopped (i.e., just returned from kthread_create()).
196 */
197void kthread_bind(struct task_struct *p, unsigned int cpu)
198{
199 /* Must have done schedule() in kthread() before we set_task_cpu */
200 if (!wait_task_inactive(p, TASK_UNINTERRUPTIBLE)) {
201 WARN_ON(1);
202 return;
203 }
204
KOSAKI Motohiro1e1b6c52011-05-19 15:08:58 +0900205 /* It's safe because the task is inactive. */
206 do_set_cpus_allowed(p, cpumask_of(cpu));
Peter Zijlstra881232b2009-12-16 18:04:39 +0100207 p->flags |= PF_THREAD_BOUND;
208}
209EXPORT_SYMBOL(kthread_bind);
210
211/**
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700212 * kthread_stop - stop a thread created by kthread_create().
213 * @k: thread created by kthread_create().
214 *
215 * Sets kthread_should_stop() for @k to return true, wakes it, and
Oleg Nesterov9ae26022009-06-19 02:51:13 +0200216 * waits for it to exit. This can also be called after kthread_create()
217 * instead of calling wake_up_process(): the thread will exit without
218 * calling threadfn().
219 *
220 * If threadfn() may call do_exit() itself, the caller must ensure
221 * task_struct can't go away.
Randy Dunlap9e37bd32006-06-25 05:49:19 -0700222 *
223 * Returns the result of threadfn(), or %-EINTR if wake_up_process()
224 * was never called.
225 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226int kthread_stop(struct task_struct *k)
227{
Oleg Nesterov63706172009-06-17 16:27:45 -0700228 struct kthread *kthread;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 int ret;
230
Oleg Nesterov63706172009-06-17 16:27:45 -0700231 trace_sched_kthread_stop(k);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232 get_task_struct(k);
233
Oleg Nesterov63706172009-06-17 16:27:45 -0700234 kthread = to_kthread(k);
235 barrier(); /* it might have exited */
236 if (k->vfork_done != NULL) {
237 kthread->should_stop = 1;
238 wake_up_process(k);
239 wait_for_completion(&kthread->exited);
240 }
241 ret = k->exit_code;
Mathieu Desnoyers0a16b602008-07-18 12:16:17 -0400242
Linus Torvalds1da177e2005-04-16 15:20:36 -0700243 put_task_struct(k);
Mathieu Desnoyers0a16b602008-07-18 12:16:17 -0400244 trace_sched_kthread_stop_ret(ret);
245
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246 return ret;
247}
Adrian Bunk52e92e52006-07-14 00:24:05 -0700248EXPORT_SYMBOL(kthread_stop);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249
Satyam Sharmae804a4a2007-07-31 00:39:16 -0700250int kthreadd(void *unused)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251{
Eric W. Biederman73c27992007-05-09 02:34:32 -0700252 struct task_struct *tsk = current;
Eric W. Biederman73c27992007-05-09 02:34:32 -0700253
Satyam Sharmae804a4a2007-07-31 00:39:16 -0700254 /* Setup a clean context for our children to inherit. */
Eric W. Biederman73c27992007-05-09 02:34:32 -0700255 set_task_comm(tsk, "kthreadd");
Oleg Nesterov10ab8252007-05-09 02:34:37 -0700256 ignore_signals(tsk);
Rusty Russell1a2142a2009-03-30 22:05:10 -0600257 set_cpus_allowed_ptr(tsk, cpu_all_mask);
Miao Xie5ab116c2010-03-23 13:35:34 -0700258 set_mems_allowed(node_states[N_HIGH_MEMORY]);
Eric W. Biederman73c27992007-05-09 02:34:32 -0700259
Rafael J. Wysockiebb12db2008-06-11 22:04:29 +0200260 current->flags |= PF_NOFREEZE | PF_FREEZER_NOSIG;
Eric W. Biederman73c27992007-05-09 02:34:32 -0700261
262 for (;;) {
263 set_current_state(TASK_INTERRUPTIBLE);
264 if (list_empty(&kthread_create_list))
265 schedule();
266 __set_current_state(TASK_RUNNING);
267
268 spin_lock(&kthread_create_lock);
269 while (!list_empty(&kthread_create_list)) {
270 struct kthread_create_info *create;
271
272 create = list_entry(kthread_create_list.next,
273 struct kthread_create_info, list);
274 list_del_init(&create->list);
275 spin_unlock(&kthread_create_lock);
276
277 create_kthread(create);
278
279 spin_lock(&kthread_create_lock);
280 }
281 spin_unlock(&kthread_create_lock);
282 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283
284 return 0;
285}
Tejun Heob56c0d82010-06-29 10:07:09 +0200286
Yong Zhang4f32e9b2010-12-22 10:27:53 +0100287void __init_kthread_worker(struct kthread_worker *worker,
288 const char *name,
289 struct lock_class_key *key)
290{
291 spin_lock_init(&worker->lock);
292 lockdep_set_class_and_name(&worker->lock, key, name);
293 INIT_LIST_HEAD(&worker->work_list);
294 worker->task = NULL;
295}
296EXPORT_SYMBOL_GPL(__init_kthread_worker);
297
Tejun Heob56c0d82010-06-29 10:07:09 +0200298/**
299 * kthread_worker_fn - kthread function to process kthread_worker
300 * @worker_ptr: pointer to initialized kthread_worker
301 *
302 * This function can be used as @threadfn to kthread_create() or
303 * kthread_run() with @worker_ptr argument pointing to an initialized
304 * kthread_worker. The started kthread will process work_list until
305 * the it is stopped with kthread_stop(). A kthread can also call
306 * this function directly after extra initialization.
307 *
308 * Different kthreads can be used for the same kthread_worker as long
309 * as there's only one kthread attached to it at any given time. A
310 * kthread_worker without an attached kthread simply collects queued
311 * kthread_works.
312 */
313int kthread_worker_fn(void *worker_ptr)
314{
315 struct kthread_worker *worker = worker_ptr;
316 struct kthread_work *work;
317
318 WARN_ON(worker->task);
319 worker->task = current;
320repeat:
321 set_current_state(TASK_INTERRUPTIBLE); /* mb paired w/ kthread_stop */
322
323 if (kthread_should_stop()) {
324 __set_current_state(TASK_RUNNING);
325 spin_lock_irq(&worker->lock);
326 worker->task = NULL;
327 spin_unlock_irq(&worker->lock);
328 return 0;
329 }
330
331 work = NULL;
332 spin_lock_irq(&worker->lock);
333 if (!list_empty(&worker->work_list)) {
334 work = list_first_entry(&worker->work_list,
335 struct kthread_work, node);
336 list_del_init(&work->node);
337 }
338 spin_unlock_irq(&worker->lock);
339
340 if (work) {
341 __set_current_state(TASK_RUNNING);
342 work->func(work);
343 smp_wmb(); /* wmb worker-b0 paired with flush-b1 */
344 work->done_seq = work->queue_seq;
345 smp_mb(); /* mb worker-b1 paired with flush-b0 */
346 if (atomic_read(&work->flushing))
347 wake_up_all(&work->done);
348 } else if (!freezing(current))
349 schedule();
350
351 try_to_freeze();
352 goto repeat;
353}
354EXPORT_SYMBOL_GPL(kthread_worker_fn);
355
356/**
357 * queue_kthread_work - queue a kthread_work
358 * @worker: target kthread_worker
359 * @work: kthread_work to queue
360 *
361 * Queue @work to work processor @task for async execution. @task
362 * must have been created with kthread_worker_create(). Returns %true
363 * if @work was successfully queued, %false if it was already pending.
364 */
365bool queue_kthread_work(struct kthread_worker *worker,
366 struct kthread_work *work)
367{
368 bool ret = false;
369 unsigned long flags;
370
371 spin_lock_irqsave(&worker->lock, flags);
372 if (list_empty(&work->node)) {
373 list_add_tail(&work->node, &worker->work_list);
374 work->queue_seq++;
375 if (likely(worker->task))
376 wake_up_process(worker->task);
377 ret = true;
378 }
379 spin_unlock_irqrestore(&worker->lock, flags);
380 return ret;
381}
382EXPORT_SYMBOL_GPL(queue_kthread_work);
383
384/**
385 * flush_kthread_work - flush a kthread_work
386 * @work: work to flush
387 *
388 * If @work is queued or executing, wait for it to finish execution.
389 */
390void flush_kthread_work(struct kthread_work *work)
391{
392 int seq = work->queue_seq;
393
394 atomic_inc(&work->flushing);
395
396 /*
397 * mb flush-b0 paired with worker-b1, to make sure either
398 * worker sees the above increment or we see done_seq update.
399 */
400 smp_mb__after_atomic_inc();
401
402 /* A - B <= 0 tests whether B is in front of A regardless of overflow */
403 wait_event(work->done, seq - work->done_seq <= 0);
404 atomic_dec(&work->flushing);
405
406 /*
407 * rmb flush-b1 paired with worker-b0, to make sure our caller
408 * sees every change made by work->func().
409 */
410 smp_mb__after_atomic_dec();
411}
412EXPORT_SYMBOL_GPL(flush_kthread_work);
413
414struct kthread_flush_work {
415 struct kthread_work work;
416 struct completion done;
417};
418
419static void kthread_flush_work_fn(struct kthread_work *work)
420{
421 struct kthread_flush_work *fwork =
422 container_of(work, struct kthread_flush_work, work);
423 complete(&fwork->done);
424}
425
426/**
427 * flush_kthread_worker - flush all current works on a kthread_worker
428 * @worker: worker to flush
429 *
430 * Wait until all currently executing or pending works on @worker are
431 * finished.
432 */
433void flush_kthread_worker(struct kthread_worker *worker)
434{
435 struct kthread_flush_work fwork = {
436 KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
437 COMPLETION_INITIALIZER_ONSTACK(fwork.done),
438 };
439
440 queue_kthread_work(worker, &fwork.work);
441 wait_for_completion(&fwork.done);
442}
443EXPORT_SYMBOL_GPL(flush_kthread_worker);