Merge branch 'akpm'
[linux-2.6/next.git] / kernel / kthread.c
blob1c36deaae2f1fee24ff03d8518ff9b4fa6afdfc3
1 /* Kernel thread helper functions.
2 * Copyright (C) 2004 IBM Corporation, Rusty Russell.
4 * Creation is done via kthreadd, so that we get a clean environment
5 * even if we're invoked from userspace (think modprobe, hotplug cpu,
6 * etc.).
7 */
8 #include <linux/sched.h>
9 #include <linux/kthread.h>
10 #include <linux/completion.h>
11 #include <linux/err.h>
12 #include <linux/cpuset.h>
13 #include <linux/unistd.h>
14 #include <linux/file.h>
15 #include <linux/export.h>
16 #include <linux/mutex.h>
17 #include <linux/slab.h>
18 #include <linux/freezer.h>
19 #include <trace/events/sched.h>
21 static DEFINE_SPINLOCK(kthread_create_lock);
22 static LIST_HEAD(kthread_create_list);
23 struct task_struct *kthreadd_task;
25 struct kthread_create_info
27 /* Information passed to kthread() from kthreadd. */
28 int (*threadfn)(void *data);
29 void *data;
30 int node;
32 /* Result passed back to kthread_create() from kthreadd. */
33 struct task_struct *result;
34 struct completion done;
36 struct list_head list;
39 struct kthread {
40 int should_stop;
41 void *data;
42 struct completion exited;
45 #define to_kthread(tsk) \
46 container_of((tsk)->vfork_done, struct kthread, exited)
48 /**
49 * kthread_should_stop - should this kthread return now?
51 * When someone calls kthread_stop() on your kthread, it will be woken
52 * and this will return true. You should then return, and your return
53 * value will be passed through to kthread_stop().
55 int kthread_should_stop(void)
57 return to_kthread(current)->should_stop;
59 EXPORT_SYMBOL(kthread_should_stop);
61 /**
62 * kthread_freezable_should_stop - should this freezable kthread return now?
63 * @was_frozen: optional out parameter, indicates whether %current was frozen
65 * kthread_should_stop() for freezable kthreads, which will enter
66 * refrigerator if necessary. This function is safe from kthread_stop() /
67 * freezer deadlock and freezable kthreads should use this function instead
68 * of calling try_to_freeze() directly.
70 bool kthread_freezable_should_stop(bool *was_frozen)
72 bool frozen = false;
74 might_sleep();
76 if (unlikely(freezing(current)))
77 frozen = __refrigerator(true);
79 if (was_frozen)
80 *was_frozen = frozen;
82 return kthread_should_stop();
84 EXPORT_SYMBOL_GPL(kthread_freezable_should_stop);
86 /**
87 * kthread_data - return data value specified on kthread creation
88 * @task: kthread task in question
90 * Return the data value specified when kthread @task was created.
91 * The caller is responsible for ensuring the validity of @task when
92 * calling this function.
94 void *kthread_data(struct task_struct *task)
96 return to_kthread(task)->data;
99 static int kthread(void *_create)
101 /* Copy data: it's on kthread's stack */
102 struct kthread_create_info *create = _create;
103 int (*threadfn)(void *data) = create->threadfn;
104 void *data = create->data;
105 struct kthread self;
106 int ret;
108 self.should_stop = 0;
109 self.data = data;
110 init_completion(&self.exited);
111 current->vfork_done = &self.exited;
113 /* OK, tell user we're spawned, wait for stop or wakeup */
114 __set_current_state(TASK_UNINTERRUPTIBLE);
115 create->result = current;
116 complete(&create->done);
117 schedule();
119 ret = -EINTR;
120 if (!self.should_stop)
121 ret = threadfn(data);
123 /* we can't just return, we must preserve "self" on stack */
124 do_exit(ret);
127 /* called from do_fork() to get node information for about to be created task */
128 int tsk_fork_get_node(struct task_struct *tsk)
130 #ifdef CONFIG_NUMA
131 if (tsk == kthreadd_task)
132 return tsk->pref_node_fork;
133 #endif
134 return numa_node_id();
137 static void create_kthread(struct kthread_create_info *create)
139 int pid;
141 #ifdef CONFIG_NUMA
142 current->pref_node_fork = create->node;
143 #endif
144 /* We want our own signal handler (we take no signals by default). */
145 pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
146 if (pid < 0) {
147 create->result = ERR_PTR(pid);
148 complete(&create->done);
153 * kthread_create_on_node - create a kthread.
154 * @threadfn: the function to run until signal_pending(current).
155 * @data: data ptr for @threadfn.
156 * @node: memory node number.
157 * @namefmt: printf-style name for the thread.
159 * Description: This helper function creates and names a kernel
160 * thread. The thread will be stopped: use wake_up_process() to start
161 * it. See also kthread_run().
163 * If thread is going to be bound on a particular cpu, give its node
164 * in @node, to get NUMA affinity for kthread stack, or else give -1.
165 * When woken, the thread will run @threadfn() with @data as its
166 * argument. @threadfn() can either call do_exit() directly if it is a
167 * standalone thread for which no one will call kthread_stop(), or
168 * return when 'kthread_should_stop()' is true (which means
169 * kthread_stop() has been called). The return value should be zero
170 * or a negative error number; it will be passed to kthread_stop().
172 * Returns a task_struct or ERR_PTR(-ENOMEM).
174 struct task_struct *kthread_create_on_node(int (*threadfn)(void *data),
175 void *data,
176 int node,
177 const char namefmt[],
178 ...)
180 struct kthread_create_info create;
182 create.threadfn = threadfn;
183 create.data = data;
184 create.node = node;
185 init_completion(&create.done);
187 spin_lock(&kthread_create_lock);
188 list_add_tail(&create.list, &kthread_create_list);
189 spin_unlock(&kthread_create_lock);
191 wake_up_process(kthreadd_task);
192 wait_for_completion(&create.done);
194 if (!IS_ERR(create.result)) {
195 static const struct sched_param param = { .sched_priority = 0 };
196 va_list args;
198 va_start(args, namefmt);
199 vsnprintf(create.result->comm, sizeof(create.result->comm),
200 namefmt, args);
201 va_end(args);
203 * root may have changed our (kthreadd's) priority or CPU mask.
204 * The kernel thread should not inherit these properties.
206 sched_setscheduler_nocheck(create.result, SCHED_NORMAL, &param);
207 set_cpus_allowed_ptr(create.result, cpu_all_mask);
209 return create.result;
211 EXPORT_SYMBOL(kthread_create_on_node);
214 * kthread_bind - bind a just-created kthread to a cpu.
215 * @p: thread created by kthread_create().
216 * @cpu: cpu (might not be online, must be possible) for @k to run on.
218 * Description: This function is equivalent to set_cpus_allowed(),
219 * except that @cpu doesn't need to be online, and the thread must be
220 * stopped (i.e., just returned from kthread_create()).
222 void kthread_bind(struct task_struct *p, unsigned int cpu)
224 /* Must have done schedule() in kthread() before we set_task_cpu */
225 if (!wait_task_inactive(p, TASK_UNINTERRUPTIBLE)) {
226 WARN_ON(1);
227 return;
230 /* It's safe because the task is inactive. */
231 do_set_cpus_allowed(p, cpumask_of(cpu));
232 p->flags |= PF_THREAD_BOUND;
234 EXPORT_SYMBOL(kthread_bind);
237 * kthread_stop - stop a thread created by kthread_create().
238 * @k: thread created by kthread_create().
240 * Sets kthread_should_stop() for @k to return true, wakes it, and
241 * waits for it to exit. This can also be called after kthread_create()
242 * instead of calling wake_up_process(): the thread will exit without
243 * calling threadfn().
245 * If threadfn() may call do_exit() itself, the caller must ensure
246 * task_struct can't go away.
248 * Returns the result of threadfn(), or %-EINTR if wake_up_process()
249 * was never called.
251 int kthread_stop(struct task_struct *k)
253 struct kthread *kthread;
254 int ret;
256 trace_sched_kthread_stop(k);
257 get_task_struct(k);
259 kthread = to_kthread(k);
260 barrier(); /* it might have exited */
261 if (k->vfork_done != NULL) {
262 kthread->should_stop = 1;
263 wake_up_process(k);
264 wait_for_completion(&kthread->exited);
266 ret = k->exit_code;
268 put_task_struct(k);
269 trace_sched_kthread_stop_ret(ret);
271 return ret;
273 EXPORT_SYMBOL(kthread_stop);
275 int kthreadd(void *unused)
277 struct task_struct *tsk = current;
279 /* Setup a clean context for our children to inherit. */
280 set_task_comm(tsk, "kthreadd");
281 ignore_signals(tsk);
282 set_cpus_allowed_ptr(tsk, cpu_all_mask);
283 set_mems_allowed(node_states[N_HIGH_MEMORY]);
285 current->flags |= PF_NOFREEZE | PF_FREEZER_NOSIG;
287 for (;;) {
288 set_current_state(TASK_INTERRUPTIBLE);
289 if (list_empty(&kthread_create_list))
290 schedule();
291 __set_current_state(TASK_RUNNING);
293 spin_lock(&kthread_create_lock);
294 while (!list_empty(&kthread_create_list)) {
295 struct kthread_create_info *create;
297 create = list_entry(kthread_create_list.next,
298 struct kthread_create_info, list);
299 list_del_init(&create->list);
300 spin_unlock(&kthread_create_lock);
302 create_kthread(create);
304 spin_lock(&kthread_create_lock);
306 spin_unlock(&kthread_create_lock);
309 return 0;
312 void __init_kthread_worker(struct kthread_worker *worker,
313 const char *name,
314 struct lock_class_key *key)
316 spin_lock_init(&worker->lock);
317 lockdep_set_class_and_name(&worker->lock, key, name);
318 INIT_LIST_HEAD(&worker->work_list);
319 worker->task = NULL;
321 EXPORT_SYMBOL_GPL(__init_kthread_worker);
324 * kthread_worker_fn - kthread function to process kthread_worker
325 * @worker_ptr: pointer to initialized kthread_worker
327 * This function can be used as @threadfn to kthread_create() or
328 * kthread_run() with @worker_ptr argument pointing to an initialized
329 * kthread_worker. The started kthread will process work_list until
330 * the it is stopped with kthread_stop(). A kthread can also call
331 * this function directly after extra initialization.
333 * Different kthreads can be used for the same kthread_worker as long
334 * as there's only one kthread attached to it at any given time. A
335 * kthread_worker without an attached kthread simply collects queued
336 * kthread_works.
338 int kthread_worker_fn(void *worker_ptr)
340 struct kthread_worker *worker = worker_ptr;
341 struct kthread_work *work;
343 WARN_ON(worker->task);
344 worker->task = current;
345 repeat:
346 set_current_state(TASK_INTERRUPTIBLE); /* mb paired w/ kthread_stop */
348 if (kthread_should_stop()) {
349 __set_current_state(TASK_RUNNING);
350 spin_lock_irq(&worker->lock);
351 worker->task = NULL;
352 spin_unlock_irq(&worker->lock);
353 return 0;
356 work = NULL;
357 spin_lock_irq(&worker->lock);
358 if (!list_empty(&worker->work_list)) {
359 work = list_first_entry(&worker->work_list,
360 struct kthread_work, node);
361 list_del_init(&work->node);
363 spin_unlock_irq(&worker->lock);
365 if (work) {
366 __set_current_state(TASK_RUNNING);
367 work->func(work);
368 smp_wmb(); /* wmb worker-b0 paired with flush-b1 */
369 work->done_seq = work->queue_seq;
370 smp_mb(); /* mb worker-b1 paired with flush-b0 */
371 if (atomic_read(&work->flushing))
372 wake_up_all(&work->done);
373 } else if (!freezing(current))
374 schedule();
376 try_to_freeze();
377 goto repeat;
379 EXPORT_SYMBOL_GPL(kthread_worker_fn);
382 * queue_kthread_work - queue a kthread_work
383 * @worker: target kthread_worker
384 * @work: kthread_work to queue
386 * Queue @work to work processor @task for async execution. @task
387 * must have been created with kthread_worker_create(). Returns %true
388 * if @work was successfully queued, %false if it was already pending.
390 bool queue_kthread_work(struct kthread_worker *worker,
391 struct kthread_work *work)
393 bool ret = false;
394 unsigned long flags;
396 spin_lock_irqsave(&worker->lock, flags);
397 if (list_empty(&work->node)) {
398 list_add_tail(&work->node, &worker->work_list);
399 work->queue_seq++;
400 if (likely(worker->task))
401 wake_up_process(worker->task);
402 ret = true;
404 spin_unlock_irqrestore(&worker->lock, flags);
405 return ret;
407 EXPORT_SYMBOL_GPL(queue_kthread_work);
410 * flush_kthread_work - flush a kthread_work
411 * @work: work to flush
413 * If @work is queued or executing, wait for it to finish execution.
415 void flush_kthread_work(struct kthread_work *work)
417 int seq = work->queue_seq;
419 atomic_inc(&work->flushing);
422 * mb flush-b0 paired with worker-b1, to make sure either
423 * worker sees the above increment or we see done_seq update.
425 smp_mb__after_atomic_inc();
427 /* A - B <= 0 tests whether B is in front of A regardless of overflow */
428 wait_event(work->done, seq - work->done_seq <= 0);
429 atomic_dec(&work->flushing);
432 * rmb flush-b1 paired with worker-b0, to make sure our caller
433 * sees every change made by work->func().
435 smp_mb__after_atomic_dec();
437 EXPORT_SYMBOL_GPL(flush_kthread_work);
439 struct kthread_flush_work {
440 struct kthread_work work;
441 struct completion done;
444 static void kthread_flush_work_fn(struct kthread_work *work)
446 struct kthread_flush_work *fwork =
447 container_of(work, struct kthread_flush_work, work);
448 complete(&fwork->done);
452 * flush_kthread_worker - flush all current works on a kthread_worker
453 * @worker: worker to flush
455 * Wait until all currently executing or pending works on @worker are
456 * finished.
458 void flush_kthread_worker(struct kthread_worker *worker)
460 struct kthread_flush_work fwork = {
461 KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
462 COMPLETION_INITIALIZER_ONSTACK(fwork.done),
465 queue_kthread_work(worker, &fwork.work);
466 wait_for_completion(&fwork.done);
468 EXPORT_SYMBOL_GPL(flush_kthread_worker);