kthread_worker: reorganize to prepare for flush_kthread_work() reimplementation
[linux-2.6-block.git] / kernel / kthread.c
CommitLineData
1da177e4
LT
1/* Kernel thread helper functions.
2 * Copyright (C) 2004 IBM Corporation, Rusty Russell.
3 *
73c27992 4 * Creation is done via kthreadd, so that we get a clean environment
1da177e4
LT
5 * even if we're invoked from userspace (think modprobe, hotplug cpu,
6 * etc.).
7 */
8#include <linux/sched.h>
9#include <linux/kthread.h>
10#include <linux/completion.h>
11#include <linux/err.h>
58568d2a 12#include <linux/cpuset.h>
1da177e4
LT
13#include <linux/unistd.h>
14#include <linux/file.h>
9984de1a 15#include <linux/export.h>
97d1f15b 16#include <linux/mutex.h>
b56c0d89
TH
17#include <linux/slab.h>
18#include <linux/freezer.h>
ad8d75ff 19#include <trace/events/sched.h>
1da177e4 20
73c27992
EB
21static DEFINE_SPINLOCK(kthread_create_lock);
22static LIST_HEAD(kthread_create_list);
23struct task_struct *kthreadd_task;
1da177e4
LT
24
25struct kthread_create_info
26{
73c27992 27 /* Information passed to kthread() from kthreadd. */
1da177e4
LT
28 int (*threadfn)(void *data);
29 void *data;
207205a2 30 int node;
1da177e4 31
73c27992 32 /* Result passed back to kthread_create() from kthreadd. */
1da177e4
LT
33 struct task_struct *result;
34 struct completion done;
65f27f38 35
73c27992 36 struct list_head list;
1da177e4
LT
37};
38
63706172
ON
39struct kthread {
40 int should_stop;
82805ab7 41 void *data;
63706172 42 struct completion exited;
1da177e4
LT
43};
44
63706172
ON
45#define to_kthread(tsk) \
46 container_of((tsk)->vfork_done, struct kthread, exited)
1da177e4 47
9e37bd30
RD
48/**
49 * kthread_should_stop - should this kthread return now?
50 *
72fd4a35 51 * When someone calls kthread_stop() on your kthread, it will be woken
9e37bd30
RD
52 * and this will return true. You should then return, and your return
53 * value will be passed through to kthread_stop().
54 */
1da177e4
LT
55int kthread_should_stop(void)
56{
63706172 57 return to_kthread(current)->should_stop;
1da177e4
LT
58}
59EXPORT_SYMBOL(kthread_should_stop);
60
8a32c441
TH
61/**
62 * kthread_freezable_should_stop - should this freezable kthread return now?
63 * @was_frozen: optional out parameter, indicates whether %current was frozen
64 *
65 * kthread_should_stop() for freezable kthreads, which will enter
66 * refrigerator if necessary. This function is safe from kthread_stop() /
67 * freezer deadlock and freezable kthreads should use this function instead
68 * of calling try_to_freeze() directly.
69 */
70bool kthread_freezable_should_stop(bool *was_frozen)
71{
72 bool frozen = false;
73
74 might_sleep();
75
76 if (unlikely(freezing(current)))
77 frozen = __refrigerator(true);
78
79 if (was_frozen)
80 *was_frozen = frozen;
81
82 return kthread_should_stop();
83}
84EXPORT_SYMBOL_GPL(kthread_freezable_should_stop);
85
82805ab7
TH
86/**
87 * kthread_data - return data value specified on kthread creation
88 * @task: kthread task in question
89 *
90 * Return the data value specified when kthread @task was created.
91 * The caller is responsible for ensuring the validity of @task when
92 * calling this function.
93 */
94void *kthread_data(struct task_struct *task)
95{
96 return to_kthread(task)->data;
97}
98
1da177e4
LT
99static int kthread(void *_create)
100{
63706172 101 /* Copy data: it's on kthread's stack */
1da177e4 102 struct kthread_create_info *create = _create;
63706172
ON
103 int (*threadfn)(void *data) = create->threadfn;
104 void *data = create->data;
105 struct kthread self;
106 int ret;
1da177e4 107
63706172 108 self.should_stop = 0;
82805ab7 109 self.data = data;
63706172
ON
110 init_completion(&self.exited);
111 current->vfork_done = &self.exited;
1da177e4 112
1da177e4 113 /* OK, tell user we're spawned, wait for stop or wakeup */
a076e4bc 114 __set_current_state(TASK_UNINTERRUPTIBLE);
3217ab97 115 create->result = current;
cdd140bd 116 complete(&create->done);
1da177e4
LT
117 schedule();
118
63706172
ON
119 ret = -EINTR;
120 if (!self.should_stop)
1da177e4
LT
121 ret = threadfn(data);
122
63706172
ON
123 /* we can't just return, we must preserve "self" on stack */
124 do_exit(ret);
1da177e4
LT
125}
126
207205a2
ED
127/* called from do_fork() to get node information for about to be created task */
128int tsk_fork_get_node(struct task_struct *tsk)
129{
130#ifdef CONFIG_NUMA
131 if (tsk == kthreadd_task)
132 return tsk->pref_node_fork;
133#endif
134 return numa_node_id();
135}
136
73c27992 137static void create_kthread(struct kthread_create_info *create)
1da177e4 138{
1da177e4
LT
139 int pid;
140
207205a2
ED
141#ifdef CONFIG_NUMA
142 current->pref_node_fork = create->node;
143#endif
1da177e4
LT
144 /* We want our own signal handler (we take no signals by default). */
145 pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
cdd140bd 146 if (pid < 0) {
1da177e4 147 create->result = ERR_PTR(pid);
cdd140bd
ON
148 complete(&create->done);
149 }
1da177e4
LT
150}
151
9e37bd30 152/**
207205a2 153 * kthread_create_on_node - create a kthread.
9e37bd30
RD
154 * @threadfn: the function to run until signal_pending(current).
155 * @data: data ptr for @threadfn.
207205a2 156 * @node: memory node number.
9e37bd30
RD
157 * @namefmt: printf-style name for the thread.
158 *
159 * Description: This helper function creates and names a kernel
160 * thread. The thread will be stopped: use wake_up_process() to start
301ba045 161 * it. See also kthread_run().
9e37bd30 162 *
207205a2
ED
163 * If thread is going to be bound on a particular cpu, give its node
164 * in @node, to get NUMA affinity for kthread stack, or else give -1.
9e37bd30 165 * When woken, the thread will run @threadfn() with @data as its
72fd4a35 166 * argument. @threadfn() can either call do_exit() directly if it is a
25985edc 167 * standalone thread for which no one will call kthread_stop(), or
9e37bd30
RD
168 * return when 'kthread_should_stop()' is true (which means
169 * kthread_stop() has been called). The return value should be zero
170 * or a negative error number; it will be passed to kthread_stop().
171 *
172 * Returns a task_struct or ERR_PTR(-ENOMEM).
173 */
207205a2
ED
174struct task_struct *kthread_create_on_node(int (*threadfn)(void *data),
175 void *data,
176 int node,
177 const char namefmt[],
178 ...)
1da177e4
LT
179{
180 struct kthread_create_info create;
1da177e4
LT
181
182 create.threadfn = threadfn;
183 create.data = data;
207205a2 184 create.node = node;
1da177e4 185 init_completion(&create.done);
73c27992
EB
186
187 spin_lock(&kthread_create_lock);
188 list_add_tail(&create.list, &kthread_create_list);
73c27992
EB
189 spin_unlock(&kthread_create_lock);
190
cbd9b67b 191 wake_up_process(kthreadd_task);
73c27992
EB
192 wait_for_completion(&create.done);
193
1da177e4 194 if (!IS_ERR(create.result)) {
c9b5f501 195 static const struct sched_param param = { .sched_priority = 0 };
1da177e4 196 va_list args;
1c99315b 197
1da177e4
LT
198 va_start(args, namefmt);
199 vsnprintf(create.result->comm, sizeof(create.result->comm),
200 namefmt, args);
201 va_end(args);
1c99315b
ON
202 /*
203 * root may have changed our (kthreadd's) priority or CPU mask.
204 * The kernel thread should not inherit these properties.
205 */
206 sched_setscheduler_nocheck(create.result, SCHED_NORMAL, &param);
1c99315b 207 set_cpus_allowed_ptr(create.result, cpu_all_mask);
1da177e4 208 }
1da177e4
LT
209 return create.result;
210}
207205a2 211EXPORT_SYMBOL(kthread_create_on_node);
1da177e4 212
881232b7
PZ
213/**
214 * kthread_bind - bind a just-created kthread to a cpu.
215 * @p: thread created by kthread_create().
216 * @cpu: cpu (might not be online, must be possible) for @k to run on.
217 *
218 * Description: This function is equivalent to set_cpus_allowed(),
219 * except that @cpu doesn't need to be online, and the thread must be
220 * stopped (i.e., just returned from kthread_create()).
221 */
222void kthread_bind(struct task_struct *p, unsigned int cpu)
223{
224 /* Must have done schedule() in kthread() before we set_task_cpu */
225 if (!wait_task_inactive(p, TASK_UNINTERRUPTIBLE)) {
226 WARN_ON(1);
227 return;
228 }
229
1e1b6c51
KM
230 /* It's safe because the task is inactive. */
231 do_set_cpus_allowed(p, cpumask_of(cpu));
881232b7
PZ
232 p->flags |= PF_THREAD_BOUND;
233}
234EXPORT_SYMBOL(kthread_bind);
235
9e37bd30
RD
236/**
237 * kthread_stop - stop a thread created by kthread_create().
238 * @k: thread created by kthread_create().
239 *
240 * Sets kthread_should_stop() for @k to return true, wakes it, and
9ae26027
ON
241 * waits for it to exit. This can also be called after kthread_create()
242 * instead of calling wake_up_process(): the thread will exit without
243 * calling threadfn().
244 *
245 * If threadfn() may call do_exit() itself, the caller must ensure
246 * task_struct can't go away.
9e37bd30
RD
247 *
248 * Returns the result of threadfn(), or %-EINTR if wake_up_process()
249 * was never called.
250 */
1da177e4
LT
251int kthread_stop(struct task_struct *k)
252{
63706172 253 struct kthread *kthread;
1da177e4
LT
254 int ret;
255
0a16b607 256 trace_sched_kthread_stop(k);
63706172 257 get_task_struct(k);
0a16b607 258
63706172
ON
259 kthread = to_kthread(k);
260 barrier(); /* it might have exited */
261 if (k->vfork_done != NULL) {
262 kthread->should_stop = 1;
263 wake_up_process(k);
264 wait_for_completion(&kthread->exited);
265 }
266 ret = k->exit_code;
1da177e4 267
1da177e4 268 put_task_struct(k);
0a16b607
MD
269 trace_sched_kthread_stop_ret(ret);
270
1da177e4
LT
271 return ret;
272}
52e92e57 273EXPORT_SYMBOL(kthread_stop);
1da177e4 274
e804a4a4 275int kthreadd(void *unused)
1da177e4 276{
73c27992 277 struct task_struct *tsk = current;
1da177e4 278
e804a4a4 279 /* Setup a clean context for our children to inherit. */
73c27992 280 set_task_comm(tsk, "kthreadd");
10ab825b 281 ignore_signals(tsk);
1a2142af 282 set_cpus_allowed_ptr(tsk, cpu_all_mask);
5ab116c9 283 set_mems_allowed(node_states[N_HIGH_MEMORY]);
73c27992 284
34b087e4 285 current->flags |= PF_NOFREEZE;
73c27992
EB
286
287 for (;;) {
288 set_current_state(TASK_INTERRUPTIBLE);
289 if (list_empty(&kthread_create_list))
290 schedule();
291 __set_current_state(TASK_RUNNING);
292
293 spin_lock(&kthread_create_lock);
294 while (!list_empty(&kthread_create_list)) {
295 struct kthread_create_info *create;
296
297 create = list_entry(kthread_create_list.next,
298 struct kthread_create_info, list);
299 list_del_init(&create->list);
300 spin_unlock(&kthread_create_lock);
301
302 create_kthread(create);
303
304 spin_lock(&kthread_create_lock);
305 }
306 spin_unlock(&kthread_create_lock);
307 }
308
309 return 0;
310}
b56c0d89 311
4f32e9b1
YZ
312void __init_kthread_worker(struct kthread_worker *worker,
313 const char *name,
314 struct lock_class_key *key)
315{
316 spin_lock_init(&worker->lock);
317 lockdep_set_class_and_name(&worker->lock, key, name);
318 INIT_LIST_HEAD(&worker->work_list);
319 worker->task = NULL;
320}
321EXPORT_SYMBOL_GPL(__init_kthread_worker);
322
b56c0d89
TH
323/**
324 * kthread_worker_fn - kthread function to process kthread_worker
325 * @worker_ptr: pointer to initialized kthread_worker
326 *
327 * This function can be used as @threadfn to kthread_create() or
328 * kthread_run() with @worker_ptr argument pointing to an initialized
329 * kthread_worker. The started kthread will process work_list until
330 * the it is stopped with kthread_stop(). A kthread can also call
331 * this function directly after extra initialization.
332 *
333 * Different kthreads can be used for the same kthread_worker as long
334 * as there's only one kthread attached to it at any given time. A
335 * kthread_worker without an attached kthread simply collects queued
336 * kthread_works.
337 */
338int kthread_worker_fn(void *worker_ptr)
339{
340 struct kthread_worker *worker = worker_ptr;
341 struct kthread_work *work;
342
343 WARN_ON(worker->task);
344 worker->task = current;
345repeat:
346 set_current_state(TASK_INTERRUPTIBLE); /* mb paired w/ kthread_stop */
347
348 if (kthread_should_stop()) {
349 __set_current_state(TASK_RUNNING);
350 spin_lock_irq(&worker->lock);
351 worker->task = NULL;
352 spin_unlock_irq(&worker->lock);
353 return 0;
354 }
355
356 work = NULL;
357 spin_lock_irq(&worker->lock);
358 if (!list_empty(&worker->work_list)) {
359 work = list_first_entry(&worker->work_list,
360 struct kthread_work, node);
361 list_del_init(&work->node);
362 }
363 spin_unlock_irq(&worker->lock);
364
365 if (work) {
366 __set_current_state(TASK_RUNNING);
367 work->func(work);
368 smp_wmb(); /* wmb worker-b0 paired with flush-b1 */
369 work->done_seq = work->queue_seq;
370 smp_mb(); /* mb worker-b1 paired with flush-b0 */
371 if (atomic_read(&work->flushing))
372 wake_up_all(&work->done);
373 } else if (!freezing(current))
374 schedule();
375
376 try_to_freeze();
377 goto repeat;
378}
379EXPORT_SYMBOL_GPL(kthread_worker_fn);
380
9a2e03d8
TH
381/* insert @work before @pos in @worker */
382static void insert_kthread_work(struct kthread_worker *worker,
383 struct kthread_work *work,
384 struct list_head *pos)
385{
386 lockdep_assert_held(&worker->lock);
387
388 list_add_tail(&work->node, pos);
389 work->queue_seq++;
390 if (likely(worker->task))
391 wake_up_process(worker->task);
392}
393
b56c0d89
TH
394/**
395 * queue_kthread_work - queue a kthread_work
396 * @worker: target kthread_worker
397 * @work: kthread_work to queue
398 *
399 * Queue @work to work processor @task for async execution. @task
400 * must have been created with kthread_worker_create(). Returns %true
401 * if @work was successfully queued, %false if it was already pending.
402 */
403bool queue_kthread_work(struct kthread_worker *worker,
404 struct kthread_work *work)
405{
406 bool ret = false;
407 unsigned long flags;
408
409 spin_lock_irqsave(&worker->lock, flags);
410 if (list_empty(&work->node)) {
9a2e03d8 411 insert_kthread_work(worker, work, &worker->work_list);
b56c0d89
TH
412 ret = true;
413 }
414 spin_unlock_irqrestore(&worker->lock, flags);
415 return ret;
416}
417EXPORT_SYMBOL_GPL(queue_kthread_work);
418
9a2e03d8
TH
419struct kthread_flush_work {
420 struct kthread_work work;
421 struct completion done;
422};
423
424static void kthread_flush_work_fn(struct kthread_work *work)
425{
426 struct kthread_flush_work *fwork =
427 container_of(work, struct kthread_flush_work, work);
428 complete(&fwork->done);
429}
430
b56c0d89
TH
431/**
432 * flush_kthread_work - flush a kthread_work
433 * @work: work to flush
434 *
435 * If @work is queued or executing, wait for it to finish execution.
436 */
437void flush_kthread_work(struct kthread_work *work)
438{
439 int seq = work->queue_seq;
440
441 atomic_inc(&work->flushing);
442
443 /*
444 * mb flush-b0 paired with worker-b1, to make sure either
445 * worker sees the above increment or we see done_seq update.
446 */
447 smp_mb__after_atomic_inc();
448
449 /* A - B <= 0 tests whether B is in front of A regardless of overflow */
450 wait_event(work->done, seq - work->done_seq <= 0);
451 atomic_dec(&work->flushing);
452
453 /*
454 * rmb flush-b1 paired with worker-b0, to make sure our caller
455 * sees every change made by work->func().
456 */
457 smp_mb__after_atomic_dec();
458}
459EXPORT_SYMBOL_GPL(flush_kthread_work);
460
b56c0d89
TH
461/**
462 * flush_kthread_worker - flush all current works on a kthread_worker
463 * @worker: worker to flush
464 *
465 * Wait until all currently executing or pending works on @worker are
466 * finished.
467 */
468void flush_kthread_worker(struct kthread_worker *worker)
469{
470 struct kthread_flush_work fwork = {
471 KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
472 COMPLETION_INITIALIZER_ONSTACK(fwork.done),
473 };
474
475 queue_kthread_work(worker, &fwork.work);
476 wait_for_completion(&fwork.done);
477}
478EXPORT_SYMBOL_GPL(flush_kthread_worker);