/* Kernel thread helper functions.
 *   Copyright (C) 2004 IBM Corporation, Rusty Russell.
 *
 * Creation is done via kthreadd, so that we get a clean environment
 * even if we're invoked from userspace (think modprobe, hotplug cpu,
 * etc.).
 */
#include <uapi/linux/sched/types.h>
#include <linux/sched.h>
#include <linux/sched/task.h>
#include <linux/kthread.h>
#include <linux/completion.h>
#include <linux/err.h>
#include <linux/cpuset.h>
#include <linux/unistd.h>
#include <linux/file.h>
#include <linux/export.h>
#include <linux/mutex.h>
#include <linux/slab.h>
#include <linux/freezer.h>
#include <linux/ptrace.h>
#include <linux/uaccess.h>
#include <trace/events/sched.h>

static DEFINE_SPINLOCK(kthread_create_lock);
static LIST_HEAD(kthread_create_list);
struct task_struct *kthreadd_task;

struct kthread_create_info
{
	/* Information passed to kthread() from kthreadd. */
	int (*threadfn)(void *data);
	void *data;
	int node;

	/* Result passed back to kthread_create() from kthreadd. */
	struct task_struct *result;
	struct completion *done;

	struct list_head list;
};

struct kthread {
	unsigned long flags;
	unsigned int cpu;
	void *data;
	struct completion parked;
	struct completion exited;
#ifdef CONFIG_BLK_CGROUP
	struct cgroup_subsys_state *blkcg_css;
#endif
};

enum KTHREAD_BITS {
	KTHREAD_IS_PER_CPU = 0,
	KTHREAD_SHOULD_STOP,
	KTHREAD_SHOULD_PARK,
	KTHREAD_IS_PARKED,
};

static inline void set_kthread_struct(void *kthread)
{
	/*
	 * We abuse ->set_child_tid to avoid the new member and because it
	 * can't be wrongly copied by copy_process(). We also rely on the
	 * fact that the caller can't exec, so PF_KTHREAD can't be cleared.
	 */
	current->set_child_tid = (__force void __user *)kthread;
}

static inline struct kthread *to_kthread(struct task_struct *k)
{
	WARN_ON(!(k->flags & PF_KTHREAD));
	return (__force void *)k->set_child_tid;
}

void free_kthread_struct(struct task_struct *k)
{
	struct kthread *kthread;

	/*
	 * Can be NULL if this kthread was created by kernel_thread()
	 * or if kmalloc() in kthread() failed.
	 */
	kthread = to_kthread(k);
#ifdef CONFIG_BLK_CGROUP
	WARN_ON_ONCE(kthread && kthread->blkcg_css);
#endif
	kfree(kthread);
}

/**
 * kthread_should_stop - should this kthread return now?
 *
 * When someone calls kthread_stop() on your kthread, it will be woken
 * and this will return true.  You should then return, and your return
 * value will be passed through to kthread_stop().
 */
bool kthread_should_stop(void)
{
	return test_bit(KTHREAD_SHOULD_STOP, &to_kthread(current)->flags);
}
EXPORT_SYMBOL(kthread_should_stop);
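
/*
 * Usage sketch (illustrative only, not part of this file): the canonical
 * loop for a thread that honours kthread_stop(); the return value is handed
 * back to kthread_stop(). All names here (my_poll_fn, my_device,
 * poll_hardware) are hypothetical.
 *
 *	static int my_poll_fn(void *arg)
 *	{
 *		struct my_device *dev = arg;
 *
 *		while (!kthread_should_stop()) {
 *			poll_hardware(dev);
 *			schedule_timeout_interruptible(HZ);
 *		}
 *		return 0;
 *	}
 */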

/**
 * kthread_should_park - should this kthread park now?
 *
 * When someone calls kthread_park() on your kthread, it will be woken
 * and this will return true.  You should then do the necessary
 * cleanup and call kthread_parkme().
 *
 * Similar to kthread_should_stop(), but this keeps the thread alive
 * and in a park position.  kthread_unpark() "restarts" the thread and
 * calls the thread function again.
 */
bool kthread_should_park(void)
{
	return test_bit(KTHREAD_SHOULD_PARK, &to_kthread(current)->flags);
}
EXPORT_SYMBOL_GPL(kthread_should_park);
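
/*
 * Usage sketch (illustrative only, not part of this file): a loop that can
 * be both parked and stopped. When the controlling thread calls
 * kthread_park(), the loop falls into kthread_parkme() and sleeps in
 * TASK_PARKED until kthread_unpark() or kthread_stop(). my_percpu_fn and
 * do_one_unit_of_work are hypothetical.
 *
 *	static int my_percpu_fn(void *arg)
 *	{
 *		while (!kthread_should_stop()) {
 *			if (kthread_should_park()) {
 *				kthread_parkme();
 *				continue;
 *			}
 *			do_one_unit_of_work(arg);
 *		}
 *		return 0;
 *	}
 */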

/**
 * kthread_freezable_should_stop - should this freezable kthread return now?
 * @was_frozen: optional out parameter, indicates whether %current was frozen
 *
 * kthread_should_stop() for freezable kthreads, which will enter the
 * refrigerator if necessary.  This function is safe from kthread_stop() /
 * freezer deadlock and freezable kthreads should use this function instead
 * of calling try_to_freeze() directly.
 */
bool kthread_freezable_should_stop(bool *was_frozen)
{
	bool frozen = false;

	might_sleep();

	if (unlikely(freezing(current)))
		frozen = __refrigerator(true);

	if (was_frozen)
		*was_frozen = frozen;

	return kthread_should_stop();
}
EXPORT_SYMBOL_GPL(kthread_freezable_should_stop);
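
/*
 * Usage sketch (illustrative only, not part of this file): a freezable
 * thread that checks kthread_freezable_should_stop() instead of
 * kthread_should_stop(), so it parks safely in the refrigerator across
 * suspend. my_freezable_fn, resync_state and do_background_work are
 * hypothetical.
 *
 *	static int my_freezable_fn(void *arg)
 *	{
 *		bool was_frozen;
 *
 *		set_freezable();
 *		while (!kthread_freezable_should_stop(&was_frozen)) {
 *			if (was_frozen)
 *				resync_state(arg);
 *			do_background_work(arg);
 *		}
 *		return 0;
 *	}
 */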

/**
 * kthread_data - return data value specified on kthread creation
 * @task: kthread task in question
 *
 * Return the data value specified when kthread @task was created.
 * The caller is responsible for ensuring the validity of @task when
 * calling this function.
 */
void *kthread_data(struct task_struct *task)
{
	return to_kthread(task)->data;
}

/**
 * kthread_probe_data - speculative version of kthread_data()
 * @task: possible kthread task in question
 *
 * @task could be a kthread task.  Return the data value specified when it
 * was created if accessible.  If @task isn't a kthread task or its data is
 * inaccessible for any reason, %NULL is returned.  This function requires
 * that @task itself is safe to dereference.
 */
void *kthread_probe_data(struct task_struct *task)
{
	struct kthread *kthread = to_kthread(task);
	void *data = NULL;

	probe_kernel_read(&data, &kthread->data, sizeof(data));
	return data;
}

static void __kthread_parkme(struct kthread *self)
{
	for (;;) {
		set_current_state(TASK_PARKED);
		if (!test_bit(KTHREAD_SHOULD_PARK, &self->flags))
			break;
		if (!test_and_set_bit(KTHREAD_IS_PARKED, &self->flags))
			complete(&self->parked);
		schedule();
	}
	clear_bit(KTHREAD_IS_PARKED, &self->flags);
	__set_current_state(TASK_RUNNING);
}

void kthread_parkme(void)
{
	__kthread_parkme(to_kthread(current));
}
EXPORT_SYMBOL_GPL(kthread_parkme);

static int kthread(void *_create)
{
	/* Copy data: it's on kthread's stack */
	struct kthread_create_info *create = _create;
	int (*threadfn)(void *data) = create->threadfn;
	void *data = create->data;
	struct completion *done;
	struct kthread *self;
	int ret;

	self = kzalloc(sizeof(*self), GFP_KERNEL);
	set_kthread_struct(self);

	/* If user was SIGKILLed, I release the structure. */
	done = xchg(&create->done, NULL);
	if (!done) {
		kfree(create);
		do_exit(-EINTR);
	}

	if (!self) {
		create->result = ERR_PTR(-ENOMEM);
		complete(done);
		do_exit(-ENOMEM);
	}

	self->data = data;
	init_completion(&self->exited);
	init_completion(&self->parked);
	current->vfork_done = &self->exited;

	/* OK, tell user we're spawned, wait for stop or wakeup */
	__set_current_state(TASK_UNINTERRUPTIBLE);
	create->result = current;
	complete(done);
	schedule();

	ret = -EINTR;
	if (!test_bit(KTHREAD_SHOULD_STOP, &self->flags)) {
		cgroup_kthread_ready();
		__kthread_parkme(self);
		ret = threadfn(data);
	}
	do_exit(ret);
}

/* Called from do_fork() to get node information for the task about to be created. */
int tsk_fork_get_node(struct task_struct *tsk)
{
#ifdef CONFIG_NUMA
	if (tsk == kthreadd_task)
		return tsk->pref_node_fork;
#endif
	return NUMA_NO_NODE;
}

static void create_kthread(struct kthread_create_info *create)
{
	int pid;

#ifdef CONFIG_NUMA
	current->pref_node_fork = create->node;
#endif
	/* We want our own signal handler (we take no signals by default). */
	pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
	if (pid < 0) {
		/* If user was SIGKILLed, I release the structure. */
		struct completion *done = xchg(&create->done, NULL);

		if (!done) {
			kfree(create);
			return;
		}
		create->result = ERR_PTR(pid);
		complete(done);
	}
}

static __printf(4, 0)
struct task_struct *__kthread_create_on_node(int (*threadfn)(void *data),
					     void *data, int node,
					     const char namefmt[],
					     va_list args)
{
	DECLARE_COMPLETION_ONSTACK(done);
	struct task_struct *task;
	struct kthread_create_info *create = kmalloc(sizeof(*create),
						     GFP_KERNEL);

	if (!create)
		return ERR_PTR(-ENOMEM);
	create->threadfn = threadfn;
	create->data = data;
	create->node = node;
	create->done = &done;

	spin_lock(&kthread_create_lock);
	list_add_tail(&create->list, &kthread_create_list);
	spin_unlock(&kthread_create_lock);

	wake_up_process(kthreadd_task);
	/*
	 * Wait for completion in killable state, for I might be chosen by
	 * the OOM killer while kthreadd is trying to allocate memory for
	 * new kernel thread.
	 */
	if (unlikely(wait_for_completion_killable(&done))) {
		/*
		 * If I was SIGKILLed before kthreadd (or new kernel thread)
		 * calls complete(), leave the cleanup of this structure to
		 * that thread.
		 */
		if (xchg(&create->done, NULL))
			return ERR_PTR(-EINTR);
		/*
		 * kthreadd (or new kernel thread) will call complete()
		 * shortly.
		 */
		wait_for_completion(&done);
	}
	task = create->result;
	if (!IS_ERR(task)) {
		static const struct sched_param param = { .sched_priority = 0 };

		vsnprintf(task->comm, sizeof(task->comm), namefmt, args);
		/*
		 * root may have changed our (kthreadd's) priority or CPU mask.
		 * The kernel thread should not inherit these properties.
		 */
		sched_setscheduler_nocheck(task, SCHED_NORMAL, &param);
		set_cpus_allowed_ptr(task, cpu_all_mask);
	}
	kfree(create);
	return task;
}

/**
 * kthread_create_on_node - create a kthread.
 * @threadfn: the function to run until signal_pending(current).
 * @data: data ptr for @threadfn.
 * @node: task and thread structures for the thread are allocated on this node
 * @namefmt: printf-style name for the thread.
 *
 * Description: This helper function creates and names a kernel
 * thread.  The thread will be stopped: use wake_up_process() to start
 * it.  See also kthread_run().  The new thread has SCHED_NORMAL policy and
 * is affine to all CPUs.
 *
 * If the thread is going to be bound to a particular cpu, give its node
 * in @node, to get NUMA affinity for the kthread stack, or else give
 * NUMA_NO_NODE.  When woken, the thread will run @threadfn() with @data as
 * its argument.  @threadfn() can either call do_exit() directly if it is a
 * standalone thread for which no one will call kthread_stop(), or
 * return when 'kthread_should_stop()' is true (which means
 * kthread_stop() has been called).  The return value should be zero
 * or a negative error number; it will be passed to kthread_stop().
 *
 * Returns a task_struct or ERR_PTR(-ENOMEM) or ERR_PTR(-EINTR).
 */
struct task_struct *kthread_create_on_node(int (*threadfn)(void *data),
					   void *data, int node,
					   const char namefmt[],
					   ...)
{
	struct task_struct *task;
	va_list args;

	va_start(args, namefmt);
	task = __kthread_create_on_node(threadfn, data, node, namefmt, args);
	va_end(args);

	return task;
}
EXPORT_SYMBOL(kthread_create_on_node);
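
/*
 * Usage sketch (illustrative only, not part of this file): creating, naming
 * and starting a thread; kthread_run() in <linux/kthread.h> wraps exactly
 * this create-then-wake sequence. my_fn, my_data and id are hypothetical.
 *
 *	struct task_struct *tsk;
 *
 *	tsk = kthread_create_on_node(my_fn, my_data, NUMA_NO_NODE,
 *				     "myd/%d", id);
 *	if (IS_ERR(tsk))
 *		return PTR_ERR(tsk);
 *	wake_up_process(tsk);
 */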

static void __kthread_bind_mask(struct task_struct *p, const struct cpumask *mask, long state)
{
	unsigned long flags;

	if (!wait_task_inactive(p, state)) {
		WARN_ON(1);
		return;
	}

	/* It's safe because the task is inactive. */
	raw_spin_lock_irqsave(&p->pi_lock, flags);
	do_set_cpus_allowed(p, mask);
	p->flags |= PF_NO_SETAFFINITY;
	raw_spin_unlock_irqrestore(&p->pi_lock, flags);
}

static void __kthread_bind(struct task_struct *p, unsigned int cpu, long state)
{
	__kthread_bind_mask(p, cpumask_of(cpu), state);
}

void kthread_bind_mask(struct task_struct *p, const struct cpumask *mask)
{
	__kthread_bind_mask(p, mask, TASK_UNINTERRUPTIBLE);
}

/**
 * kthread_bind - bind a just-created kthread to a cpu.
 * @p: thread created by kthread_create().
 * @cpu: cpu (might not be online, must be possible) for @p to run on.
 *
 * Description: This function is equivalent to set_cpus_allowed(),
 * except that @cpu doesn't need to be online, and the thread must be
 * stopped (i.e., just returned from kthread_create()).
 */
void kthread_bind(struct task_struct *p, unsigned int cpu)
{
	__kthread_bind(p, cpu, TASK_UNINTERRUPTIBLE);
}
EXPORT_SYMBOL(kthread_bind);
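
/*
 * Usage sketch (illustrative only, not part of this file): binding a
 * just-created, still-stopped thread to one CPU before its first wakeup.
 * my_fn and my_data are hypothetical.
 *
 *	tsk = kthread_create(my_fn, my_data, "myd/%u", cpu);
 *	if (!IS_ERR(tsk)) {
 *		kthread_bind(tsk, cpu);
 *		wake_up_process(tsk);
 *	}
 */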

/**
 * kthread_create_on_cpu - Create a cpu bound kthread
 * @threadfn: the function to run until signal_pending(current).
 * @data: data ptr for @threadfn.
 * @cpu: The cpu on which the thread should be bound.
 * @namefmt: printf-style name for the thread.  Format is restricted
 *	     to "name.*%u".  Code fills in cpu number.
 *
 * Description: This helper function creates and names a kernel thread.
 * The thread will be woken and put into park mode.
 */
struct task_struct *kthread_create_on_cpu(int (*threadfn)(void *data),
					  void *data, unsigned int cpu,
					  const char *namefmt)
{
	struct task_struct *p;

	p = kthread_create_on_node(threadfn, data, cpu_to_node(cpu), namefmt,
				   cpu);
	if (IS_ERR(p))
		return p;
	kthread_bind(p, cpu);
	/* CPU hotplug needs to bind once again when unparking the thread. */
	set_bit(KTHREAD_IS_PER_CPU, &to_kthread(p)->flags);
	to_kthread(p)->cpu = cpu;
	return p;
}

/**
 * kthread_unpark - unpark a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_park() for @k to return false, wakes it, and
 * waits for it to return.  If the thread is marked percpu then it's
 * bound to the cpu again.
 */
void kthread_unpark(struct task_struct *k)
{
	struct kthread *kthread = to_kthread(k);

	clear_bit(KTHREAD_SHOULD_PARK, &kthread->flags);
	/*
	 * We clear the IS_PARKED bit here as we don't wait
	 * until the task has left the park code.  So if we'd
	 * park before that happens we'd see the IS_PARKED bit
	 * which might be about to be cleared.
	 */
	if (test_and_clear_bit(KTHREAD_IS_PARKED, &kthread->flags)) {
		/*
		 * Newly created kthread was parked when the CPU was offline.
		 * The binding was lost and we need to set it again.
		 */
		if (test_bit(KTHREAD_IS_PER_CPU, &kthread->flags))
			__kthread_bind(k, kthread->cpu, TASK_PARKED);
		wake_up_state(k, TASK_PARKED);
	}
}
EXPORT_SYMBOL_GPL(kthread_unpark);

/**
 * kthread_park - park a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_park() for @k to return true, wakes it, and
 * waits for it to return.  This can also be called after kthread_create()
 * instead of calling wake_up_process(): the thread will park without
 * calling threadfn().
 *
 * Returns 0 if the thread is parked, -ENOSYS if the thread exited.
 * If called by the kthread itself just the park bit is set.
 */
int kthread_park(struct task_struct *k)
{
	struct kthread *kthread = to_kthread(k);

	if (WARN_ON(k->flags & PF_EXITING))
		return -ENOSYS;

	if (!test_bit(KTHREAD_IS_PARKED, &kthread->flags)) {
		set_bit(KTHREAD_SHOULD_PARK, &kthread->flags);
		if (k != current) {
			wake_up_process(k);
			wait_for_completion(&kthread->parked);
		}
	}

	return 0;
}
EXPORT_SYMBOL_GPL(kthread_park);
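
/*
 * Usage sketch (illustrative only, not part of this file): a controller
 * quiescing a per-cpu thread across CPU hotplug, in the style of the
 * smpboot threads. percpu_tsk is hypothetical.
 *
 *	// CPU going down: the thread waits in TASK_PARKED
 *	ret = kthread_park(percpu_tsk);
 *
 *	// CPU back up: rebind (if per-cpu) and resume threadfn()
 *	kthread_unpark(percpu_tsk);
 */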

/**
 * kthread_stop - stop a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_stop() for @k to return true, wakes it, and
 * waits for it to exit.  This can also be called after kthread_create()
 * instead of calling wake_up_process(): the thread will exit without
 * calling threadfn().
 *
 * If threadfn() may call do_exit() itself, the caller must ensure
 * task_struct can't go away.
 *
 * Returns the result of threadfn(), or %-EINTR if wake_up_process()
 * was never called.
 */
int kthread_stop(struct task_struct *k)
{
	struct kthread *kthread;
	int ret;

	trace_sched_kthread_stop(k);

	get_task_struct(k);
	kthread = to_kthread(k);
	set_bit(KTHREAD_SHOULD_STOP, &kthread->flags);
	kthread_unpark(k);
	wake_up_process(k);
	wait_for_completion(&kthread->exited);
	ret = k->exit_code;
	put_task_struct(k);

	trace_sched_kthread_stop_ret(ret);
	return ret;
}
EXPORT_SYMBOL(kthread_stop);
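
/*
 * Usage sketch (illustrative only, not part of this file): tearing down a
 * thread and collecting its return value. kthread_stop() pins the
 * task_struct internally, but the caller must still hold a valid reference
 * going in. my_tsk is hypothetical.
 *
 *	int err = kthread_stop(my_tsk);
 *	if (err && err != -EINTR)
 *		pr_warn("worker exited with %d\n", err);
 */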

int kthreadd(void *unused)
{
	struct task_struct *tsk = current;

	/* Setup a clean context for our children to inherit. */
	set_task_comm(tsk, "kthreadd");
	ignore_signals(tsk);
	set_cpus_allowed_ptr(tsk, cpu_all_mask);
	set_mems_allowed(node_states[N_MEMORY]);

	current->flags |= PF_NOFREEZE;
	cgroup_init_kthreadd();

	for (;;) {
		set_current_state(TASK_INTERRUPTIBLE);
		if (list_empty(&kthread_create_list))
			schedule();
		__set_current_state(TASK_RUNNING);

		spin_lock(&kthread_create_lock);
		while (!list_empty(&kthread_create_list)) {
			struct kthread_create_info *create;

			create = list_entry(kthread_create_list.next,
					    struct kthread_create_info, list);
			list_del_init(&create->list);
			spin_unlock(&kthread_create_lock);

			create_kthread(create);

			spin_lock(&kthread_create_lock);
		}
		spin_unlock(&kthread_create_lock);
	}

	return 0;
}

void __kthread_init_worker(struct kthread_worker *worker,
			   const char *name,
			   struct lock_class_key *key)
{
	memset(worker, 0, sizeof(struct kthread_worker));
	spin_lock_init(&worker->lock);
	lockdep_set_class_and_name(&worker->lock, key, name);
	INIT_LIST_HEAD(&worker->work_list);
	INIT_LIST_HEAD(&worker->delayed_work_list);
}
EXPORT_SYMBOL_GPL(__kthread_init_worker);

/**
 * kthread_worker_fn - kthread function to process kthread_worker
 * @worker_ptr: pointer to initialized kthread_worker
 *
 * This function implements the main cycle of the kthread worker.  It
 * processes work_list until it is stopped with kthread_stop().  It sleeps
 * when the queue is empty.
 *
 * The works are not allowed to keep any locks, disable preemption or
 * interrupts when they finish.  There is a defined safe point for freezing
 * when one work finishes and before a new one is started.
 *
 * Also the works must not be handled by more than one worker at the same
 * time, see also kthread_queue_work().
 */
int kthread_worker_fn(void *worker_ptr)
{
	struct kthread_worker *worker = worker_ptr;
	struct kthread_work *work;

	/*
	 * FIXME: Update the check and remove the assignment when all kthread
	 * worker users are created using kthread_create_worker*() functions.
	 */
	WARN_ON(worker->task && worker->task != current);
	worker->task = current;

	if (worker->flags & KTW_FREEZABLE)
		set_freezable();

repeat:
	set_current_state(TASK_INTERRUPTIBLE);	/* mb paired w/ kthread_stop */

	if (kthread_should_stop()) {
		__set_current_state(TASK_RUNNING);
		spin_lock_irq(&worker->lock);
		worker->task = NULL;
		spin_unlock_irq(&worker->lock);
		return 0;
	}

	work = NULL;
	spin_lock_irq(&worker->lock);
	if (!list_empty(&worker->work_list)) {
		work = list_first_entry(&worker->work_list,
					struct kthread_work, node);
		list_del_init(&work->node);
	}
	worker->current_work = work;
	spin_unlock_irq(&worker->lock);

	if (work) {
		__set_current_state(TASK_RUNNING);
		work->func(work);
	} else if (!freezing(current))
		schedule();

	try_to_freeze();
	cond_resched();
	goto repeat;
}
EXPORT_SYMBOL_GPL(kthread_worker_fn);
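
/*
 * Usage sketch (illustrative only, not part of this file): the legacy
 * pattern the FIXME above refers to, where the caller owns the worker
 * structure and runs kthread_worker_fn() on a thread it created itself.
 * my_worker and task are hypothetical names.
 *
 *	static struct kthread_worker my_worker;
 *
 *	kthread_init_worker(&my_worker);
 *	task = kthread_run(kthread_worker_fn, &my_worker, "my_worker");
 *	if (IS_ERR(task))
 *		return PTR_ERR(task);
 */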

static __printf(3, 0) struct kthread_worker *
__kthread_create_worker(int cpu, unsigned int flags,
			const char namefmt[], va_list args)
{
	struct kthread_worker *worker;
	struct task_struct *task;
	int node = -1;

	worker = kzalloc(sizeof(*worker), GFP_KERNEL);
	if (!worker)
		return ERR_PTR(-ENOMEM);

	kthread_init_worker(worker);

	if (cpu >= 0)
		node = cpu_to_node(cpu);

	task = __kthread_create_on_node(kthread_worker_fn, worker,
					node, namefmt, args);
	if (IS_ERR(task))
		goto fail_task;

	if (cpu >= 0)
		kthread_bind(task, cpu);

	worker->flags = flags;
	worker->task = task;
	wake_up_process(task);
	return worker;

fail_task:
	kfree(worker);
	return ERR_CAST(task);
}

/**
 * kthread_create_worker - create a kthread worker
 * @flags: flags modifying the default behavior of the worker
 * @namefmt: printf-style name for the kthread worker (task).
 *
 * Returns a pointer to the allocated worker on success, ERR_PTR(-ENOMEM)
 * when the needed structures could not get allocated, and ERR_PTR(-EINTR)
 * when the worker was SIGKILLed.
 */
struct kthread_worker *
kthread_create_worker(unsigned int flags, const char namefmt[], ...)
{
	struct kthread_worker *worker;
	va_list args;

	va_start(args, namefmt);
	worker = __kthread_create_worker(-1, flags, namefmt, args);
	va_end(args);

	return worker;
}
EXPORT_SYMBOL(kthread_create_worker);
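
/*
 * Usage sketch (illustrative only, not part of this file): creating a
 * worker and queueing a work item on it. my_work_fn and my_work are
 * hypothetical.
 *
 *	static void my_work_fn(struct kthread_work *work)
 *	{
 *		// runs in the worker thread's context
 *	}
 *
 *	static DEFINE_KTHREAD_WORK(my_work, my_work_fn);
 *	struct kthread_worker *w;
 *
 *	w = kthread_create_worker(0, "my_worker");
 *	if (IS_ERR(w))
 *		return PTR_ERR(w);
 *	kthread_queue_work(w, &my_work);
 */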

/**
 * kthread_create_worker_on_cpu - create a kthread worker and bind it
 *	to a given CPU and the associated NUMA node.
 * @cpu: CPU number
 * @flags: flags modifying the default behavior of the worker
 * @namefmt: printf-style name for the kthread worker (task).
 *
 * Use a valid CPU number if you want to bind the kthread worker
 * to the given CPU and the associated NUMA node.
 *
 * A good practice is to add the cpu number also into the worker name.
 * For example, use kthread_create_worker_on_cpu(cpu, "helper/%d", cpu).
 *
 * Returns a pointer to the allocated worker on success, ERR_PTR(-ENOMEM)
 * when the needed structures could not get allocated, and ERR_PTR(-EINTR)
 * when the worker was SIGKILLed.
 */
struct kthread_worker *
kthread_create_worker_on_cpu(int cpu, unsigned int flags,
			     const char namefmt[], ...)
{
	struct kthread_worker *worker;
	va_list args;

	va_start(args, namefmt);
	worker = __kthread_create_worker(cpu, flags, namefmt, args);
	va_end(args);

	return worker;
}
EXPORT_SYMBOL(kthread_create_worker_on_cpu);

/*
 * Returns true when the work could not be queued at the moment.
 * It happens when it is already pending in a worker list
 * or when it is being cancelled.
 */
static inline bool queuing_blocked(struct kthread_worker *worker,
				   struct kthread_work *work)
{
	lockdep_assert_held(&worker->lock);

	return !list_empty(&work->node) || work->canceling;
}

static void kthread_insert_work_sanity_check(struct kthread_worker *worker,
					     struct kthread_work *work)
{
	lockdep_assert_held(&worker->lock);
	WARN_ON_ONCE(!list_empty(&work->node));
	/* Do not use a work with >1 worker, see kthread_queue_work() */
	WARN_ON_ONCE(work->worker && work->worker != worker);
}

/* insert @work before @pos in @worker */
static void kthread_insert_work(struct kthread_worker *worker,
				struct kthread_work *work,
				struct list_head *pos)
{
	kthread_insert_work_sanity_check(worker, work);

	list_add_tail(&work->node, pos);
	work->worker = worker;
	if (!worker->current_work && likely(worker->task))
		wake_up_process(worker->task);
}

/**
 * kthread_queue_work - queue a kthread_work
 * @worker: target kthread_worker
 * @work: kthread_work to queue
 *
 * Queue @work to work processor @worker for async execution.  @worker
 * must have been created with kthread_create_worker().  Returns %true
 * if @work was successfully queued, %false if it was already pending.
 *
 * Reinitialize the work if it needs to be used by another worker.
 * For example, when the worker was stopped and started again.
 */
bool kthread_queue_work(struct kthread_worker *worker,
			struct kthread_work *work)
{
	bool ret = false;
	unsigned long flags;

	spin_lock_irqsave(&worker->lock, flags);
	if (!queuing_blocked(worker, work)) {
		kthread_insert_work(worker, work, &worker->work_list);
		ret = true;
	}
	spin_unlock_irqrestore(&worker->lock, flags);
	return ret;
}
EXPORT_SYMBOL_GPL(kthread_queue_work);

/**
 * kthread_delayed_work_timer_fn - callback that queues the associated kthread
 *	delayed work when the timer expires.
 * @t: pointer to the expired timer
 *
 * The format of the function is defined by struct timer_list.
 * It should have been called from an irqsafe timer with irqs already off.
 */
void kthread_delayed_work_timer_fn(struct timer_list *t)
{
	struct kthread_delayed_work *dwork = from_timer(dwork, t, timer);
	struct kthread_work *work = &dwork->work;
	struct kthread_worker *worker = work->worker;

	/*
	 * This might happen when a pending work is reinitialized.
	 * It means that it is used in a wrong way.
	 */
	if (WARN_ON_ONCE(!worker))
		return;

	spin_lock(&worker->lock);
	/* Work must not be used with >1 worker, see kthread_queue_work(). */
	WARN_ON_ONCE(work->worker != worker);

	/* Move the work from worker->delayed_work_list. */
	WARN_ON_ONCE(list_empty(&work->node));
	list_del_init(&work->node);
	kthread_insert_work(worker, work, &worker->work_list);

	spin_unlock(&worker->lock);
}
EXPORT_SYMBOL(kthread_delayed_work_timer_fn);

void __kthread_queue_delayed_work(struct kthread_worker *worker,
				  struct kthread_delayed_work *dwork,
				  unsigned long delay)
{
	struct timer_list *timer = &dwork->timer;
	struct kthread_work *work = &dwork->work;

	WARN_ON_ONCE(timer->function != kthread_delayed_work_timer_fn);

	/*
	 * If @delay is 0, queue @dwork->work immediately.  This is for
	 * both optimization and correctness.  The earliest @timer can
	 * expire is on the closest next tick and delayed_work users depend
	 * on that there's no such delay when @delay is 0.
	 */
	if (!delay) {
		kthread_insert_work(worker, work, &worker->work_list);
		return;
	}

	/* Be paranoid and try to detect possible races already now. */
	kthread_insert_work_sanity_check(worker, work);

	list_add(&work->node, &worker->delayed_work_list);
	work->worker = worker;
	timer->expires = jiffies + delay;
	add_timer(timer);
}

/**
 * kthread_queue_delayed_work - queue the associated kthread work
 *	after a delay.
 * @worker: target kthread_worker
 * @dwork: kthread_delayed_work to queue
 * @delay: number of jiffies to wait before queuing
 *
 * If the work has not been pending it starts a timer that will queue
 * the work after the given @delay.  If @delay is zero, it queues the
 * work immediately.
 *
 * Return: %false if the @work has already been pending.  It means that
 * either the timer was running or the work was queued.  It returns %true
 * otherwise.
 */
bool kthread_queue_delayed_work(struct kthread_worker *worker,
				struct kthread_delayed_work *dwork,
				unsigned long delay)
{
	struct kthread_work *work = &dwork->work;
	unsigned long flags;
	bool ret = false;

	spin_lock_irqsave(&worker->lock, flags);

	if (!queuing_blocked(worker, work)) {
		__kthread_queue_delayed_work(worker, dwork, delay);
		ret = true;
	}

	spin_unlock_irqrestore(&worker->lock, flags);
	return ret;
}
EXPORT_SYMBOL_GPL(kthread_queue_delayed_work);
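
/*
 * Usage sketch (illustrative only, not part of this file): arming a delayed
 * work that fires on worker @w one second from now. w, my_dwork_fn and
 * my_dwork are hypothetical.
 *
 *	static void my_dwork_fn(struct kthread_work *work)
 *	{
 *		// runs in the worker thread after the delay
 *	}
 *
 *	static DEFINE_KTHREAD_DELAYED_WORK(my_dwork, my_dwork_fn);
 *
 *	kthread_queue_delayed_work(w, &my_dwork, HZ);
 */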

struct kthread_flush_work {
	struct kthread_work	work;
	struct completion	done;
};

static void kthread_flush_work_fn(struct kthread_work *work)
{
	struct kthread_flush_work *fwork =
		container_of(work, struct kthread_flush_work, work);
	complete(&fwork->done);
}

/**
 * kthread_flush_work - flush a kthread_work
 * @work: work to flush
 *
 * If @work is queued or executing, wait for it to finish execution.
 */
void kthread_flush_work(struct kthread_work *work)
{
	struct kthread_flush_work fwork = {
		KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
		COMPLETION_INITIALIZER_ONSTACK(fwork.done),
	};
	struct kthread_worker *worker;
	bool noop = false;

	worker = work->worker;
	if (!worker)
		return;

	spin_lock_irq(&worker->lock);
	/* Work must not be used with >1 worker, see kthread_queue_work(). */
	WARN_ON_ONCE(work->worker != worker);

	if (!list_empty(&work->node))
		kthread_insert_work(worker, &fwork.work, work->node.next);
	else if (worker->current_work == work)
		kthread_insert_work(worker, &fwork.work,
				    worker->work_list.next);
	else
		noop = true;

	spin_unlock_irq(&worker->lock);

	if (!noop)
		wait_for_completion(&fwork.done);
}
EXPORT_SYMBOL_GPL(kthread_flush_work);

/*
 * This function removes the work from the worker queue.  Also it makes sure
 * that it won't get queued later via the delayed work's timer.
 *
 * The work might still be in use when this function finishes.  See the
 * current_work processed by the worker.
 *
 * Return: %true if @work was pending and successfully canceled,
 *	%false if @work was not pending
 */
static bool __kthread_cancel_work(struct kthread_work *work, bool is_dwork,
				  unsigned long *flags)
{
	/* Try to cancel the timer if it exists. */
	if (is_dwork) {
		struct kthread_delayed_work *dwork =
			container_of(work, struct kthread_delayed_work, work);
		struct kthread_worker *worker = work->worker;

		/*
		 * del_timer_sync() must be called to make sure that the timer
		 * callback is not running.  The lock must be temporarily
		 * released to avoid a deadlock with the callback.  In the
		 * meantime, any queuing is blocked by setting the canceling
		 * counter.
		 */
		work->canceling++;
		spin_unlock_irqrestore(&worker->lock, *flags);
		del_timer_sync(&dwork->timer);
		spin_lock_irqsave(&worker->lock, *flags);
		work->canceling--;
	}

	/*
	 * Try to remove the work from a worker list.  It might either
	 * be from worker->work_list or from worker->delayed_work_list.
	 */
	if (!list_empty(&work->node)) {
		list_del_init(&work->node);
		return true;
	}

	return false;
}

/**
 * kthread_mod_delayed_work - modify delay of or queue a kthread delayed work
 * @worker: kthread worker to use
 * @dwork: kthread delayed work to queue
 * @delay: number of jiffies to wait before queuing
 *
 * If @dwork is idle, equivalent to kthread_queue_delayed_work().  Otherwise,
 * modify @dwork's timer so that it expires after @delay.  If @delay is zero,
 * @work is guaranteed to be queued immediately.
 *
 * Return: %true if @dwork was pending and its timer was modified,
 * %false otherwise.
 *
 * A special case is when the work is being canceled in parallel.
 * It might be caused either by the real kthread_cancel_delayed_work_sync()
 * or yet another kthread_mod_delayed_work() call.  We let the other command
 * win and return %false here.  The caller is supposed to synchronize these
 * operations in a reasonable way.
 *
 * This function is safe to call from any context including IRQ handler.
 * See __kthread_cancel_work() and kthread_delayed_work_timer_fn()
 * for details.
 */
bool kthread_mod_delayed_work(struct kthread_worker *worker,
			      struct kthread_delayed_work *dwork,
			      unsigned long delay)
{
	struct kthread_work *work = &dwork->work;
	unsigned long flags;
	int ret = false;

	spin_lock_irqsave(&worker->lock, flags);

	/* Do not bother with canceling when never queued. */
	if (!work->worker)
		goto fast_queue;

	/* Work must not be used with >1 worker, see kthread_queue_work() */
	WARN_ON_ONCE(work->worker != worker);

	/* Do not fight with another command that is canceling this work. */
	if (work->canceling)
		goto out;

	ret = __kthread_cancel_work(work, true, &flags);
fast_queue:
	__kthread_queue_delayed_work(worker, dwork, delay);
out:
	spin_unlock_irqrestore(&worker->lock, flags);
	return ret;
}
EXPORT_SYMBOL_GPL(kthread_mod_delayed_work);
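
/*
 * Usage sketch (illustrative only, not part of this file): a debounce
 * pattern, where every event pushes the deadline back instead of queueing a
 * second instance; per the comment above, this is safe even from an IRQ
 * handler. w and my_dwork are hypothetical.
 *
 *	// called on every incoming event, possibly from an IRQ handler
 *	kthread_mod_delayed_work(w, &my_dwork, msecs_to_jiffies(50));
 */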

static bool __kthread_cancel_work_sync(struct kthread_work *work, bool is_dwork)
{
	struct kthread_worker *worker = work->worker;
	unsigned long flags;
	int ret = false;

	if (!worker)
		goto out;

	spin_lock_irqsave(&worker->lock, flags);
	/* Work must not be used with >1 worker, see kthread_queue_work(). */
	WARN_ON_ONCE(work->worker != worker);

	ret = __kthread_cancel_work(work, is_dwork, &flags);

	if (worker->current_work != work)
		goto out_fast;

	/*
	 * The work is in progress and we need to wait with the lock released.
	 * In the meantime, block any queuing by setting the canceling counter.
	 */
	work->canceling++;
	spin_unlock_irqrestore(&worker->lock, flags);
	kthread_flush_work(work);
	spin_lock_irqsave(&worker->lock, flags);
	work->canceling--;

out_fast:
	spin_unlock_irqrestore(&worker->lock, flags);
out:
	return ret;
}

/**
 * kthread_cancel_work_sync - cancel a kthread work and wait for it to finish
 * @work: the kthread work to cancel
 *
 * Cancel @work and wait for its execution to finish.  This function
 * can be used even if the work re-queues itself.  On return from this
 * function, @work is guaranteed to be not pending or executing on any CPU.
 *
 * kthread_cancel_work_sync(&delayed_work->work) must not be used for
 * delayed_work's.  Use kthread_cancel_delayed_work_sync() instead.
 *
 * The caller must ensure that the worker on which @work was last
 * queued can't be destroyed before this function returns.
 *
 * Return: %true if @work was pending, %false otherwise.
 */
bool kthread_cancel_work_sync(struct kthread_work *work)
{
	return __kthread_cancel_work_sync(work, false);
}
EXPORT_SYMBOL_GPL(kthread_cancel_work_sync);

/**
 * kthread_cancel_delayed_work_sync - cancel a kthread delayed work and
 *	wait for it to finish.
 * @dwork: the kthread delayed work to cancel
 *
 * This is kthread_cancel_work_sync() for delayed works.
 *
 * Return: %true if @dwork was pending, %false otherwise.
 */
bool kthread_cancel_delayed_work_sync(struct kthread_delayed_work *dwork)
{
	return __kthread_cancel_work_sync(&dwork->work, true);
}
EXPORT_SYMBOL_GPL(kthread_cancel_delayed_work_sync);

/**
 * kthread_flush_worker - flush all current works on a kthread_worker
 * @worker: worker to flush
 *
 * Wait until all currently executing or pending works on @worker are
 * finished.
 */
void kthread_flush_worker(struct kthread_worker *worker)
{
	struct kthread_flush_work fwork = {
		KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
		COMPLETION_INITIALIZER_ONSTACK(fwork.done),
	};

	kthread_queue_work(worker, &fwork.work);
	wait_for_completion(&fwork.done);
}
EXPORT_SYMBOL_GPL(kthread_flush_worker);

/**
 * kthread_destroy_worker - destroy a kthread worker
 * @worker: worker to be destroyed
 *
 * Flush and destroy @worker.  The simple flush is enough because the kthread
 * worker API is used only in trivial scenarios.  There are no multi-step
 * state machines needed.
 */
void kthread_destroy_worker(struct kthread_worker *worker)
{
	struct task_struct *task;

	task = worker->task;
	if (WARN_ON(!task))
		return;

	kthread_flush_worker(worker);
	kthread_stop(task);
	WARN_ON(!list_empty(&worker->work_list));
	kfree(worker);
}
EXPORT_SYMBOL(kthread_destroy_worker);
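
/*
 * Usage sketch (illustrative only, not part of this file): module-exit
 * teardown. Pending delayed works should be canceled first, since
 * kthread_destroy_worker() only flushes what is already queued. w and
 * my_dwork are hypothetical.
 *
 *	kthread_cancel_delayed_work_sync(&my_dwork);
 *	kthread_destroy_worker(w);
 */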

#ifdef CONFIG_BLK_CGROUP
/**
 * kthread_associate_blkcg - associate blkcg to current kthread
 * @css: the cgroup info
 *
 * Current thread must be a kthread.  The thread is running jobs on behalf
 * of other threads.  In some cases, we expect the jobs to attach the cgroup
 * info of the original threads instead of that of the current thread.  This
 * function stores the original thread's cgroup info in the current kthread
 * context for later retrieval.
 */
void kthread_associate_blkcg(struct cgroup_subsys_state *css)
{
	struct kthread *kthread;

	if (!(current->flags & PF_KTHREAD))
		return;
	kthread = to_kthread(current);
	if (!kthread)
		return;

	if (kthread->blkcg_css) {
		css_put(kthread->blkcg_css);
		kthread->blkcg_css = NULL;
	}
	if (css) {
		css_get(css);
		kthread->blkcg_css = css;
	}
}
EXPORT_SYMBOL(kthread_associate_blkcg);
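
/*
 * Usage sketch (illustrative only, not part of this file): a loop-device
 * style kthread doing I/O on behalf of a user task, adopting that task's
 * blkcg for the duration of one request. bio and submitter_css are
 * hypothetical.
 *
 *	kthread_associate_blkcg(submitter_css);
 *	submit_bio(bio);
 *	kthread_associate_blkcg(NULL);
 */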

/**
 * kthread_blkcg - get associated blkcg css of current kthread
 *
 * Current thread must be a kthread.
 */
struct cgroup_subsys_state *kthread_blkcg(void)
{
	struct kthread *kthread;

	if (current->flags & PF_KTHREAD) {
		kthread = to_kthread(current);
		if (kthread)
			return kthread->blkcg_css;
	}
	return NULL;
}
EXPORT_SYMBOL(kthread_blkcg);
#endif