/* Kernel thread helper functions.
 *   Copyright (C) 2004 IBM Corporation, Rusty Russell.
 *
 * Creation is done via kthreadd, so that we get a clean environment
 * even if we're invoked from userspace (think modprobe, hotplug cpu,
 * etc.).
 */
#include <uapi/linux/sched/types.h>
#include <linux/sched.h>
#include <linux/kthread.h>
#include <linux/completion.h>
#include <linux/err.h>
#include <linux/cpuset.h>
#include <linux/unistd.h>
#include <linux/file.h>
#include <linux/export.h>
#include <linux/mutex.h>
#include <linux/slab.h>
#include <linux/freezer.h>
#include <linux/ptrace.h>
#include <linux/uaccess.h>
#include <trace/events/sched.h>

static DEFINE_SPINLOCK(kthread_create_lock);
static LIST_HEAD(kthread_create_list);
struct task_struct *kthreadd_task;

struct kthread_create_info
{
	/* Information passed to kthread() from kthreadd. */
	int (*threadfn)(void *data);
	void *data;
	int node;

	/* Result passed back to kthread_create() from kthreadd. */
	struct task_struct *result;
	struct completion *done;

	struct list_head list;
};

struct kthread {
	unsigned long flags;
	unsigned int cpu;
	void *data;
	struct completion parked;
	struct completion exited;
};

enum KTHREAD_BITS {
	KTHREAD_IS_PER_CPU = 0,
	KTHREAD_SHOULD_STOP,
	KTHREAD_SHOULD_PARK,
	KTHREAD_IS_PARKED,
};

static inline void set_kthread_struct(void *kthread)
{
	/*
	 * We abuse ->set_child_tid to avoid the new member and because it
	 * can't be wrongly copied by copy_process(). We also rely on the
	 * fact that the caller can't exec, so PF_KTHREAD can't be cleared.
	 */
	current->set_child_tid = (__force void __user *)kthread;
}

static inline struct kthread *to_kthread(struct task_struct *k)
{
	WARN_ON(!(k->flags & PF_KTHREAD));
	return (__force void *)k->set_child_tid;
}

void free_kthread_struct(struct task_struct *k)
{
	/*
	 * Can be NULL if this kthread was created by kernel_thread()
	 * or if kmalloc() in kthread() failed.
	 */
	kfree(to_kthread(k));
}

/**
 * kthread_should_stop - should this kthread return now?
 *
 * When someone calls kthread_stop() on your kthread, it will be woken
 * and this will return true.  You should then return, and your return
 * value will be passed through to kthread_stop().
 */
bool kthread_should_stop(void)
{
	return test_bit(KTHREAD_SHOULD_STOP, &to_kthread(current)->flags);
}
EXPORT_SYMBOL(kthread_should_stop);
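
/*
 * Illustrative example (a sketch, not from the original source): the
 * canonical loop shape for a thread terminated via kthread_stop(); the
 * return value is handed back to kthread_stop(). The names my_loop_fn
 * and my_do_work() are hypothetical placeholders.
 *
 *	static int my_loop_fn(void *data)
 *	{
 *		while (!kthread_should_stop()) {
 *			my_do_work(data);
 *			schedule_timeout_interruptible(HZ);
 *		}
 *		return 0;
 *	}
 */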

/**
 * kthread_should_park - should this kthread park now?
 *
 * When someone calls kthread_park() on your kthread, it will be woken
 * and this will return true.  You should then do the necessary
 * cleanup and call kthread_parkme().
 *
 * Similar to kthread_should_stop(), but this keeps the thread alive
 * and in a park position. kthread_unpark() "restarts" the thread and
 * calls the thread function again.
 */
bool kthread_should_park(void)
{
	return test_bit(KTHREAD_SHOULD_PARK, &to_kthread(current)->flags);
}
EXPORT_SYMBOL_GPL(kthread_should_park);

/**
 * kthread_freezable_should_stop - should this freezable kthread return now?
 * @was_frozen: optional out parameter, indicates whether %current was frozen
 *
 * kthread_should_stop() for freezable kthreads, which will enter the
 * refrigerator if necessary.  This function is safe from kthread_stop() /
 * freezer deadlock and freezable kthreads should use this function instead
 * of calling try_to_freeze() directly.
 */
bool kthread_freezable_should_stop(bool *was_frozen)
{
	bool frozen = false;

	might_sleep();

	if (unlikely(freezing(current)))
		frozen = __refrigerator(true);

	if (was_frozen)
		*was_frozen = frozen;

	return kthread_should_stop();
}
EXPORT_SYMBOL_GPL(kthread_freezable_should_stop);
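
/*
 * Illustrative example (a sketch): a freezable variant of the loop above.
 * set_freezable() clears PF_NOFREEZE, and the helper enters the
 * refrigerator on its own when a freeze is requested; my_do_work() is a
 * hypothetical placeholder.
 *
 *	static int my_freezable_fn(void *data)
 *	{
 *		bool was_frozen;
 *
 *		set_freezable();
 *		while (!kthread_freezable_should_stop(&was_frozen)) {
 *			my_do_work(data);
 *			schedule_timeout_interruptible(HZ);
 *		}
 *		return 0;
 *	}
 */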

/**
 * kthread_data - return data value specified on kthread creation
 * @task: kthread task in question
 *
 * Return the data value specified when kthread @task was created.
 * The caller is responsible for ensuring the validity of @task when
 * calling this function.
 */
void *kthread_data(struct task_struct *task)
{
	return to_kthread(task)->data;
}

/**
 * kthread_probe_data - speculative version of kthread_data()
 * @task: possible kthread task in question
 *
 * @task could be a kthread task.  Return the data value specified when it
 * was created if accessible.  If @task isn't a kthread task or its data is
 * inaccessible for any reason, %NULL is returned.  This function requires
 * that @task itself is safe to dereference.
 */
void *kthread_probe_data(struct task_struct *task)
{
	struct kthread *kthread = to_kthread(task);
	void *data = NULL;

	probe_kernel_read(&data, &kthread->data, sizeof(data));
	return data;
}

static void __kthread_parkme(struct kthread *self)
{
	__set_current_state(TASK_PARKED);
	while (test_bit(KTHREAD_SHOULD_PARK, &self->flags)) {
		if (!test_and_set_bit(KTHREAD_IS_PARKED, &self->flags))
			complete(&self->parked);
		schedule();
		__set_current_state(TASK_PARKED);
	}
	clear_bit(KTHREAD_IS_PARKED, &self->flags);
	__set_current_state(TASK_RUNNING);
}

void kthread_parkme(void)
{
	__kthread_parkme(to_kthread(current));
}
EXPORT_SYMBOL_GPL(kthread_parkme);
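
/*
 * Illustrative example (a sketch): how a parkable thread function combines
 * kthread_should_stop(), kthread_should_park() and kthread_parkme();
 * my_do_percpu_work() is a hypothetical placeholder.
 *
 *	static int my_parkable_fn(void *data)
 *	{
 *		while (!kthread_should_stop()) {
 *			if (kthread_should_park())
 *				kthread_parkme();
 *			my_do_percpu_work(data);
 *			cond_resched();
 *		}
 *		return 0;
 *	}
 */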

static int kthread(void *_create)
{
	/* Copy data: it's on kthread's stack */
	struct kthread_create_info *create = _create;
	int (*threadfn)(void *data) = create->threadfn;
	void *data = create->data;
	struct completion *done;
	struct kthread *self;
	int ret;

	self = kmalloc(sizeof(*self), GFP_KERNEL);
	set_kthread_struct(self);

	/* If user was SIGKILLed, I release the structure. */
	done = xchg(&create->done, NULL);
	if (!done) {
		kfree(create);
		do_exit(-EINTR);
	}

	if (!self) {
		create->result = ERR_PTR(-ENOMEM);
		complete(done);
		do_exit(-ENOMEM);
	}

	self->flags = 0;
	self->data = data;
	init_completion(&self->exited);
	init_completion(&self->parked);
	current->vfork_done = &self->exited;

	/* OK, tell user we're spawned, wait for stop or wakeup */
	__set_current_state(TASK_UNINTERRUPTIBLE);
	create->result = current;
	complete(done);
	schedule();

	ret = -EINTR;
	if (!test_bit(KTHREAD_SHOULD_STOP, &self->flags)) {
		__kthread_parkme(self);
		ret = threadfn(data);
	}
	do_exit(ret);
}

/* Called from do_fork() to get node information for the task about to be created. */
int tsk_fork_get_node(struct task_struct *tsk)
{
#ifdef CONFIG_NUMA
	if (tsk == kthreadd_task)
		return tsk->pref_node_fork;
#endif
	return NUMA_NO_NODE;
}

static void create_kthread(struct kthread_create_info *create)
{
	int pid;

#ifdef CONFIG_NUMA
	current->pref_node_fork = create->node;
#endif
	/* We want our own signal handler (we take no signals by default). */
	pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
	if (pid < 0) {
		/* If user was SIGKILLed, I release the structure. */
		struct completion *done = xchg(&create->done, NULL);

		if (!done) {
			kfree(create);
			return;
		}
		create->result = ERR_PTR(pid);
		complete(done);
	}
}

static __printf(4, 0)
struct task_struct *__kthread_create_on_node(int (*threadfn)(void *data),
						    void *data, int node,
						    const char namefmt[],
						    va_list args)
{
	DECLARE_COMPLETION_ONSTACK(done);
	struct task_struct *task;
	struct kthread_create_info *create = kmalloc(sizeof(*create),
						     GFP_KERNEL);

	if (!create)
		return ERR_PTR(-ENOMEM);
	create->threadfn = threadfn;
	create->data = data;
	create->node = node;
	create->done = &done;

	spin_lock(&kthread_create_lock);
	list_add_tail(&create->list, &kthread_create_list);
	spin_unlock(&kthread_create_lock);

	wake_up_process(kthreadd_task);
	/*
	 * Wait for completion in killable state, for I might be chosen by
	 * the OOM killer while kthreadd is trying to allocate memory for
	 * new kernel thread.
	 */
	if (unlikely(wait_for_completion_killable(&done))) {
		/*
		 * If I was SIGKILLed before kthreadd (or new kernel thread)
		 * calls complete(), leave the cleanup of this structure to
		 * that thread.
		 */
		if (xchg(&create->done, NULL))
			return ERR_PTR(-EINTR);
		/*
		 * kthreadd (or new kernel thread) will call complete()
		 * shortly.
		 */
		wait_for_completion(&done);
	}
	task = create->result;
	if (!IS_ERR(task)) {
		static const struct sched_param param = { .sched_priority = 0 };

		vsnprintf(task->comm, sizeof(task->comm), namefmt, args);
		/*
		 * root may have changed our (kthreadd's) priority or CPU mask.
		 * The kernel thread should not inherit these properties.
		 */
		sched_setscheduler_nocheck(task, SCHED_NORMAL, &param);
		set_cpus_allowed_ptr(task, cpu_all_mask);
	}
	kfree(create);
	return task;
}

/**
 * kthread_create_on_node - create a kthread.
 * @threadfn: the function to run until signal_pending(current).
 * @data: data ptr for @threadfn.
 * @node: task and thread structures for the thread are allocated on this node
 * @namefmt: printf-style name for the thread.
 *
 * Description: This helper function creates and names a kernel
 * thread.  The thread will be stopped: use wake_up_process() to start
 * it.  See also kthread_run().  The new thread has SCHED_NORMAL policy and
 * is affine to all CPUs.
 *
 * If the thread is going to be bound to a particular cpu, give its node
 * in @node, to get NUMA affinity for the kthread stack, or else give
 * NUMA_NO_NODE.  When woken, the thread will run @threadfn() with @data
 * as its argument. @threadfn() can either call do_exit() directly if it
 * is a standalone thread for which no one will call kthread_stop(), or
 * return when 'kthread_should_stop()' is true (which means
 * kthread_stop() has been called).  The return value should be zero
 * or a negative error number; it will be passed to kthread_stop().
 *
 * Returns a task_struct or ERR_PTR(-ENOMEM) or ERR_PTR(-EINTR).
 */
struct task_struct *kthread_create_on_node(int (*threadfn)(void *data),
					   void *data, int node,
					   const char namefmt[],
					   ...)
{
	struct task_struct *task;
	va_list args;

	va_start(args, namefmt);
	task = __kthread_create_on_node(threadfn, data, node, namefmt, args);
	va_end(args);

	return task;
}
EXPORT_SYMBOL(kthread_create_on_node);
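
/*
 * Illustrative example (a sketch): creating and starting a thread.
 * my_loop_fn, my_data and id are hypothetical; the kthread_run() macro
 * from <linux/kthread.h> wraps exactly this create-then-wake sequence.
 *
 *	struct task_struct *tsk;
 *
 *	tsk = kthread_create_on_node(my_loop_fn, my_data, NUMA_NO_NODE,
 *				     "mythread/%d", id);
 *	if (IS_ERR(tsk))
 *		return PTR_ERR(tsk);
 *	wake_up_process(tsk);
 */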

static void __kthread_bind_mask(struct task_struct *p, const struct cpumask *mask, long state)
{
	unsigned long flags;

	if (!wait_task_inactive(p, state)) {
		WARN_ON(1);
		return;
	}

	/* It's safe because the task is inactive. */
	raw_spin_lock_irqsave(&p->pi_lock, flags);
	do_set_cpus_allowed(p, mask);
	p->flags |= PF_NO_SETAFFINITY;
	raw_spin_unlock_irqrestore(&p->pi_lock, flags);
}

static void __kthread_bind(struct task_struct *p, unsigned int cpu, long state)
{
	__kthread_bind_mask(p, cpumask_of(cpu), state);
}

void kthread_bind_mask(struct task_struct *p, const struct cpumask *mask)
{
	__kthread_bind_mask(p, mask, TASK_UNINTERRUPTIBLE);
}

/**
 * kthread_bind - bind a just-created kthread to a cpu.
 * @p: thread created by kthread_create().
 * @cpu: cpu (might not be online, must be possible) for @p to run on.
 *
 * Description: This function is equivalent to set_cpus_allowed(),
 * except that @cpu doesn't need to be online, and the thread must be
 * stopped (i.e., just returned from kthread_create()).
 */
void kthread_bind(struct task_struct *p, unsigned int cpu)
{
	__kthread_bind(p, cpu, TASK_UNINTERRUPTIBLE);
}
EXPORT_SYMBOL(kthread_bind);
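
/*
 * Illustrative example (a sketch): binding must happen between
 * kthread_create() and the first wake-up, while the thread is still
 * stopped; my_loop_fn and my_data are hypothetical.
 *
 *	tsk = kthread_create_on_node(my_loop_fn, my_data, cpu_to_node(cpu),
 *				     "mythread/%u", cpu);
 *	if (!IS_ERR(tsk)) {
 *		kthread_bind(tsk, cpu);
 *		wake_up_process(tsk);
 *	}
 */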

/**
 * kthread_create_on_cpu - Create a cpu bound kthread
 * @threadfn: the function to run until signal_pending(current).
 * @data: data ptr for @threadfn.
 * @cpu: The cpu on which the thread should be bound.
 * @namefmt: printf-style name for the thread. Format is restricted
 *	     to "name.*%u". Code fills in cpu number.
 *
 * Description: This helper function creates and names a kernel thread.
 * The thread will be woken and put into park mode.
 */
struct task_struct *kthread_create_on_cpu(int (*threadfn)(void *data),
					  void *data, unsigned int cpu,
					  const char *namefmt)
{
	struct task_struct *p;

	p = kthread_create_on_node(threadfn, data, cpu_to_node(cpu), namefmt,
				   cpu);
	if (IS_ERR(p))
		return p;
	kthread_bind(p, cpu);
	/* CPU hotplug needs to bind the thread again when unparking it. */
	set_bit(KTHREAD_IS_PER_CPU, &to_kthread(p)->flags);
	to_kthread(p)->cpu = cpu;
	return p;
}

/**
 * kthread_unpark - unpark a thread created by kthread_create().
 * @k:		thread created by kthread_create().
 *
 * Sets kthread_should_park() for @k to return false and wakes the
 * thread if it was parked. If the thread is marked percpu then it is
 * bound to the cpu again before being woken.
 */
void kthread_unpark(struct task_struct *k)
{
	struct kthread *kthread = to_kthread(k);

	clear_bit(KTHREAD_SHOULD_PARK, &kthread->flags);
	/*
	 * We clear the IS_PARKED bit here as we don't wait
	 * until the task has left the park code. So if we'd
	 * park before that happens we'd see the IS_PARKED bit
	 * which might be about to be cleared.
	 */
	if (test_and_clear_bit(KTHREAD_IS_PARKED, &kthread->flags)) {
		/*
		 * A newly created kthread was parked when the CPU was
		 * offline. The binding was lost and we need to set it again.
		 */
		if (test_bit(KTHREAD_IS_PER_CPU, &kthread->flags))
			__kthread_bind(k, kthread->cpu, TASK_PARKED);
		wake_up_state(k, TASK_PARKED);
	}
}
EXPORT_SYMBOL_GPL(kthread_unpark);

/**
 * kthread_park - park a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_park() for @k to return true, wakes it, and
 * waits for it to return. This can also be called after kthread_create()
 * instead of calling wake_up_process(): the thread will park without
 * calling threadfn().
 *
 * Returns 0 if the thread is parked, -ENOSYS if the thread exited.
 * If called by the kthread itself just the park bit is set.
 */
int kthread_park(struct task_struct *k)
{
	struct kthread *kthread = to_kthread(k);

	if (WARN_ON(k->flags & PF_EXITING))
		return -ENOSYS;

	if (!test_bit(KTHREAD_IS_PARKED, &kthread->flags)) {
		set_bit(KTHREAD_SHOULD_PARK, &kthread->flags);
		if (k != current) {
			wake_up_process(k);
			wait_for_completion(&kthread->parked);
		}
	}

	return 0;
}
EXPORT_SYMBOL_GPL(kthread_park);
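
/*
 * Illustrative example (a sketch): the controller side of the park
 * protocol, e.g. around CPU hotplug. tsk is assumed to run a parkable
 * thread function such as my_parkable_fn() above, and
 * my_do_while_inactive() is a hypothetical stand-in for whatever must
 * happen while the thread is guaranteed not to be running.
 *
 *	if (!kthread_park(tsk)) {
 *		my_do_while_inactive();
 *		kthread_unpark(tsk);
 *	}
 */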

/**
 * kthread_stop - stop a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_stop() for @k to return true, wakes it, and
 * waits for it to exit. This can also be called after kthread_create()
 * instead of calling wake_up_process(): the thread will exit without
 * calling threadfn().
 *
 * If threadfn() may call do_exit() itself, the caller must ensure
 * task_struct can't go away.
 *
 * Returns the result of threadfn(), or %-EINTR if wake_up_process()
 * was never called.
 */
int kthread_stop(struct task_struct *k)
{
	struct kthread *kthread;
	int ret;

	trace_sched_kthread_stop(k);

	get_task_struct(k);
	kthread = to_kthread(k);
	set_bit(KTHREAD_SHOULD_STOP, &kthread->flags);
	kthread_unpark(k);
	wake_up_process(k);
	wait_for_completion(&kthread->exited);
	ret = k->exit_code;
	put_task_struct(k);

	trace_sched_kthread_stop_ret(ret);
	return ret;
}
EXPORT_SYMBOL(kthread_stop);
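
/*
 * Illustrative example (a sketch): tearing down the thread created in the
 * kthread_create_on_node() example; ret is whatever my_loop_fn() returned,
 * or -EINTR if the thread was never woken.
 *
 *	int ret = kthread_stop(tsk);
 */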

int kthreadd(void *unused)
{
	struct task_struct *tsk = current;

	/* Set up a clean context for our children to inherit. */
	set_task_comm(tsk, "kthreadd");
	ignore_signals(tsk);
	set_cpus_allowed_ptr(tsk, cpu_all_mask);
	set_mems_allowed(node_states[N_MEMORY]);

	current->flags |= PF_NOFREEZE;

	for (;;) {
		set_current_state(TASK_INTERRUPTIBLE);
		if (list_empty(&kthread_create_list))
			schedule();
		__set_current_state(TASK_RUNNING);

		spin_lock(&kthread_create_lock);
		while (!list_empty(&kthread_create_list)) {
			struct kthread_create_info *create;

			create = list_entry(kthread_create_list.next,
					    struct kthread_create_info, list);
			list_del_init(&create->list);
			spin_unlock(&kthread_create_lock);

			create_kthread(create);

			spin_lock(&kthread_create_lock);
		}
		spin_unlock(&kthread_create_lock);
	}

	return 0;
}

void __kthread_init_worker(struct kthread_worker *worker,
				const char *name,
				struct lock_class_key *key)
{
	memset(worker, 0, sizeof(struct kthread_worker));
	spin_lock_init(&worker->lock);
	lockdep_set_class_and_name(&worker->lock, key, name);
	INIT_LIST_HEAD(&worker->work_list);
	INIT_LIST_HEAD(&worker->delayed_work_list);
}
EXPORT_SYMBOL_GPL(__kthread_init_worker);

/**
 * kthread_worker_fn - kthread function to process kthread_worker
 * @worker_ptr: pointer to initialized kthread_worker
 *
 * This function implements the main cycle of the kthread worker. It
 * processes work_list until it is stopped with kthread_stop(). It sleeps
 * when the queue is empty.
 *
 * Works must not hold any locks or leave preemption or interrupts
 * disabled when they finish. A safe point for freezing is provided after
 * one work finishes and before the next one is started.
 *
 * Also, a work must not be handled by more than one worker at the same
 * time, see also kthread_queue_work().
 */
int kthread_worker_fn(void *worker_ptr)
{
	struct kthread_worker *worker = worker_ptr;
	struct kthread_work *work;

	/*
	 * FIXME: Update the check and remove the assignment when all kthread
	 * worker users are created using kthread_create_worker*() functions.
	 */
	WARN_ON(worker->task && worker->task != current);
	worker->task = current;

	if (worker->flags & KTW_FREEZABLE)
		set_freezable();

repeat:
	set_current_state(TASK_INTERRUPTIBLE);	/* mb paired w/ kthread_stop */

	if (kthread_should_stop()) {
		__set_current_state(TASK_RUNNING);
		spin_lock_irq(&worker->lock);
		worker->task = NULL;
		spin_unlock_irq(&worker->lock);
		return 0;
	}

	work = NULL;
	spin_lock_irq(&worker->lock);
	if (!list_empty(&worker->work_list)) {
		work = list_first_entry(&worker->work_list,
					struct kthread_work, node);
		list_del_init(&work->node);
	}
	worker->current_work = work;
	spin_unlock_irq(&worker->lock);

	if (work) {
		__set_current_state(TASK_RUNNING);
		work->func(work);
	} else if (!freezing(current))
		schedule();

	try_to_freeze();
	goto repeat;
}
EXPORT_SYMBOL_GPL(kthread_worker_fn);

static __printf(3, 0) struct kthread_worker *
__kthread_create_worker(int cpu, unsigned int flags,
			const char namefmt[], va_list args)
{
	struct kthread_worker *worker;
	struct task_struct *task;
	int node = -1;

	worker = kzalloc(sizeof(*worker), GFP_KERNEL);
	if (!worker)
		return ERR_PTR(-ENOMEM);

	kthread_init_worker(worker);

	if (cpu >= 0)
		node = cpu_to_node(cpu);

	task = __kthread_create_on_node(kthread_worker_fn, worker,
						node, namefmt, args);
	if (IS_ERR(task))
		goto fail_task;

	if (cpu >= 0)
		kthread_bind(task, cpu);

	worker->flags = flags;
	worker->task = task;
	wake_up_process(task);
	return worker;

fail_task:
	kfree(worker);
	return ERR_CAST(task);
}

/**
 * kthread_create_worker - create a kthread worker
 * @flags: flags modifying the default behavior of the worker
 * @namefmt: printf-style name for the kthread worker (task).
 *
 * Returns a pointer to the allocated worker on success, ERR_PTR(-ENOMEM)
 * when the needed structures could not get allocated, and ERR_PTR(-EINTR)
 * when the worker was SIGKILLed.
 */
struct kthread_worker *
kthread_create_worker(unsigned int flags, const char namefmt[], ...)
{
	struct kthread_worker *worker;
	va_list args;

	va_start(args, namefmt);
	worker = __kthread_create_worker(-1, flags, namefmt, args);
	va_end(args);

	return worker;
}
EXPORT_SYMBOL(kthread_create_worker);
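
/*
 * Illustrative example (a sketch): creating a worker and queuing a work
 * item on it. my_work_fn and my_work are hypothetical; the struct
 * kthread_work must stay alive until the work has finished.
 *
 *	static void my_work_fn(struct kthread_work *work)
 *	{
 *		pr_info("work ran\n");
 *	}
 *
 *	static struct kthread_work my_work;
 *	struct kthread_worker *worker;
 *
 *	worker = kthread_create_worker(0, "my_worker");
 *	if (IS_ERR(worker))
 *		return PTR_ERR(worker);
 *	kthread_init_work(&my_work, my_work_fn);
 *	kthread_queue_work(worker, &my_work);
 */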

/**
 * kthread_create_worker_on_cpu - create a kthread worker and bind it
 *	to a given CPU and the associated NUMA node.
 * @cpu: CPU number
 * @flags: flags modifying the default behavior of the worker
 * @namefmt: printf-style name for the kthread worker (task).
 *
 * Use a valid CPU number if you want to bind the kthread worker
 * to the given CPU and the associated NUMA node.
 *
 * A good practice is to include the cpu number in the worker name.
 * For example, use kthread_create_worker_on_cpu(cpu, 0, "helper/%d", cpu).
 *
 * Returns a pointer to the allocated worker on success, ERR_PTR(-ENOMEM)
 * when the needed structures could not get allocated, and ERR_PTR(-EINTR)
 * when the worker was SIGKILLed.
 */
struct kthread_worker *
kthread_create_worker_on_cpu(int cpu, unsigned int flags,
			     const char namefmt[], ...)
{
	struct kthread_worker *worker;
	va_list args;

	va_start(args, namefmt);
	worker = __kthread_create_worker(cpu, flags, namefmt, args);
	va_end(args);

	return worker;
}
EXPORT_SYMBOL(kthread_create_worker_on_cpu);

/*
 * Returns true when the work could not be queued at the moment.
 * This happens when it is already pending in a worker list
 * or when it is being cancelled.
 */
static inline bool queuing_blocked(struct kthread_worker *worker,
				   struct kthread_work *work)
{
	lockdep_assert_held(&worker->lock);

	return !list_empty(&work->node) || work->canceling;
}

static void kthread_insert_work_sanity_check(struct kthread_worker *worker,
					     struct kthread_work *work)
{
	lockdep_assert_held(&worker->lock);
	WARN_ON_ONCE(!list_empty(&work->node));
	/* Do not use a work with >1 worker, see kthread_queue_work() */
	WARN_ON_ONCE(work->worker && work->worker != worker);
}

/* insert @work before @pos in @worker */
static void kthread_insert_work(struct kthread_worker *worker,
				struct kthread_work *work,
				struct list_head *pos)
{
	kthread_insert_work_sanity_check(worker, work);

	list_add_tail(&work->node, pos);
	work->worker = worker;
	if (!worker->current_work && likely(worker->task))
		wake_up_process(worker->task);
}

/**
 * kthread_queue_work - queue a kthread_work
 * @worker: target kthread_worker
 * @work: kthread_work to queue
 *
 * Queue @work to @worker for async execution.  The worker must have been
 * created with kthread_create_worker().  Returns %true if @work was
 * successfully queued, %false if it was already pending.
 *
 * Reinitialize the work if it needs to be used by another worker.
 * For example, when the worker was stopped and started again.
 */
bool kthread_queue_work(struct kthread_worker *worker,
			struct kthread_work *work)
{
	bool ret = false;
	unsigned long flags;

	spin_lock_irqsave(&worker->lock, flags);
	if (!queuing_blocked(worker, work)) {
		kthread_insert_work(worker, work, &worker->work_list);
		ret = true;
	}
	spin_unlock_irqrestore(&worker->lock, flags);
	return ret;
}
EXPORT_SYMBOL_GPL(kthread_queue_work);

/**
 * kthread_delayed_work_timer_fn - callback that queues the associated kthread
 *	delayed work when the timer expires.
 * @__data: pointer to the data associated with the timer
 *
 * The format of the function is defined by struct timer_list.
 * It is called from an irq-safe timer with interrupts already disabled.
 */
void kthread_delayed_work_timer_fn(unsigned long __data)
{
	struct kthread_delayed_work *dwork =
		(struct kthread_delayed_work *)__data;
	struct kthread_work *work = &dwork->work;
	struct kthread_worker *worker = work->worker;

	/*
	 * This might happen when a pending work is reinitialized.
	 * It means that the work is being used in a wrong way.
	 */
	if (WARN_ON_ONCE(!worker))
		return;

	spin_lock(&worker->lock);
	/* Work must not be used with >1 worker, see kthread_queue_work(). */
	WARN_ON_ONCE(work->worker != worker);

	/* Move the work from worker->delayed_work_list. */
	WARN_ON_ONCE(list_empty(&work->node));
	list_del_init(&work->node);
	kthread_insert_work(worker, work, &worker->work_list);

	spin_unlock(&worker->lock);
}
EXPORT_SYMBOL(kthread_delayed_work_timer_fn);

void __kthread_queue_delayed_work(struct kthread_worker *worker,
				  struct kthread_delayed_work *dwork,
				  unsigned long delay)
{
	struct timer_list *timer = &dwork->timer;
	struct kthread_work *work = &dwork->work;

	WARN_ON_ONCE(timer->function != kthread_delayed_work_timer_fn ||
		     timer->data != (unsigned long)dwork);

	/*
	 * If @delay is 0, queue @dwork->work immediately.  This is for
	 * both optimization and correctness.  The earliest @timer can
	 * expire is on the closest next tick and delayed_work users depend
	 * on that there's no such delay when @delay is 0.
	 */
	if (!delay) {
		kthread_insert_work(worker, work, &worker->work_list);
		return;
	}

	/* Be paranoid and try to detect possible races already now. */
	kthread_insert_work_sanity_check(worker, work);

	list_add(&work->node, &worker->delayed_work_list);
	work->worker = worker;
	timer->expires = jiffies + delay;
	add_timer(timer);
}

/**
 * kthread_queue_delayed_work - queue the associated kthread work
 *	after a delay.
 * @worker: target kthread_worker
 * @dwork: kthread_delayed_work to queue
 * @delay: number of jiffies to wait before queuing
 *
 * If the work has not been pending, it starts a timer that will queue
 * the work after the given @delay. If @delay is zero, it queues the
 * work immediately.
 *
 * Return: %false if the @work was already pending, meaning that either
 * the timer was running or the work was queued. %true otherwise.
 */
bool kthread_queue_delayed_work(struct kthread_worker *worker,
				struct kthread_delayed_work *dwork,
				unsigned long delay)
{
	struct kthread_work *work = &dwork->work;
	unsigned long flags;
	bool ret = false;

	spin_lock_irqsave(&worker->lock, flags);

	if (!queuing_blocked(worker, work)) {
		__kthread_queue_delayed_work(worker, dwork, delay);
		ret = true;
	}

	spin_unlock_irqrestore(&worker->lock, flags);
	return ret;
}
EXPORT_SYMBOL_GPL(kthread_queue_delayed_work);
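
/*
 * Illustrative example (a sketch): queuing a delayed work on the worker
 * from the kthread_create_worker() example; my_dwork is hypothetical and
 * msecs_to_jiffies() converts the delay into jiffies.
 *
 *	static struct kthread_delayed_work my_dwork;
 *
 *	kthread_init_delayed_work(&my_dwork, my_work_fn);
 *	kthread_queue_delayed_work(worker, &my_dwork,
 *				   msecs_to_jiffies(100));
 */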

struct kthread_flush_work {
	struct kthread_work	work;
	struct completion	done;
};

static void kthread_flush_work_fn(struct kthread_work *work)
{
	struct kthread_flush_work *fwork =
		container_of(work, struct kthread_flush_work, work);
	complete(&fwork->done);
}

/**
 * kthread_flush_work - flush a kthread_work
 * @work: work to flush
 *
 * If @work is queued or executing, wait for it to finish execution.
 */
void kthread_flush_work(struct kthread_work *work)
{
	struct kthread_flush_work fwork = {
		KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
		COMPLETION_INITIALIZER_ONSTACK(fwork.done),
	};
	struct kthread_worker *worker;
	bool noop = false;

	worker = work->worker;
	if (!worker)
		return;

	spin_lock_irq(&worker->lock);
	/* Work must not be used with >1 worker, see kthread_queue_work(). */
	WARN_ON_ONCE(work->worker != worker);

	if (!list_empty(&work->node))
		kthread_insert_work(worker, &fwork.work, work->node.next);
	else if (worker->current_work == work)
		kthread_insert_work(worker, &fwork.work,
				    worker->work_list.next);
	else
		noop = true;

	spin_unlock_irq(&worker->lock);

	if (!noop)
		wait_for_completion(&fwork.done);
}
EXPORT_SYMBOL_GPL(kthread_flush_work);

/*
 * This function removes the work from the worker queue. Also it makes sure
 * that it won't get queued later via the delayed work's timer.
 *
 * The work might still be in use when this function finishes. See the
 * current_work processed by the worker.
 *
 * Return: %true if @work was pending and successfully canceled,
 *	%false if @work was not pending.
 */
static bool __kthread_cancel_work(struct kthread_work *work, bool is_dwork,
				  unsigned long *flags)
{
	/* Try to cancel the timer if it exists. */
	if (is_dwork) {
		struct kthread_delayed_work *dwork =
			container_of(work, struct kthread_delayed_work, work);
		struct kthread_worker *worker = work->worker;

		/*
		 * del_timer_sync() must be called to make sure that the timer
		 * callback is not running. The lock must be temporarily
		 * released to avoid a deadlock with the callback. In the
		 * meantime, any queuing is blocked by setting the canceling
		 * counter.
		 */
		work->canceling++;
		spin_unlock_irqrestore(&worker->lock, *flags);
		del_timer_sync(&dwork->timer);
		spin_lock_irqsave(&worker->lock, *flags);
		work->canceling--;
	}

	/*
	 * Try to remove the work from a worker list. It might either
	 * be from worker->work_list or from worker->delayed_work_list.
	 */
	if (!list_empty(&work->node)) {
		list_del_init(&work->node);
		return true;
	}

	return false;
}

/**
 * kthread_mod_delayed_work - modify delay of or queue a kthread delayed work
 * @worker: kthread worker to use
 * @dwork: kthread delayed work to queue
 * @delay: number of jiffies to wait before queuing
 *
 * If @dwork is idle, equivalent to kthread_queue_delayed_work(). Otherwise,
 * modify @dwork's timer so that it expires after @delay. If @delay is zero,
 * @work is guaranteed to be queued immediately.
 *
 * Return: %true if @dwork was pending and its timer was modified,
 * %false otherwise.
 *
 * A special case is when the work is being canceled in parallel.
 * It might be caused either by the real kthread_cancel_delayed_work_sync()
 * or yet another kthread_mod_delayed_work() call. We let the other command
 * win and return %false here. The caller is supposed to synchronize these
 * operations in a reasonable way.
 *
 * This function is safe to call from any context including IRQ handler.
 * See __kthread_cancel_work() and kthread_delayed_work_timer_fn()
 * for details.
 */
bool kthread_mod_delayed_work(struct kthread_worker *worker,
			      struct kthread_delayed_work *dwork,
			      unsigned long delay)
{
	struct kthread_work *work = &dwork->work;
	unsigned long flags;
	int ret = false;

	spin_lock_irqsave(&worker->lock, flags);

	/* Do not bother with canceling when never queued. */
	if (!work->worker)
		goto fast_queue;

	/* Work must not be used with >1 worker, see kthread_queue_work() */
	WARN_ON_ONCE(work->worker != worker);

	/* Do not fight with another command that is canceling this work. */
	if (work->canceling)
		goto out;

	ret = __kthread_cancel_work(work, true, &flags);
fast_queue:
	__kthread_queue_delayed_work(worker, dwork, delay);
out:
	spin_unlock_irqrestore(&worker->lock, flags);
	return ret;
}
EXPORT_SYMBOL_GPL(kthread_mod_delayed_work);
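
/*
 * Illustrative example (a sketch): a watchdog-style pattern where every
 * call pushes the deadline out again; reuses the hypothetical my_dwork
 * from the example above and may be called from IRQ context.
 *
 *	kthread_mod_delayed_work(worker, &my_dwork, HZ);
 */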

static bool __kthread_cancel_work_sync(struct kthread_work *work, bool is_dwork)
{
	struct kthread_worker *worker = work->worker;
	unsigned long flags;
	int ret = false;

	if (!worker)
		goto out;

	spin_lock_irqsave(&worker->lock, flags);
	/* Work must not be used with >1 worker, see kthread_queue_work(). */
	WARN_ON_ONCE(work->worker != worker);

	ret = __kthread_cancel_work(work, is_dwork, &flags);

	if (worker->current_work != work)
		goto out_fast;

	/*
	 * The work is in progress and we need to wait with the lock released.
	 * In the meantime, block any queuing by setting the canceling counter.
	 */
	work->canceling++;
	spin_unlock_irqrestore(&worker->lock, flags);
	kthread_flush_work(work);
	spin_lock_irqsave(&worker->lock, flags);
	work->canceling--;

out_fast:
	spin_unlock_irqrestore(&worker->lock, flags);
out:
	return ret;
}

/**
 * kthread_cancel_work_sync - cancel a kthread work and wait for it to finish
 * @work: the kthread work to cancel
 *
 * Cancel @work and wait for its execution to finish.  This function
 * can be used even if the work re-queues itself. On return from this
 * function, @work is guaranteed to be not pending or executing on any CPU.
 *
 * kthread_cancel_work_sync(&delayed_work->work) must not be used for
 * delayed works. Use kthread_cancel_delayed_work_sync() instead.
 *
 * The caller must ensure that the worker on which @work was last
 * queued can't be destroyed before this function returns.
 *
 * Return: %true if @work was pending, %false otherwise.
 */
bool kthread_cancel_work_sync(struct kthread_work *work)
{
	return __kthread_cancel_work_sync(work, false);
}
EXPORT_SYMBOL_GPL(kthread_cancel_work_sync);

/**
 * kthread_cancel_delayed_work_sync - cancel a kthread delayed work and
 *	wait for it to finish.
 * @dwork: the kthread delayed work to cancel
 *
 * This is kthread_cancel_work_sync() for delayed works.
 *
 * Return: %true if @dwork was pending, %false otherwise.
 */
bool kthread_cancel_delayed_work_sync(struct kthread_delayed_work *dwork)
{
	return __kthread_cancel_work_sync(&dwork->work, true);
}
EXPORT_SYMBOL_GPL(kthread_cancel_delayed_work_sync);

/**
 * kthread_flush_worker - flush all current works on a kthread_worker
 * @worker: worker to flush
 *
 * Wait until all currently executing or pending works on @worker are
 * finished.
 */
void kthread_flush_worker(struct kthread_worker *worker)
{
	struct kthread_flush_work fwork = {
		KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
		COMPLETION_INITIALIZER_ONSTACK(fwork.done),
	};

	kthread_queue_work(worker, &fwork.work);
	wait_for_completion(&fwork.done);
}
EXPORT_SYMBOL_GPL(kthread_flush_worker);

/**
 * kthread_destroy_worker - destroy a kthread worker
 * @worker: worker to be destroyed
 *
 * Flush and destroy @worker.  The simple flush is enough because the kthread
 * worker API is used only in trivial scenarios.  There are no multi-step state
 * machines needed.
 */
void kthread_destroy_worker(struct kthread_worker *worker)
{
	struct task_struct *task;

	task = worker->task;
	if (WARN_ON(!task))
		return;

	kthread_flush_worker(worker);
	kthread_stop(task);
	WARN_ON(!list_empty(&worker->work_list));
	kfree(worker);
}
EXPORT_SYMBOL(kthread_destroy_worker);
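
/*
 * Illustrative example (a sketch): tearing down the worker from the
 * examples above. Pending delayed works are canceled first because
 * kthread_destroy_worker() only flushes; my_dwork is hypothetical.
 *
 *	kthread_cancel_delayed_work_sync(&my_dwork);
 *	kthread_destroy_worker(worker);
 */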