2005-04-17 06:20:36 +08:00
|
|
|
/* Kernel thread helper functions.
|
|
|
|
* Copyright (C) 2004 IBM Corporation, Rusty Russell.
|
|
|
|
*
|
2007-05-09 17:34:32 +08:00
|
|
|
* Creation is done via kthreadd, so that we get a clean environment
|
2005-04-17 06:20:36 +08:00
|
|
|
* even if we're invoked from userspace (think modprobe, hotplug cpu,
|
|
|
|
* etc.).
|
|
|
|
*/
|
|
|
|
#include <linux/sched.h>
|
|
|
|
#include <linux/kthread.h>
|
|
|
|
#include <linux/completion.h>
|
|
|
|
#include <linux/err.h>
|
cpuset,mm: update tasks' mems_allowed in time
Fix allocating page cache/slab object on the unallowed node when memory
spread is set by updating tasks' mems_allowed after its cpuset's mems is
changed.
In order to update tasks' mems_allowed in time, we must modify the code of
memory policy. Because the memory policy is applied in the process's
context originally. After applying this patch, one task directly
manipulates another's mems_allowed, and we use alloc_lock in the
task_struct to protect mems_allowed and memory policy of the task.
But in the fast path, we didn't use lock to protect them, because adding a
lock may lead to performance regression. But if we don't add a lock, the
task might see no nodes when changing cpuset's mems_allowed to some
non-overlapping set. In order to avoid it, we set all new allowed nodes,
then clear newly disallowed ones.
[lee.schermerhorn@hp.com:
The rework of mpol_new() to extract the adjusting of the node mask to
apply cpuset and mpol flags "context" breaks set_mempolicy() and mbind()
with MPOL_PREFERRED and a NULL nodemask--i.e., explicit local
allocation. Fix this by adding the check for MPOL_PREFERRED and empty
node mask to mpol_new_mempolicy().
Remove the now unneeded 'nodes = NULL' from mpol_new().
Note that mpol_new_mempolicy() is always called with a non-NULL
'nodes' parameter now that it has been removed from mpol_new().
Therefore, we don't need to test nodes for NULL before testing it for
'empty'. However, just to be extra paranoid, add a VM_BUG_ON() to
verify this assumption.]
[lee.schermerhorn@hp.com:
I don't think the function name 'mpol_new_mempolicy' is descriptive
enough to differentiate it from mpol_new().
This function applies cpuset set context, usually constraining nodes
to those allowed by the cpuset. However, when the 'RELATIVE_NODES flag
is set, it also translates the nodes. So I settled on
'mpol_set_nodemask()', because the comment block for mpol_new() mentions
that we need to call this function to "set nodes".
Some additional minor line length, whitespace and typo cleanup.]
Signed-off-by: Miao Xie <miaox@cn.fujitsu.com>
Cc: Ingo Molnar <mingo@elte.hu>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Cc: Christoph Lameter <cl@linux-foundation.org>
Cc: Paul Menage <menage@google.com>
Cc: Nick Piggin <nickpiggin@yahoo.com.au>
Cc: Yasunori Goto <y-goto@jp.fujitsu.com>
Cc: Pekka Enberg <penberg@cs.helsinki.fi>
Cc: David Rientjes <rientjes@google.com>
Signed-off-by: Lee Schermerhorn <lee.schermerhorn@hp.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2009-06-17 06:31:49 +08:00
|
|
|
#include <linux/cpuset.h>
|
2005-04-17 06:20:36 +08:00
|
|
|
#include <linux/unistd.h>
|
|
|
|
#include <linux/file.h>
|
2011-05-24 02:51:41 +08:00
|
|
|
#include <linux/export.h>
|
2006-03-23 19:00:24 +08:00
|
|
|
#include <linux/mutex.h>
|
2010-06-29 16:07:09 +08:00
|
|
|
#include <linux/slab.h>
|
|
|
|
#include <linux/freezer.h>
|
2012-10-11 09:28:25 +08:00
|
|
|
#include <linux/ptrace.h>
|
2013-05-01 06:27:21 +08:00
|
|
|
#include <linux/uaccess.h>
|
2009-04-15 07:39:12 +08:00
|
|
|
#include <trace/events/sched.h>
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2007-05-09 17:34:32 +08:00
|
|
|
/* Held around additions to and removals from kthread_create_list. */
static DEFINE_SPINLOCK(kthread_create_lock);
|
|
|
|
/*
 * Pending struct kthread_create_info requests: appended by
 * __kthread_create_on_node() and drained by kthreadd().
 */
static LIST_HEAD(kthread_create_list);
|
|
|
|
/*
 * Task woken by __kthread_create_on_node() after it queues a request, and
 * the task tsk_fork_get_node() compares against. It is not assigned in this
 * part of the file.
 */
struct task_struct *kthreadd_task;
|
2005-04-17 06:20:36 +08:00
|
|
|
|
|
|
|
struct kthread_create_info
|
|
|
|
{
|
2007-05-09 17:34:32 +08:00
|
|
|
/* Information passed to kthread() from kthreadd. */
|
2005-04-17 06:20:36 +08:00
|
|
|
int (*threadfn)(void *data);
|
|
|
|
void *data;
|
2011-03-23 07:30:44 +08:00
|
|
|
int node;
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2007-05-09 17:34:32 +08:00
|
|
|
/* Result passed back to kthread_create() from kthreadd. */
|
2005-04-17 06:20:36 +08:00
|
|
|
struct task_struct *result;
|
2013-11-13 07:06:45 +08:00
|
|
|
struct completion *done;
|
2006-11-22 22:55:48 +08:00
|
|
|
|
2007-05-09 17:34:32 +08:00
|
|
|
struct list_head list;
|
2005-04-17 06:20:36 +08:00
|
|
|
};
|
|
|
|
|
2009-06-18 07:27:45 +08:00
|
|
|
struct kthread {
|
2012-07-16 18:42:36 +08:00
|
|
|
unsigned long flags;
|
|
|
|
unsigned int cpu;
|
2010-06-29 16:07:09 +08:00
|
|
|
void *data;
|
2012-07-16 18:42:36 +08:00
|
|
|
struct completion parked;
|
2009-06-18 07:27:45 +08:00
|
|
|
struct completion exited;
|
2005-04-17 06:20:36 +08:00
|
|
|
};
|
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
/* Bit numbers used with the bitops on struct kthread::flags. */
enum KTHREAD_BITS {
	KTHREAD_IS_PER_CPU = 0,	/* set by kthread_create_on_cpu() */
	KTHREAD_SHOULD_STOP,	/* set by kthread_stop() */
	KTHREAD_SHOULD_PARK,	/* set by kthread_park(), cleared on unpark */
	KTHREAD_IS_PARKED,	/* set by the thread itself in __kthread_parkme() */
};
|
|
|
|
|
2013-04-30 06:05:01 +08:00
|
|
|
/*
 * Convert a pointer to the 'exited' completion (what ->vfork_done points
 * at for a kthread) back into its enclosing struct kthread.
 */
#define __to_kthread(vfork)	container_of(vfork, struct kthread, exited)
|
|
|
|
|
|
|
|
static inline struct kthread *to_kthread(struct task_struct *k)
|
|
|
|
{
|
|
|
|
return __to_kthread(k->vfork_done);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct kthread *to_live_kthread(struct task_struct *k)
|
|
|
|
{
|
|
|
|
struct completion *vfork = ACCESS_ONCE(k->vfork_done);
|
2016-09-16 13:45:44 +08:00
|
|
|
if (likely(vfork) && try_get_task_stack(k))
|
2013-04-30 06:05:01 +08:00
|
|
|
return __to_kthread(vfork);
|
|
|
|
return NULL;
|
|
|
|
}
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2006-06-25 20:49:19 +08:00
|
|
|
/**
|
|
|
|
* kthread_should_stop - should this kthread return now?
|
|
|
|
*
|
2007-02-10 17:45:59 +08:00
|
|
|
* When someone calls kthread_stop() on your kthread, it will be woken
|
2006-06-25 20:49:19 +08:00
|
|
|
* and this will return true. You should then return, and your return
|
|
|
|
* value will be passed through to kthread_stop().
|
|
|
|
*/
|
2012-07-16 18:42:36 +08:00
|
|
|
bool kthread_should_stop(void)
|
2005-04-17 06:20:36 +08:00
|
|
|
{
|
2012-07-16 18:42:36 +08:00
|
|
|
return test_bit(KTHREAD_SHOULD_STOP, &to_kthread(current)->flags);
|
2005-04-17 06:20:36 +08:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kthread_should_stop);
|
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
/**
|
|
|
|
* kthread_should_park - should this kthread park now?
|
|
|
|
*
|
|
|
|
* When someone calls kthread_park() on your kthread, it will be woken
|
|
|
|
* and this will return true. You should then do the necessary
|
|
|
|
* cleanup and call kthread_parkme()
|
|
|
|
*
|
|
|
|
* Similar to kthread_should_stop(), but this keeps the thread alive
|
|
|
|
* and in a park position. kthread_unpark() "restarts" the thread and
|
|
|
|
* calls the thread function again.
|
|
|
|
*/
|
|
|
|
bool kthread_should_park(void)
|
|
|
|
{
|
|
|
|
return test_bit(KTHREAD_SHOULD_PARK, &to_kthread(current)->flags);
|
|
|
|
}
|
2015-08-07 06:46:45 +08:00
|
|
|
EXPORT_SYMBOL_GPL(kthread_should_park);
|
2012-07-16 18:42:36 +08:00
|
|
|
|
2011-11-22 04:32:23 +08:00
|
|
|
/**
|
|
|
|
* kthread_freezable_should_stop - should this freezable kthread return now?
|
|
|
|
* @was_frozen: optional out parameter, indicates whether %current was frozen
|
|
|
|
*
|
|
|
|
* kthread_should_stop() for freezable kthreads, which will enter
|
|
|
|
* refrigerator if necessary. This function is safe from kthread_stop() /
|
|
|
|
* freezer deadlock and freezable kthreads should use this function instead
|
|
|
|
* of calling try_to_freeze() directly.
|
|
|
|
*/
|
|
|
|
bool kthread_freezable_should_stop(bool *was_frozen)
|
|
|
|
{
|
|
|
|
bool frozen = false;
|
|
|
|
|
|
|
|
might_sleep();
|
|
|
|
|
|
|
|
if (unlikely(freezing(current)))
|
|
|
|
frozen = __refrigerator(true);
|
|
|
|
|
|
|
|
if (was_frozen)
|
|
|
|
*was_frozen = frozen;
|
|
|
|
|
|
|
|
return kthread_should_stop();
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(kthread_freezable_should_stop);
|
|
|
|
|
2010-06-29 16:07:09 +08:00
|
|
|
/**
|
|
|
|
* kthread_data - return data value specified on kthread creation
|
|
|
|
* @task: kthread task in question
|
|
|
|
*
|
|
|
|
* Return the data value specified when kthread @task was created.
|
|
|
|
* The caller is responsible for ensuring the validity of @task when
|
|
|
|
* calling this function.
|
|
|
|
*/
|
|
|
|
void *kthread_data(struct task_struct *task)
|
|
|
|
{
|
|
|
|
return to_kthread(task)->data;
|
|
|
|
}
|
|
|
|
|
2013-05-01 06:27:21 +08:00
|
|
|
/**
|
2016-10-12 04:55:17 +08:00
|
|
|
* kthread_probe_data - speculative version of kthread_data()
|
2013-05-01 06:27:21 +08:00
|
|
|
* @task: possible kthread task in question
|
|
|
|
*
|
|
|
|
* @task could be a kthread task. Return the data value specified when it
|
|
|
|
* was created if accessible. If @task isn't a kthread task or its data is
|
|
|
|
* inaccessible for any reason, %NULL is returned. This function requires
|
|
|
|
* that @task itself is safe to dereference.
|
|
|
|
*/
|
2016-10-12 04:55:17 +08:00
|
|
|
void *kthread_probe_data(struct task_struct *task)
|
2013-05-01 06:27:21 +08:00
|
|
|
{
|
|
|
|
struct kthread *kthread = to_kthread(task);
|
|
|
|
void *data = NULL;
|
|
|
|
|
|
|
|
probe_kernel_read(&data, &kthread->data, sizeof(data));
|
|
|
|
return data;
|
|
|
|
}
|
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
static void __kthread_parkme(struct kthread *self)
|
|
|
|
{
|
2013-04-09 15:33:34 +08:00
|
|
|
__set_current_state(TASK_PARKED);
|
2012-07-16 18:42:36 +08:00
|
|
|
while (test_bit(KTHREAD_SHOULD_PARK, &self->flags)) {
|
|
|
|
if (!test_and_set_bit(KTHREAD_IS_PARKED, &self->flags))
|
|
|
|
complete(&self->parked);
|
|
|
|
schedule();
|
2013-04-09 15:33:34 +08:00
|
|
|
__set_current_state(TASK_PARKED);
|
2012-07-16 18:42:36 +08:00
|
|
|
}
|
|
|
|
clear_bit(KTHREAD_IS_PARKED, &self->flags);
|
|
|
|
__set_current_state(TASK_RUNNING);
|
|
|
|
}
|
|
|
|
|
|
|
|
void kthread_parkme(void)
|
|
|
|
{
|
|
|
|
__kthread_parkme(to_kthread(current));
|
|
|
|
}
|
2015-08-07 06:46:45 +08:00
|
|
|
EXPORT_SYMBOL_GPL(kthread_parkme);
|
2012-07-16 18:42:36 +08:00
|
|
|
|
2005-04-17 06:20:36 +08:00
|
|
|
static int kthread(void *_create)
|
|
|
|
{
|
2009-06-18 07:27:45 +08:00
|
|
|
/* Copy data: it's on kthread's stack */
|
2005-04-17 06:20:36 +08:00
|
|
|
struct kthread_create_info *create = _create;
|
2009-06-18 07:27:45 +08:00
|
|
|
int (*threadfn)(void *data) = create->threadfn;
|
|
|
|
void *data = create->data;
|
2013-11-13 07:06:45 +08:00
|
|
|
struct completion *done;
|
2009-06-18 07:27:45 +08:00
|
|
|
struct kthread self;
|
|
|
|
int ret;
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
self.flags = 0;
|
2010-06-29 16:07:09 +08:00
|
|
|
self.data = data;
|
2009-06-18 07:27:45 +08:00
|
|
|
init_completion(&self.exited);
|
2012-07-16 18:42:36 +08:00
|
|
|
init_completion(&self.parked);
|
2009-06-18 07:27:45 +08:00
|
|
|
current->vfork_done = &self.exited;
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2013-11-13 07:06:45 +08:00
|
|
|
/* If user was SIGKILLed, I release the structure. */
|
|
|
|
done = xchg(&create->done, NULL);
|
|
|
|
if (!done) {
|
|
|
|
kfree(create);
|
|
|
|
do_exit(-EINTR);
|
|
|
|
}
|
2005-04-17 06:20:36 +08:00
|
|
|
/* OK, tell user we're spawned, wait for stop or wakeup */
|
2007-05-24 04:57:27 +08:00
|
|
|
__set_current_state(TASK_UNINTERRUPTIBLE);
|
2009-04-09 23:50:35 +08:00
|
|
|
create->result = current;
|
2013-11-13 07:06:45 +08:00
|
|
|
complete(done);
|
2005-04-17 06:20:36 +08:00
|
|
|
schedule();
|
|
|
|
|
2009-06-18 07:27:45 +08:00
|
|
|
ret = -EINTR;
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
if (!test_bit(KTHREAD_SHOULD_STOP, &self.flags)) {
|
|
|
|
__kthread_parkme(&self);
|
|
|
|
ret = threadfn(data);
|
|
|
|
}
|
2009-06-18 07:27:45 +08:00
|
|
|
/* we can't just return, we must preserve "self" on stack */
|
|
|
|
do_exit(ret);
|
2005-04-17 06:20:36 +08:00
|
|
|
}
|
|
|
|
|
2011-03-23 07:30:44 +08:00
|
|
|
/* called from do_fork() to get node information for about to be created task */
|
|
|
|
int tsk_fork_get_node(struct task_struct *tsk)
|
|
|
|
{
|
|
|
|
#ifdef CONFIG_NUMA
|
|
|
|
if (tsk == kthreadd_task)
|
|
|
|
return tsk->pref_node_fork;
|
|
|
|
#endif
|
2014-04-04 05:46:25 +08:00
|
|
|
return NUMA_NO_NODE;
|
2011-03-23 07:30:44 +08:00
|
|
|
}
|
|
|
|
|
2007-05-09 17:34:32 +08:00
|
|
|
static void create_kthread(struct kthread_create_info *create)
|
2005-04-17 06:20:36 +08:00
|
|
|
{
|
|
|
|
int pid;
|
|
|
|
|
2011-03-23 07:30:44 +08:00
|
|
|
#ifdef CONFIG_NUMA
|
|
|
|
current->pref_node_fork = create->node;
|
|
|
|
#endif
|
2005-04-17 06:20:36 +08:00
|
|
|
/* We want our own signal handler (we take no signals by default). */
|
|
|
|
pid = kernel_thread(kthread, create, CLONE_FS | CLONE_FILES | SIGCHLD);
|
2009-06-18 07:27:43 +08:00
|
|
|
if (pid < 0) {
|
2013-11-13 07:06:45 +08:00
|
|
|
/* If user was SIGKILLed, I release the structure. */
|
|
|
|
struct completion *done = xchg(&create->done, NULL);
|
|
|
|
|
|
|
|
if (!done) {
|
|
|
|
kfree(create);
|
|
|
|
return;
|
|
|
|
}
|
2005-04-17 06:20:36 +08:00
|
|
|
create->result = ERR_PTR(pid);
|
2013-11-13 07:06:45 +08:00
|
|
|
complete(done);
|
2009-06-18 07:27:43 +08:00
|
|
|
}
|
2005-04-17 06:20:36 +08:00
|
|
|
}
|
|
|
|
|
2016-10-12 04:55:27 +08:00
|
|
|
static struct task_struct *__kthread_create_on_node(int (*threadfn)(void *data),
|
|
|
|
void *data, int node,
|
|
|
|
const char namefmt[],
|
|
|
|
va_list args)
|
2005-04-17 06:20:36 +08:00
|
|
|
{
|
2013-11-13 07:06:45 +08:00
|
|
|
DECLARE_COMPLETION_ONSTACK(done);
|
|
|
|
struct task_struct *task;
|
|
|
|
struct kthread_create_info *create = kmalloc(sizeof(*create),
|
|
|
|
GFP_KERNEL);
|
|
|
|
|
|
|
|
if (!create)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
create->threadfn = threadfn;
|
|
|
|
create->data = data;
|
|
|
|
create->node = node;
|
|
|
|
create->done = &done;
|
2007-05-09 17:34:32 +08:00
|
|
|
|
|
|
|
spin_lock(&kthread_create_lock);
|
2013-11-13 07:06:45 +08:00
|
|
|
list_add_tail(&create->list, &kthread_create_list);
|
2007-05-09 17:34:32 +08:00
|
|
|
spin_unlock(&kthread_create_lock);
|
|
|
|
|
2008-04-29 15:59:23 +08:00
|
|
|
wake_up_process(kthreadd_task);
|
2013-11-13 07:06:45 +08:00
|
|
|
/*
|
|
|
|
* Wait for completion in killable state, for I might be chosen by
|
|
|
|
* the OOM killer while kthreadd is trying to allocate memory for
|
|
|
|
* new kernel thread.
|
|
|
|
*/
|
|
|
|
if (unlikely(wait_for_completion_killable(&done))) {
|
|
|
|
/*
|
|
|
|
* If I was SIGKILLed before kthreadd (or new kernel thread)
|
|
|
|
* calls complete(), leave the cleanup of this structure to
|
|
|
|
* that thread.
|
|
|
|
*/
|
|
|
|
if (xchg(&create->done, NULL))
|
2014-06-05 07:05:36 +08:00
|
|
|
return ERR_PTR(-EINTR);
|
2013-11-13 07:06:45 +08:00
|
|
|
/*
|
|
|
|
* kthreadd (or new kernel thread) will call complete()
|
|
|
|
* shortly.
|
|
|
|
*/
|
|
|
|
wait_for_completion(&done);
|
|
|
|
}
|
|
|
|
task = create->result;
|
|
|
|
if (!IS_ERR(task)) {
|
2011-01-07 20:41:40 +08:00
|
|
|
static const struct sched_param param = { .sched_priority = 0 };
|
2009-04-09 23:50:36 +08:00
|
|
|
|
2013-11-13 07:06:45 +08:00
|
|
|
vsnprintf(task->comm, sizeof(task->comm), namefmt, args);
|
2009-04-09 23:50:36 +08:00
|
|
|
/*
|
|
|
|
* root may have changed our (kthreadd's) priority or CPU mask.
|
|
|
|
* The kernel thread should not inherit these properties.
|
|
|
|
*/
|
2013-11-13 07:06:45 +08:00
|
|
|
sched_setscheduler_nocheck(task, SCHED_NORMAL, ¶m);
|
|
|
|
set_cpus_allowed_ptr(task, cpu_all_mask);
|
2005-04-17 06:20:36 +08:00
|
|
|
}
|
2013-11-13 07:06:45 +08:00
|
|
|
kfree(create);
|
|
|
|
return task;
|
2005-04-17 06:20:36 +08:00
|
|
|
}
|
2016-10-12 04:55:27 +08:00
|
|
|
|
|
|
|
/**
|
|
|
|
* kthread_create_on_node - create a kthread.
|
|
|
|
* @threadfn: the function to run until signal_pending(current).
|
|
|
|
* @data: data ptr for @threadfn.
|
|
|
|
* @node: task and thread structures for the thread are allocated on this node
|
|
|
|
* @namefmt: printf-style name for the thread.
|
|
|
|
*
|
|
|
|
* Description: This helper function creates and names a kernel
|
|
|
|
* thread. The thread will be stopped: use wake_up_process() to start
|
|
|
|
* it. See also kthread_run(). The new thread has SCHED_NORMAL policy and
|
|
|
|
* is affine to all CPUs.
|
|
|
|
*
|
|
|
|
* If thread is going to be bound on a particular cpu, give its node
|
|
|
|
* in @node, to get NUMA affinity for kthread stack, or else give NUMA_NO_NODE.
|
|
|
|
* When woken, the thread will run @threadfn() with @data as its
|
|
|
|
* argument. @threadfn() can either call do_exit() directly if it is a
|
|
|
|
* standalone thread for which no one will call kthread_stop(), or
|
|
|
|
* return when 'kthread_should_stop()' is true (which means
|
|
|
|
* kthread_stop() has been called). The return value should be zero
|
|
|
|
* or a negative error number; it will be passed to kthread_stop().
|
|
|
|
*
|
|
|
|
* Returns a task_struct or ERR_PTR(-ENOMEM) or ERR_PTR(-EINTR).
|
|
|
|
*/
|
|
|
|
struct task_struct *kthread_create_on_node(int (*threadfn)(void *data),
|
|
|
|
void *data, int node,
|
|
|
|
const char namefmt[],
|
|
|
|
...)
|
|
|
|
{
|
|
|
|
struct task_struct *task;
|
|
|
|
va_list args;
|
|
|
|
|
|
|
|
va_start(args, namefmt);
|
|
|
|
task = __kthread_create_on_node(threadfn, data, node, namefmt, args);
|
|
|
|
va_end(args);
|
|
|
|
|
|
|
|
return task;
|
|
|
|
}
|
2011-03-23 07:30:44 +08:00
|
|
|
EXPORT_SYMBOL(kthread_create_on_node);
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2015-05-15 23:43:34 +08:00
|
|
|
static void __kthread_bind_mask(struct task_struct *p, const struct cpumask *mask, long state)
|
2012-07-16 18:42:36 +08:00
|
|
|
{
|
2015-05-15 23:43:34 +08:00
|
|
|
unsigned long flags;
|
|
|
|
|
2013-04-09 15:33:34 +08:00
|
|
|
if (!wait_task_inactive(p, state)) {
|
|
|
|
WARN_ON(1);
|
|
|
|
return;
|
|
|
|
}
|
2015-05-15 23:43:34 +08:00
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
/* It's safe because the task is inactive. */
|
2015-05-15 23:43:34 +08:00
|
|
|
raw_spin_lock_irqsave(&p->pi_lock, flags);
|
|
|
|
do_set_cpus_allowed(p, mask);
|
2013-03-20 04:45:20 +08:00
|
|
|
p->flags |= PF_NO_SETAFFINITY;
|
2015-05-15 23:43:34 +08:00
|
|
|
raw_spin_unlock_irqrestore(&p->pi_lock, flags);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Single-CPU form of __kthread_bind_mask(): bind @p to @cpu only. */
static void __kthread_bind(struct task_struct *p, unsigned int cpu, long state)
{
	const struct cpumask *only_cpu = cpumask_of(cpu);

	__kthread_bind_mask(p, only_cpu, state);
}
|
|
|
|
|
|
|
|
void kthread_bind_mask(struct task_struct *p, const struct cpumask *mask)
|
|
|
|
{
|
|
|
|
__kthread_bind_mask(p, mask, TASK_UNINTERRUPTIBLE);
|
2012-07-16 18:42:36 +08:00
|
|
|
}
|
|
|
|
|
2009-12-17 01:04:39 +08:00
|
|
|
/**
|
|
|
|
* kthread_bind - bind a just-created kthread to a cpu.
|
|
|
|
* @p: thread created by kthread_create().
|
|
|
|
* @cpu: cpu (might not be online, must be possible) for @k to run on.
|
|
|
|
*
|
|
|
|
* Description: This function is equivalent to set_cpus_allowed(),
|
|
|
|
* except that @cpu doesn't need to be online, and the thread must be
|
|
|
|
* stopped (i.e., just returned from kthread_create()).
|
|
|
|
*/
|
|
|
|
void kthread_bind(struct task_struct *p, unsigned int cpu)
|
|
|
|
{
|
2013-04-09 15:33:34 +08:00
|
|
|
__kthread_bind(p, cpu, TASK_UNINTERRUPTIBLE);
|
2009-12-17 01:04:39 +08:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kthread_bind);
|
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
/**
|
|
|
|
* kthread_create_on_cpu - Create a cpu bound kthread
|
|
|
|
* @threadfn: the function to run until signal_pending(current).
|
|
|
|
* @data: data ptr for @threadfn.
|
|
|
|
* @cpu: The cpu on which the thread should be bound,
|
|
|
|
* @namefmt: printf-style name for the thread. Format is restricted
|
|
|
|
* to "name.*%u". Code fills in cpu number.
|
|
|
|
*
|
|
|
|
* Description: This helper function creates and names a kernel thread
|
|
|
|
* The thread will be woken and put into park mode.
|
|
|
|
*/
|
|
|
|
struct task_struct *kthread_create_on_cpu(int (*threadfn)(void *data),
|
|
|
|
void *data, unsigned int cpu,
|
|
|
|
const char *namefmt)
|
|
|
|
{
|
|
|
|
struct task_struct *p;
|
|
|
|
|
2014-10-10 06:26:18 +08:00
|
|
|
p = kthread_create_on_node(threadfn, data, cpu_to_node(cpu), namefmt,
|
2012-07-16 18:42:36 +08:00
|
|
|
cpu);
|
|
|
|
if (IS_ERR(p))
|
|
|
|
return p;
|
2016-10-12 04:55:23 +08:00
|
|
|
kthread_bind(p, cpu);
|
|
|
|
/* CPU hotplug need to bind once again when unparking the thread. */
|
2012-07-16 18:42:36 +08:00
|
|
|
set_bit(KTHREAD_IS_PER_CPU, &to_kthread(p)->flags);
|
|
|
|
to_kthread(p)->cpu = cpu;
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
2013-04-09 15:33:34 +08:00
|
|
|
static void __kthread_unpark(struct task_struct *k, struct kthread *kthread)
|
|
|
|
{
|
|
|
|
clear_bit(KTHREAD_SHOULD_PARK, &kthread->flags);
|
|
|
|
/*
|
|
|
|
* We clear the IS_PARKED bit here as we don't wait
|
|
|
|
* until the task has left the park code. So if we'd
|
|
|
|
* park before that happens we'd see the IS_PARKED bit
|
|
|
|
* which might be about to be cleared.
|
|
|
|
*/
|
|
|
|
if (test_and_clear_bit(KTHREAD_IS_PARKED, &kthread->flags)) {
|
2016-10-12 04:55:23 +08:00
|
|
|
/*
|
|
|
|
* Newly created kthread was parked when the CPU was offline.
|
|
|
|
* The binding was lost and we need to set it again.
|
|
|
|
*/
|
2013-04-09 15:33:34 +08:00
|
|
|
if (test_bit(KTHREAD_IS_PER_CPU, &kthread->flags))
|
|
|
|
__kthread_bind(k, kthread->cpu, TASK_PARKED);
|
|
|
|
wake_up_state(k, TASK_PARKED);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-07-16 18:42:36 +08:00
|
|
|
/**
 * kthread_unpark - unpark a thread created by kthread_create().
 * @k: thread created by kthread_create().
 *
 * Sets kthread_should_park() for @k to return false, wakes it, and
 * waits for it to return. If the thread is marked percpu then it is
 * bound to the cpu again.
 *
 * Does nothing when to_live_kthread() cannot obtain a live kthread for @k.
 */
void kthread_unpark(struct task_struct *k)
{
	struct kthread *live = to_live_kthread(k);

	if (!live)
		return;

	__kthread_unpark(k, live);
	/* Drop the stack reference taken by to_live_kthread(). */
	put_task_stack(k);
}
EXPORT_SYMBOL_GPL(kthread_unpark);
|
2012-07-16 18:42:36 +08:00
|
|
|
|
|
|
|
/**
|
|
|
|
* kthread_park - park a thread created by kthread_create().
|
|
|
|
* @k: thread created by kthread_create().
|
|
|
|
*
|
|
|
|
* Sets kthread_should_park() for @k to return true, wakes it, and
|
|
|
|
* waits for it to return. This can also be called after kthread_create()
|
|
|
|
* instead of calling wake_up_process(): the thread will park without
|
|
|
|
* calling threadfn().
|
|
|
|
*
|
|
|
|
* Returns 0 if the thread is parked, -ENOSYS if the thread exited.
|
|
|
|
* If called by the kthread itself just the park bit is set.
|
|
|
|
*/
|
|
|
|
int kthread_park(struct task_struct *k)
|
|
|
|
{
|
2013-04-30 06:05:12 +08:00
|
|
|
struct kthread *kthread = to_live_kthread(k);
|
2012-07-16 18:42:36 +08:00
|
|
|
int ret = -ENOSYS;
|
|
|
|
|
|
|
|
if (kthread) {
|
|
|
|
if (!test_bit(KTHREAD_IS_PARKED, &kthread->flags)) {
|
|
|
|
set_bit(KTHREAD_SHOULD_PARK, &kthread->flags);
|
|
|
|
if (k != current) {
|
|
|
|
wake_up_process(k);
|
|
|
|
wait_for_completion(&kthread->parked);
|
|
|
|
}
|
|
|
|
}
|
2016-09-16 13:45:44 +08:00
|
|
|
put_task_stack(k);
|
2012-07-16 18:42:36 +08:00
|
|
|
ret = 0;
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
2015-08-07 06:46:45 +08:00
|
|
|
EXPORT_SYMBOL_GPL(kthread_park);
|
2012-07-16 18:42:36 +08:00
|
|
|
|
2006-06-25 20:49:19 +08:00
|
|
|
/**
|
|
|
|
* kthread_stop - stop a thread created by kthread_create().
|
|
|
|
* @k: thread created by kthread_create().
|
|
|
|
*
|
|
|
|
* Sets kthread_should_stop() for @k to return true, wakes it, and
|
2009-06-19 08:51:13 +08:00
|
|
|
* waits for it to exit. This can also be called after kthread_create()
|
|
|
|
* instead of calling wake_up_process(): the thread will exit without
|
|
|
|
* calling threadfn().
|
|
|
|
*
|
|
|
|
* If threadfn() may call do_exit() itself, the caller must ensure
|
|
|
|
* task_struct can't go away.
|
2006-06-25 20:49:19 +08:00
|
|
|
*
|
|
|
|
* Returns the result of threadfn(), or %-EINTR if wake_up_process()
|
|
|
|
* was never called.
|
|
|
|
*/
|
2005-04-17 06:20:36 +08:00
|
|
|
int kthread_stop(struct task_struct *k)
|
|
|
|
{
|
2013-04-30 06:05:12 +08:00
|
|
|
struct kthread *kthread;
|
2005-04-17 06:20:36 +08:00
|
|
|
int ret;
|
|
|
|
|
tracing, sched: LTTng instrumentation - scheduler
Instrument the scheduler activity (sched_switch, migration, wakeups,
wait for a task, signal delivery) and process/thread
creation/destruction (fork, exit, kthread stop). Actually, kthread
creation is not instrumented in this patch because it is architecture
dependent. It allows to connect tracers such as ftrace which detects
scheduling latencies, good/bad scheduler decisions. Tools like LTTng can
export this scheduler information along with instrumentation of the rest
of the kernel activity to perform post-mortem analysis on the scheduler
activity.
About the performance impact of tracepoints (which is comparable to
markers), even without immediate values optimizations, tests done by
Hideo Aoki on ia64 show no regression. His test case was using hackbench
on a kernel where scheduler instrumentation (about 5 events in code
scheduler code) was added. See the "Tracepoints" patch header for
performance result detail.
Changelog :
- Change instrumentation location and parameter to match ftrace
instrumentation, previously done with kernel markers.
[ mingo@elte.hu: conflict resolutions ]
Signed-off-by: Mathieu Desnoyers <mathieu.desnoyers@polymtl.ca>
Acked-by: 'Peter Zijlstra' <peterz@infradead.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-07-19 00:16:17 +08:00
|
|
|
trace_sched_kthread_stop(k);
|
2013-04-30 06:05:12 +08:00
|
|
|
|
|
|
|
get_task_struct(k);
|
|
|
|
kthread = to_live_kthread(k);
|
2012-07-16 18:42:36 +08:00
|
|
|
if (kthread) {
|
|
|
|
set_bit(KTHREAD_SHOULD_STOP, &kthread->flags);
|
2013-04-09 15:33:34 +08:00
|
|
|
__kthread_unpark(k, kthread);
|
2009-06-18 07:27:45 +08:00
|
|
|
wake_up_process(k);
|
|
|
|
wait_for_completion(&kthread->exited);
|
2016-09-16 13:45:44 +08:00
|
|
|
put_task_stack(k);
|
2009-06-18 07:27:45 +08:00
|
|
|
}
|
|
|
|
ret = k->exit_code;
|
2005-04-17 06:20:36 +08:00
|
|
|
put_task_struct(k);
|
tracing, sched: LTTng instrumentation - scheduler
Instrument the scheduler activity (sched_switch, migration, wakeups,
wait for a task, signal delivery) and process/thread
creation/destruction (fork, exit, kthread stop). Actually, kthread
creation is not instrumented in this patch because it is architecture
dependent. It allows to connect tracers such as ftrace which detects
scheduling latencies, good/bad scheduler decisions. Tools like LTTng can
export this scheduler information along with instrumentation of the rest
of the kernel activity to perform post-mortem analysis on the scheduler
activity.
About the performance impact of tracepoints (which is comparable to
markers), even without immediate values optimizations, tests done by
Hideo Aoki on ia64 show no regression. His test case was using hackbench
on a kernel where scheduler instrumentation (about 5 events in code
scheduler code) was added. See the "Tracepoints" patch header for
performance result detail.
Changelog :
- Change instrumentation location and parameter to match ftrace
instrumentation, previously done with kernel markers.
[ mingo@elte.hu: conflict resolutions ]
Signed-off-by: Mathieu Desnoyers <mathieu.desnoyers@polymtl.ca>
Acked-by: 'Peter Zijlstra' <peterz@infradead.org>
Signed-off-by: Ingo Molnar <mingo@elte.hu>
2008-07-19 00:16:17 +08:00
|
|
|
|
2013-04-30 06:05:12 +08:00
|
|
|
trace_sched_kthread_stop_ret(ret);
|
2005-04-17 06:20:36 +08:00
|
|
|
return ret;
|
|
|
|
}
|
2006-07-14 15:24:05 +08:00
|
|
|
EXPORT_SYMBOL(kthread_stop);
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2007-07-31 15:39:16 +08:00
|
|
|
int kthreadd(void *unused)
|
2005-04-17 06:20:36 +08:00
|
|
|
{
|
2007-05-09 17:34:32 +08:00
|
|
|
struct task_struct *tsk = current;
|
2005-04-17 06:20:36 +08:00
|
|
|
|
2007-07-31 15:39:16 +08:00
|
|
|
/* Setup a clean context for our children to inherit. */
|
2007-05-09 17:34:32 +08:00
|
|
|
set_task_comm(tsk, "kthreadd");
|
2007-05-09 17:34:37 +08:00
|
|
|
ignore_signals(tsk);
|
2009-03-31 12:05:10 +08:00
|
|
|
set_cpus_allowed_ptr(tsk, cpu_all_mask);
|
2012-12-13 05:51:39 +08:00
|
|
|
set_mems_allowed(node_states[N_MEMORY]);
|
2007-05-09 17:34:32 +08:00
|
|
|
|
2011-11-24 01:28:17 +08:00
|
|
|
current->flags |= PF_NOFREEZE;
|
2007-05-09 17:34:32 +08:00
|
|
|
|
|
|
|
for (;;) {
|
|
|
|
set_current_state(TASK_INTERRUPTIBLE);
|
|
|
|
if (list_empty(&kthread_create_list))
|
|
|
|
schedule();
|
|
|
|
__set_current_state(TASK_RUNNING);
|
|
|
|
|
|
|
|
spin_lock(&kthread_create_lock);
|
|
|
|
while (!list_empty(&kthread_create_list)) {
|
|
|
|
struct kthread_create_info *create;
|
|
|
|
|
|
|
|
create = list_entry(kthread_create_list.next,
|
|
|
|
struct kthread_create_info, list);
|
|
|
|
list_del_init(&create->list);
|
|
|
|
spin_unlock(&kthread_create_lock);
|
|
|
|
|
|
|
|
create_kthread(create);
|
|
|
|
|
|
|
|
spin_lock(&kthread_create_lock);
|
|
|
|
}
|
|
|
|
spin_unlock(&kthread_create_lock);
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
2010-06-29 16:07:09 +08:00
|
|
|
|
2016-10-12 04:55:20 +08:00
|
|
|
void __kthread_init_worker(struct kthread_worker *worker,
|
2010-12-22 17:27:53 +08:00
|
|
|
const char *name,
|
|
|
|
struct lock_class_key *key)
|
|
|
|
{
|
|
|
|
spin_lock_init(&worker->lock);
|
|
|
|
lockdep_set_class_and_name(&worker->lock, key, name);
|
|
|
|
INIT_LIST_HEAD(&worker->work_list);
|
2016-10-12 04:55:40 +08:00
|
|
|
INIT_LIST_HEAD(&worker->delayed_work_list);
|
2010-12-22 17:27:53 +08:00
|
|
|
worker->task = NULL;
|
|
|
|
}
|
2016-10-12 04:55:20 +08:00
|
|
|
EXPORT_SYMBOL_GPL(__kthread_init_worker);
|
2010-12-22 17:27:53 +08:00
|
|
|
|
2010-06-29 16:07:09 +08:00
|
|
|
/**
|
|
|
|
* kthread_worker_fn - kthread function to process kthread_worker
|
|
|
|
* @worker_ptr: pointer to initialized kthread_worker
|
|
|
|
*
|
kthread: add kthread_create_worker*()
Kthread workers are currently created using the classic kthread API,
namely kthread_run(). kthread_worker_fn() is passed as the @threadfn
parameter.
This patch defines kthread_create_worker() and
kthread_create_worker_on_cpu() functions that hide implementation details.
They enforce using kthread_worker_fn() for the main thread. But I doubt
that there are any plans to create any alternative. In fact, I think that
we do not want any alternative main thread because it would be hard to
support consistency with the rest of the kthread worker API.
The naming and function of kthread_create_worker() is inspired by the
workqueues API like the rest of the kthread worker API.
The kthread_create_worker_on_cpu() variant is motivated by the original
kthread_create_on_cpu(). Note that we need to bind per-CPU kthread
workers already when they are created. It makes the life easier.
kthread_bind() could not be used later for an already running worker.
This patch does _not_ convert existing kthread workers. The kthread
worker API need more improvements first, e.g. a function to destroy the
worker.
IMPORTANT:
kthread_create_worker_on_cpu() allows to use any format of the worker
name, in compare with kthread_create_on_cpu(). The good thing is that it
is more generic. The bad thing is that most users will need to pass the
cpu number in two parameters, e.g. kthread_create_worker_on_cpu(cpu,
"helper/%d", cpu).
To be honest, the main motivation was to avoid the need for an empty
va_list. The only legal way was to create a helper function that would be
called with an empty list. Other attempts caused compilation warnings or
even errors on different architectures.
There were also other alternatives, for example, using #define or
splitting __kthread_create_worker(). The used solution looked like the
least ugly.
Link: http://lkml.kernel.org/r/1470754545-17632-6-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:30 +08:00
|
|
|
* This function implements the main cycle of kthread worker. It processes
|
|
|
|
* work_list until it is stopped with kthread_stop(). It sleeps when the queue
|
|
|
|
* is empty.
|
2010-06-29 16:07:09 +08:00
|
|
|
*
|
kthread: add kthread_create_worker*()
Kthread workers are currently created using the classic kthread API,
namely kthread_run(). kthread_worker_fn() is passed as the @threadfn
parameter.
This patch defines kthread_create_worker() and
kthread_create_worker_on_cpu() functions that hide implementation details.
They enforce using kthread_worker_fn() for the main thread. But I doubt
that there are any plans to create any alternative. In fact, I think that
we do not want any alternative main thread because it would be hard to
support consistency with the rest of the kthread worker API.
The naming and function of kthread_create_worker() is inspired by the
workqueues API like the rest of the kthread worker API.
The kthread_create_worker_on_cpu() variant is motivated by the original
kthread_create_on_cpu(). Note that we need to bind per-CPU kthread
workers already when they are created. It makes the life easier.
kthread_bind() could not be used later for an already running worker.
This patch does _not_ convert existing kthread workers. The kthread
worker API need more improvements first, e.g. a function to destroy the
worker.
IMPORTANT:
kthread_create_worker_on_cpu() allows to use any format of the worker
name, in compare with kthread_create_on_cpu(). The good thing is that it
is more generic. The bad thing is that most users will need to pass the
cpu number in two parameters, e.g. kthread_create_worker_on_cpu(cpu,
"helper/%d", cpu).
To be honest, the main motivation was to avoid the need for an empty
va_list. The only legal way was to create a helper function that would be
called with an empty list. Other attempts caused compilation warnings or
even errors on different architectures.
There were also other alternatives, for example, using #define or
splitting __kthread_create_worker(). The used solution looked like the
least ugly.
Link: http://lkml.kernel.org/r/1470754545-17632-6-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:30 +08:00
|
|
|
* The works are not allowed to keep any locks, disable preemption or interrupts
|
|
|
|
* when they finish. There is defined a safe point for freezing when one work
|
|
|
|
* finishes and before a new one is started.
|
2016-10-12 04:55:36 +08:00
|
|
|
*
|
|
|
|
* Also the works must not be handled by more than one worker at the same time,
|
|
|
|
* see also kthread_queue_work().
|
2010-06-29 16:07:09 +08:00
|
|
|
*/
|
|
|
|
int kthread_worker_fn(void *worker_ptr)
|
|
|
|
{
|
|
|
|
struct kthread_worker *worker = worker_ptr;
|
|
|
|
struct kthread_work *work;
|
|
|
|
|
kthread: add kthread_create_worker*()
Kthread workers are currently created using the classic kthread API,
namely kthread_run(). kthread_worker_fn() is passed as the @threadfn
parameter.
This patch defines kthread_create_worker() and
kthread_create_worker_on_cpu() functions that hide implementation details.
They enforce using kthread_worker_fn() for the main thread. But I doubt
that there are any plans to create any alternative. In fact, I think that
we do not want any alternative main thread because it would be hard to
support consistency with the rest of the kthread worker API.
The naming and function of kthread_create_worker() is inspired by the
workqueues API like the rest of the kthread worker API.
The kthread_create_worker_on_cpu() variant is motivated by the original
kthread_create_on_cpu(). Note that we need to bind per-CPU kthread
workers already when they are created. It makes the life easier.
kthread_bind() could not be used later for an already running worker.
This patch does _not_ convert existing kthread workers. The kthread
worker API need more improvements first, e.g. a function to destroy the
worker.
IMPORTANT:
kthread_create_worker_on_cpu() allows to use any format of the worker
name, in compare with kthread_create_on_cpu(). The good thing is that it
is more generic. The bad thing is that most users will need to pass the
cpu number in two parameters, e.g. kthread_create_worker_on_cpu(cpu,
"helper/%d", cpu).
To be honest, the main motivation was to avoid the need for an empty
va_list. The only legal way was to create a helper function that would be
called with an empty list. Other attempts caused compilation warnings or
even errors on different architectures.
There were also other alternatives, for example, using #define or
splitting __kthread_create_worker(). The used solution looked like the
least ugly.
Link: http://lkml.kernel.org/r/1470754545-17632-6-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:30 +08:00
|
|
|
/*
|
|
|
|
* FIXME: Update the check and remove the assignment when all kthread
|
|
|
|
* worker users are created using kthread_create_worker*() functions.
|
|
|
|
*/
|
|
|
|
WARN_ON(worker->task && worker->task != current);
|
2010-06-29 16:07:09 +08:00
|
|
|
worker->task = current;
|
|
|
|
repeat:
|
|
|
|
set_current_state(TASK_INTERRUPTIBLE); /* mb paired w/ kthread_stop */
|
|
|
|
|
|
|
|
if (kthread_should_stop()) {
|
|
|
|
__set_current_state(TASK_RUNNING);
|
|
|
|
spin_lock_irq(&worker->lock);
|
|
|
|
worker->task = NULL;
|
|
|
|
spin_unlock_irq(&worker->lock);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
work = NULL;
|
|
|
|
spin_lock_irq(&worker->lock);
|
|
|
|
if (!list_empty(&worker->work_list)) {
|
|
|
|
work = list_first_entry(&worker->work_list,
|
|
|
|
struct kthread_work, node);
|
|
|
|
list_del_init(&work->node);
|
|
|
|
}
|
2012-07-20 04:52:53 +08:00
|
|
|
worker->current_work = work;
|
2010-06-29 16:07:09 +08:00
|
|
|
spin_unlock_irq(&worker->lock);
|
|
|
|
|
|
|
|
if (work) {
|
|
|
|
__set_current_state(TASK_RUNNING);
|
|
|
|
work->func(work);
|
|
|
|
} else if (!freezing(current))
|
|
|
|
schedule();
|
|
|
|
|
|
|
|
try_to_freeze();
|
|
|
|
goto repeat;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(kthread_worker_fn);
|
|
|
|
|
kthread: add kthread_create_worker*()
Kthread workers are currently created using the classic kthread API,
namely kthread_run(). kthread_worker_fn() is passed as the @threadfn
parameter.
This patch defines kthread_create_worker() and
kthread_create_worker_on_cpu() functions that hide implementation details.
They enforce using kthread_worker_fn() for the main thread. But I doubt
that there are any plans to create any alternative. In fact, I think that
we do not want any alternative main thread because it would be hard to
support consistency with the rest of the kthread worker API.
The naming and function of kthread_create_worker() is inspired by the
workqueues API like the rest of the kthread worker API.
The kthread_create_worker_on_cpu() variant is motivated by the original
kthread_create_on_cpu(). Note that we need to bind per-CPU kthread
workers already when they are created. It makes the life easier.
kthread_bind() could not be used later for an already running worker.
This patch does _not_ convert existing kthread workers. The kthread
worker API need more improvements first, e.g. a function to destroy the
worker.
IMPORTANT:
kthread_create_worker_on_cpu() allows to use any format of the worker
name, in compare with kthread_create_on_cpu(). The good thing is that it
is more generic. The bad thing is that most users will need to pass the
cpu number in two parameters, e.g. kthread_create_worker_on_cpu(cpu,
"helper/%d", cpu).
To be honest, the main motivation was to avoid the need for an empty
va_list. The only legal way was to create a helper function that would be
called with an empty list. Other attempts caused compilation warnings or
even errors on different architectures.
There were also other alternatives, for example, using #define or
splitting __kthread_create_worker(). The used solution looked like the
least ugly.
Link: http://lkml.kernel.org/r/1470754545-17632-6-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:30 +08:00
|
|
|
static struct kthread_worker *
|
|
|
|
__kthread_create_worker(int cpu, const char namefmt[], va_list args)
|
|
|
|
{
|
|
|
|
struct kthread_worker *worker;
|
|
|
|
struct task_struct *task;
|
|
|
|
|
|
|
|
worker = kzalloc(sizeof(*worker), GFP_KERNEL);
|
|
|
|
if (!worker)
|
|
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
|
|
|
|
kthread_init_worker(worker);
|
|
|
|
|
|
|
|
if (cpu >= 0) {
|
|
|
|
char name[TASK_COMM_LEN];
|
|
|
|
|
|
|
|
/*
|
|
|
|
* kthread_create_worker_on_cpu() allows to pass a generic
|
|
|
|
* namefmt in compare with kthread_create_on_cpu. We need
|
|
|
|
* to format it here.
|
|
|
|
*/
|
|
|
|
vsnprintf(name, sizeof(name), namefmt, args);
|
|
|
|
task = kthread_create_on_cpu(kthread_worker_fn, worker,
|
|
|
|
cpu, name);
|
|
|
|
} else {
|
|
|
|
task = __kthread_create_on_node(kthread_worker_fn, worker,
|
|
|
|
-1, namefmt, args);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (IS_ERR(task))
|
|
|
|
goto fail_task;
|
|
|
|
|
|
|
|
worker->task = task;
|
|
|
|
wake_up_process(task);
|
|
|
|
return worker;
|
|
|
|
|
|
|
|
fail_task:
|
|
|
|
kfree(worker);
|
|
|
|
return ERR_CAST(task);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * kthread_create_worker - create a kthread worker
 * @namefmt: printf-style name for the kthread worker (task).
 *
 * The worker is not bound to any particular CPU.
 *
 * Returns a pointer to the allocated worker on success, ERR_PTR(-ENOMEM)
 * when the needed structures could not get allocated, and ERR_PTR(-EINTR)
 * when the worker was SIGKILLed.
 */
struct kthread_worker *
kthread_create_worker(const char namefmt[], ...)
{
	struct kthread_worker *created;
	va_list ap;

	va_start(ap, namefmt);
	/* A negative CPU number asks for an unbound worker. */
	created = __kthread_create_worker(-1, namefmt, ap);
	va_end(ap);

	return created;
}
EXPORT_SYMBOL(kthread_create_worker);
|
|
|
|
|
|
|
|
/**
 * kthread_create_worker_on_cpu - create a kthread worker and bind it
 *	to a given CPU and the associated NUMA node.
 * @cpu: CPU number
 * @namefmt: printf-style name for the kthread worker (task).
 *
 * Use a valid CPU number if you want to bind the kthread worker
 * to the given CPU and the associated NUMA node.
 *
 * A good practice is to add the cpu number also into the worker name.
 * For example, use kthread_create_worker_on_cpu(cpu, "helper/%d", cpu).
 *
 * Returns a pointer to the allocated worker on success, ERR_PTR(-ENOMEM)
 * when the needed structures could not get allocated, and ERR_PTR(-EINTR)
 * when the worker was SIGKILLed.
 */
struct kthread_worker *
kthread_create_worker_on_cpu(int cpu, const char namefmt[], ...)
{
	struct kthread_worker *created;
	va_list ap;

	va_start(ap, namefmt);
	created = __kthread_create_worker(cpu, namefmt, ap);
	va_end(ap);

	return created;
}
EXPORT_SYMBOL(kthread_create_worker_on_cpu);
|
|
|
|
|
kthread: allow to cancel kthread work
We are going to use kthread workers more widely and sometimes we will need
to make sure that the work is neither pending nor running.
This patch implements cancel_*_sync() operations as inspired by
workqueues. Well, we are synchronized against the other operations via
the worker lock, we use del_timer_sync() and a counter to count parallel
cancel operations. Therefore the implementation might be easier.
First, we check if a worker is assigned. If not, the work has never been
queued after it was initialized.
Second, we take the worker lock. It must be the right one. The work must
not be assigned to another worker unless it is initialized in between.
Third, we try to cancel the timer when it exists. The timer is deleted
synchronously to make sure that the timer call back is not running. We
need to temporarily release the worker->lock to avoid a possible deadlock
with the callback. In the meantime, we set work->canceling counter to
avoid any queuing.
Fourth, we try to remove the work from a worker list. It might be
the list of either normal or delayed works.
Fifth, if the work is running, we call kthread_flush_work(). It might
take an arbitrary time. We need to release the worker-lock again. In the
meantime, we again block any queuing by the canceling counter.
As already mentioned, the check for a pending kthread work is done under a
lock. In compare with workqueues, we do not need to fight for a single
PENDING bit to block other operations. Therefore we do not suffer from
the thundering storm problem and all parallel canceling jobs might use
kthread_flush_work(). Any queuing is blocked until the counter gets zero.
Link: http://lkml.kernel.org/r/1470754545-17632-10-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:43 +08:00
|
|
|
/*
|
|
|
|
* Returns true when the work could not be queued at the moment.
|
|
|
|
* It happens when it is already pending in a worker list
|
|
|
|
* or when it is being cancelled.
|
|
|
|
*/
|
|
|
|
static inline bool queuing_blocked(struct kthread_worker *worker,
|
|
|
|
struct kthread_work *work)
|
|
|
|
{
|
|
|
|
lockdep_assert_held(&worker->lock);
|
|
|
|
|
|
|
|
return !list_empty(&work->node) || work->canceling;
|
|
|
|
}
|
|
|
|
|
2016-10-12 04:55:36 +08:00
|
|
|
static void kthread_insert_work_sanity_check(struct kthread_worker *worker,
|
|
|
|
struct kthread_work *work)
|
|
|
|
{
|
|
|
|
lockdep_assert_held(&worker->lock);
|
|
|
|
WARN_ON_ONCE(!list_empty(&work->node));
|
|
|
|
/* Do not use a work with >1 worker, see kthread_queue_work() */
|
|
|
|
WARN_ON_ONCE(work->worker && work->worker != worker);
|
|
|
|
}
|
|
|
|
|
2012-07-20 04:52:53 +08:00
|
|
|
/* insert @work before @pos in @worker */
|
2016-10-12 04:55:20 +08:00
|
|
|
static void kthread_insert_work(struct kthread_worker *worker,
|
2016-10-12 04:55:36 +08:00
|
|
|
struct kthread_work *work,
|
|
|
|
struct list_head *pos)
|
2012-07-20 04:52:53 +08:00
|
|
|
{
|
2016-10-12 04:55:36 +08:00
|
|
|
kthread_insert_work_sanity_check(worker, work);
|
2012-07-20 04:52:53 +08:00
|
|
|
|
|
|
|
list_add_tail(&work->node, pos);
|
2012-07-20 04:52:53 +08:00
|
|
|
work->worker = worker;
|
2014-07-26 12:03:59 +08:00
|
|
|
if (!worker->current_work && likely(worker->task))
|
2012-07-20 04:52:53 +08:00
|
|
|
wake_up_process(worker->task);
|
|
|
|
}
|
|
|
|
|
2010-06-29 16:07:09 +08:00
|
|
|
/**
|
2016-10-12 04:55:20 +08:00
|
|
|
* kthread_queue_work - queue a kthread_work
|
2010-06-29 16:07:09 +08:00
|
|
|
* @worker: target kthread_worker
|
|
|
|
* @work: kthread_work to queue
|
|
|
|
*
|
|
|
|
* Queue @work to work processor @task for async execution. @task
|
|
|
|
* must have been created with kthread_worker_create(). Returns %true
|
|
|
|
* if @work was successfully queued, %false if it was already pending.
|
2016-10-12 04:55:36 +08:00
|
|
|
*
|
|
|
|
* Reinitialize the work if it needs to be used by another worker.
|
|
|
|
* For example, when the worker was stopped and started again.
|
2010-06-29 16:07:09 +08:00
|
|
|
*/
|
2016-10-12 04:55:20 +08:00
|
|
|
bool kthread_queue_work(struct kthread_worker *worker,
|
2010-06-29 16:07:09 +08:00
|
|
|
struct kthread_work *work)
|
|
|
|
{
|
|
|
|
bool ret = false;
|
|
|
|
unsigned long flags;
|
|
|
|
|
|
|
|
spin_lock_irqsave(&worker->lock, flags);
|
kthread: allow to cancel kthread work
We are going to use kthread workers more widely and sometimes we will need
to make sure that the work is neither pending nor running.
This patch implements cancel_*_sync() operations as inspired by
workqueues. Well, we are synchronized against the other operations via
the worker lock, we use del_timer_sync() and a counter to count parallel
cancel operations. Therefore the implementation might be easier.
First, we check if a worker is assigned. If not, the work has newer been
queued after it was initialized.
Second, we take the worker lock. It must be the right one. The work must
not be assigned to another worker unless it is initialized in between.
Third, we try to cancel the timer when it exists. The timer is deleted
synchronously to make sure that the timer call back is not running. We
need to temporary release the worker->lock to avoid a possible deadlock
with the callback. In the meantime, we set work->canceling counter to
avoid any queuing.
Fourth, we try to remove the work from a worker list. It might be
the list of either normal or delayed works.
Fifth, if the work is running, we call kthread_flush_work(). It might
take an arbitrary time. We need to release the worker-lock again. In the
meantime, we again block any queuing by the canceling counter.
As already mentioned, the check for a pending kthread work is done under a
lock. In compare with workqueues, we do not need to fight for a single
PENDING bit to block other operations. Therefore we do not suffer from
the thundering storm problem and all parallel canceling jobs might use
kthread_flush_work(). Any queuing is blocked until the counter gets zero.
Link: http://lkml.kernel.org/r/1470754545-17632-10-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:43 +08:00
|
|
|
if (!queuing_blocked(worker, work)) {
|
2016-10-12 04:55:20 +08:00
|
|
|
kthread_insert_work(worker, work, &worker->work_list);
|
2010-06-29 16:07:09 +08:00
|
|
|
ret = true;
|
|
|
|
}
|
|
|
|
spin_unlock_irqrestore(&worker->lock, flags);
|
|
|
|
return ret;
|
|
|
|
}
|
2016-10-12 04:55:20 +08:00
|
|
|
EXPORT_SYMBOL_GPL(kthread_queue_work);
|
2010-06-29 16:07:09 +08:00
|
|
|
|
2016-10-12 04:55:40 +08:00
|
|
|
/**
|
|
|
|
* kthread_delayed_work_timer_fn - callback that queues the associated kthread
|
|
|
|
* delayed work when the timer expires.
|
|
|
|
* @__data: pointer to the data associated with the timer
|
|
|
|
*
|
|
|
|
* The format of the function is defined by struct timer_list.
|
|
|
|
* It should have been called from irqsafe timer with irq already off.
|
|
|
|
*/
|
|
|
|
void kthread_delayed_work_timer_fn(unsigned long __data)
|
|
|
|
{
|
|
|
|
struct kthread_delayed_work *dwork =
|
|
|
|
(struct kthread_delayed_work *)__data;
|
|
|
|
struct kthread_work *work = &dwork->work;
|
|
|
|
struct kthread_worker *worker = work->worker;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This might happen when a pending work is reinitialized.
|
|
|
|
* It means that it is used a wrong way.
|
|
|
|
*/
|
|
|
|
if (WARN_ON_ONCE(!worker))
|
|
|
|
return;
|
|
|
|
|
|
|
|
spin_lock(&worker->lock);
|
|
|
|
/* Work must not be used with >1 worker, see kthread_queue_work(). */
|
|
|
|
WARN_ON_ONCE(work->worker != worker);
|
|
|
|
|
|
|
|
/* Move the work from worker->delayed_work_list. */
|
|
|
|
WARN_ON_ONCE(list_empty(&work->node));
|
|
|
|
list_del_init(&work->node);
|
|
|
|
kthread_insert_work(worker, work, &worker->work_list);
|
|
|
|
|
|
|
|
spin_unlock(&worker->lock);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kthread_delayed_work_timer_fn);
|
|
|
|
|
|
|
|
void __kthread_queue_delayed_work(struct kthread_worker *worker,
|
|
|
|
struct kthread_delayed_work *dwork,
|
|
|
|
unsigned long delay)
|
|
|
|
{
|
|
|
|
struct timer_list *timer = &dwork->timer;
|
|
|
|
struct kthread_work *work = &dwork->work;
|
|
|
|
|
|
|
|
WARN_ON_ONCE(timer->function != kthread_delayed_work_timer_fn ||
|
|
|
|
timer->data != (unsigned long)dwork);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If @delay is 0, queue @dwork->work immediately. This is for
|
|
|
|
* both optimization and correctness. The earliest @timer can
|
|
|
|
* expire is on the closest next tick and delayed_work users depend
|
|
|
|
* on that there's no such delay when @delay is 0.
|
|
|
|
*/
|
|
|
|
if (!delay) {
|
|
|
|
kthread_insert_work(worker, work, &worker->work_list);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Be paranoid and try to detect possible races already now. */
|
|
|
|
kthread_insert_work_sanity_check(worker, work);
|
|
|
|
|
|
|
|
list_add(&work->node, &worker->delayed_work_list);
|
|
|
|
work->worker = worker;
|
|
|
|
timer_stats_timer_set_start_info(&dwork->timer);
|
|
|
|
timer->expires = jiffies + delay;
|
|
|
|
add_timer(timer);
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* kthread_queue_delayed_work - queue the associated kthread work
|
|
|
|
* after a delay.
|
|
|
|
* @worker: target kthread_worker
|
|
|
|
* @dwork: kthread_delayed_work to queue
|
|
|
|
* @delay: number of jiffies to wait before queuing
|
|
|
|
*
|
|
|
|
* If the work has not been pending it starts a timer that will queue
|
|
|
|
* the work after the given @delay. If @delay is zero, it queues the
|
|
|
|
* work immediately.
|
|
|
|
*
|
|
|
|
* Return: %false if the @work has already been pending. It means that
|
|
|
|
* either the timer was running or the work was queued. It returns %true
|
|
|
|
* otherwise.
|
|
|
|
*/
|
|
|
|
bool kthread_queue_delayed_work(struct kthread_worker *worker,
|
|
|
|
struct kthread_delayed_work *dwork,
|
|
|
|
unsigned long delay)
|
|
|
|
{
|
|
|
|
struct kthread_work *work = &dwork->work;
|
|
|
|
unsigned long flags;
|
|
|
|
bool ret = false;
|
|
|
|
|
|
|
|
spin_lock_irqsave(&worker->lock, flags);
|
|
|
|
|
kthread: allow to cancel kthread work
We are going to use kthread workers more widely and sometimes we will need
to make sure that the work is neither pending nor running.
This patch implements cancel_*_sync() operations as inspired by
workqueues. Well, we are synchronized against the other operations via
the worker lock, we use del_timer_sync() and a counter to count parallel
cancel operations. Therefore the implementation might be easier.
First, we check if a worker is assigned. If not, the work has newer been
queued after it was initialized.
Second, we take the worker lock. It must be the right one. The work must
not be assigned to another worker unless it is initialized in between.
Third, we try to cancel the timer when it exists. The timer is deleted
synchronously to make sure that the timer call back is not running. We
need to temporary release the worker->lock to avoid a possible deadlock
with the callback. In the meantime, we set work->canceling counter to
avoid any queuing.
Fourth, we try to remove the work from a worker list. It might be
the list of either normal or delayed works.
Fifth, if the work is running, we call kthread_flush_work(). It might
take an arbitrary time. We need to release the worker-lock again. In the
meantime, we again block any queuing by the canceling counter.
As already mentioned, the check for a pending kthread work is done under a
lock. In compare with workqueues, we do not need to fight for a single
PENDING bit to block other operations. Therefore we do not suffer from
the thundering storm problem and all parallel canceling jobs might use
kthread_flush_work(). Any queuing is blocked until the counter gets zero.
Link: http://lkml.kernel.org/r/1470754545-17632-10-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:43 +08:00
|
|
|
if (!queuing_blocked(worker, work)) {
|
2016-10-12 04:55:40 +08:00
|
|
|
__kthread_queue_delayed_work(worker, dwork, delay);
|
|
|
|
ret = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
spin_unlock_irqrestore(&worker->lock, flags);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(kthread_queue_delayed_work);
|
|
|
|
|
2012-07-20 04:52:53 +08:00
|
|
|
struct kthread_flush_work {
|
|
|
|
struct kthread_work work;
|
|
|
|
struct completion done;
|
|
|
|
};
|
|
|
|
|
|
|
|
static void kthread_flush_work_fn(struct kthread_work *work)
|
|
|
|
{
|
|
|
|
struct kthread_flush_work *fwork =
|
|
|
|
container_of(work, struct kthread_flush_work, work);
|
|
|
|
complete(&fwork->done);
|
|
|
|
}
|
|
|
|
|
2010-06-29 16:07:09 +08:00
|
|
|
/**
|
2016-10-12 04:55:20 +08:00
|
|
|
* kthread_flush_work - flush a kthread_work
|
2010-06-29 16:07:09 +08:00
|
|
|
* @work: work to flush
|
|
|
|
*
|
|
|
|
* If @work is queued or executing, wait for it to finish execution.
|
|
|
|
*/
|
2016-10-12 04:55:20 +08:00
|
|
|
void kthread_flush_work(struct kthread_work *work)
|
2010-06-29 16:07:09 +08:00
|
|
|
{
|
2012-07-20 04:52:53 +08:00
|
|
|
struct kthread_flush_work fwork = {
|
|
|
|
KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
|
|
|
|
COMPLETION_INITIALIZER_ONSTACK(fwork.done),
|
|
|
|
};
|
|
|
|
struct kthread_worker *worker;
|
|
|
|
bool noop = false;
|
|
|
|
|
|
|
|
worker = work->worker;
|
|
|
|
if (!worker)
|
|
|
|
return;
|
2010-06-29 16:07:09 +08:00
|
|
|
|
2012-07-20 04:52:53 +08:00
|
|
|
spin_lock_irq(&worker->lock);
|
2016-10-12 04:55:36 +08:00
|
|
|
/* Work must not be used with >1 worker, see kthread_queue_work(). */
|
|
|
|
WARN_ON_ONCE(work->worker != worker);
|
2010-06-29 16:07:09 +08:00
|
|
|
|
2012-07-20 04:52:53 +08:00
|
|
|
if (!list_empty(&work->node))
|
2016-10-12 04:55:20 +08:00
|
|
|
kthread_insert_work(worker, &fwork.work, work->node.next);
|
2012-07-20 04:52:53 +08:00
|
|
|
else if (worker->current_work == work)
|
2016-10-12 04:55:20 +08:00
|
|
|
kthread_insert_work(worker, &fwork.work,
|
|
|
|
worker->work_list.next);
|
2012-07-20 04:52:53 +08:00
|
|
|
else
|
|
|
|
noop = true;
|
2010-06-29 16:07:09 +08:00
|
|
|
|
2012-07-20 04:52:53 +08:00
|
|
|
spin_unlock_irq(&worker->lock);
|
2010-06-29 16:07:09 +08:00
|
|
|
|
2012-07-20 04:52:53 +08:00
|
|
|
if (!noop)
|
|
|
|
wait_for_completion(&fwork.done);
|
2010-06-29 16:07:09 +08:00
|
|
|
}
|
2016-10-12 04:55:20 +08:00
|
|
|
EXPORT_SYMBOL_GPL(kthread_flush_work);
|
2010-06-29 16:07:09 +08:00
|
|
|
|
kthread: allow to cancel kthread work
We are going to use kthread workers more widely and sometimes we will need
to make sure that the work is neither pending nor running.
This patch implements cancel_*_sync() operations as inspired by
workqueues. Well, we are synchronized against the other operations via
the worker lock, we use del_timer_sync() and a counter to count parallel
cancel operations. Therefore the implementation might be easier.
First, we check if a worker is assigned. If not, the work has never been
queued after it was initialized.
Second, we take the worker lock. It must be the right one. The work must
not be assigned to another worker unless it is initialized in between.
Third, we try to cancel the timer when it exists. The timer is deleted
synchronously to make sure that the timer call back is not running. We
need to temporarily release the worker->lock to avoid a possible deadlock
with the callback. In the meantime, we set work->canceling counter to
avoid any queuing.
Fourth, we try to remove the work from a worker list. It might be
the list of either normal or delayed works.
Fifth, if the work is running, we call kthread_flush_work(). It might
take an arbitrary time. We need to release the worker-lock again. In the
meantime, we again block any queuing by the canceling counter.
As already mentioned, the check for a pending kthread work is done under a
lock. In comparison with workqueues, we do not need to fight for a single
PENDING bit to block other operations. Therefore we do not suffer from
the thundering storm problem and all parallel canceling jobs might use
kthread_flush_work(). Any queuing is blocked until the counter gets zero.
Link: http://lkml.kernel.org/r/1470754545-17632-10-git-send-email-pmladek@suse.com
Signed-off-by: Petr Mladek <pmladek@suse.com>
Acked-by: Tejun Heo <tj@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Steven Rostedt <rostedt@goodmis.org>
Cc: "Paul E. McKenney" <paulmck@linux.vnet.ibm.com>
Cc: Josh Triplett <josh@joshtriplett.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Jiri Kosina <jkosina@suse.cz>
Cc: Borislav Petkov <bp@suse.de>
Cc: Michal Hocko <mhocko@suse.cz>
Cc: Vlastimil Babka <vbabka@suse.cz>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2016-10-12 04:55:43 +08:00
|
|
|
/*
|
|
|
|
* This function removes the work from the worker queue. Also it makes sure
|
|
|
|
* that it won't get queued later via the delayed work's timer.
|
|
|
|
*
|
|
|
|
* The work might still be in use when this function finishes. See the
|
|
|
|
* current_work proceed by the worker.
|
|
|
|
*
|
|
|
|
* Return: %true if @work was pending and successfully canceled,
|
|
|
|
* %false if @work was not pending
|
|
|
|
*/
|
|
|
|
static bool __kthread_cancel_work(struct kthread_work *work, bool is_dwork,
|
|
|
|
unsigned long *flags)
|
|
|
|
{
|
|
|
|
/* Try to cancel the timer if exists. */
|
|
|
|
if (is_dwork) {
|
|
|
|
struct kthread_delayed_work *dwork =
|
|
|
|
container_of(work, struct kthread_delayed_work, work);
|
|
|
|
struct kthread_worker *worker = work->worker;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* del_timer_sync() must be called to make sure that the timer
|
|
|
|
* callback is not running. The lock must be temporary released
|
|
|
|
* to avoid a deadlock with the callback. In the meantime,
|
|
|
|
* any queuing is blocked by setting the canceling counter.
|
|
|
|
*/
|
|
|
|
work->canceling++;
|
|
|
|
spin_unlock_irqrestore(&worker->lock, *flags);
|
|
|
|
del_timer_sync(&dwork->timer);
|
|
|
|
spin_lock_irqsave(&worker->lock, *flags);
|
|
|
|
work->canceling--;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Try to remove the work from a worker list. It might either
|
|
|
|
* be from worker->work_list or from worker->delayed_work_list.
|
|
|
|
*/
|
|
|
|
if (!list_empty(&work->node)) {
|
|
|
|
list_del_init(&work->node);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Common implementation of the cancel_*_sync() operations: remove @work
 * from the queue (and stop its timer when @is_dwork is set), then wait for
 * it if the worker is executing it at the moment.
 *
 * Return: %true if @work was pending, %false otherwise (including the case
 * where no worker has been assigned to @work).
 */
static bool __kthread_cancel_work_sync(struct kthread_work *work, bool is_dwork)
{
	struct kthread_worker *worker = work->worker;
	unsigned long flags;
	bool was_pending;

	if (!worker)
		return false;

	spin_lock_irqsave(&worker->lock, flags);
	/* Work must not be used with >1 worker, see kthread_queue_work(). */
	WARN_ON_ONCE(work->worker != worker);

	was_pending = __kthread_cancel_work(work, is_dwork, &flags);

	if (worker->current_work == work) {
		/*
		 * The work is being executed, so we have to wait for it with
		 * the lock released. Keep the canceling counter raised for
		 * that time so that nobody can queue the work meanwhile.
		 */
		work->canceling++;
		spin_unlock_irqrestore(&worker->lock, flags);
		kthread_flush_work(work);
		spin_lock_irqsave(&worker->lock, flags);
		work->canceling--;
	}

	spin_unlock_irqrestore(&worker->lock, flags);
	return was_pending;
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* kthread_cancel_work_sync - cancel a kthread work and wait for it to finish
|
|
|
|
* @work: the kthread work to cancel
|
|
|
|
*
|
|
|
|
* Cancel @work and wait for its execution to finish. This function
|
|
|
|
* can be used even if the work re-queues itself. On return from this
|
|
|
|
* function, @work is guaranteed to be not pending or executing on any CPU.
|
|
|
|
*
|
|
|
|
* kthread_cancel_work_sync(&delayed_work->work) must not be used for
|
|
|
|
* delayed_work's. Use kthread_cancel_delayed_work_sync() instead.
|
|
|
|
*
|
|
|
|
* The caller must ensure that the worker on which @work was last
|
|
|
|
* queued can't be destroyed before this function returns.
|
|
|
|
*
|
|
|
|
* Return: %true if @work was pending, %false otherwise.
|
|
|
|
*/
|
|
|
|
bool kthread_cancel_work_sync(struct kthread_work *work)
|
|
|
|
{
|
|
|
|
return __kthread_cancel_work_sync(work, false);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(kthread_cancel_work_sync);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* kthread_cancel_delayed_work_sync - cancel a kthread delayed work and
|
|
|
|
* wait for it to finish.
|
|
|
|
* @dwork: the kthread delayed work to cancel
|
|
|
|
*
|
|
|
|
* This is kthread_cancel_work_sync() for delayed works.
|
|
|
|
*
|
|
|
|
* Return: %true if @dwork was pending, %false otherwise.
|
|
|
|
*/
|
|
|
|
bool kthread_cancel_delayed_work_sync(struct kthread_delayed_work *dwork)
|
|
|
|
{
|
|
|
|
return __kthread_cancel_work_sync(&dwork->work, true);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(kthread_cancel_delayed_work_sync);
|
|
|
|
|
2010-06-29 16:07:09 +08:00
|
|
|
/**
|
2016-10-12 04:55:20 +08:00
|
|
|
* kthread_flush_worker - flush all current works on a kthread_worker
|
2010-06-29 16:07:09 +08:00
|
|
|
* @worker: worker to flush
|
|
|
|
*
|
|
|
|
* Wait until all currently executing or pending works on @worker are
|
|
|
|
* finished.
|
|
|
|
*/
|
2016-10-12 04:55:20 +08:00
|
|
|
void kthread_flush_worker(struct kthread_worker *worker)
|
2010-06-29 16:07:09 +08:00
|
|
|
{
|
|
|
|
struct kthread_flush_work fwork = {
|
|
|
|
KTHREAD_WORK_INIT(fwork.work, kthread_flush_work_fn),
|
|
|
|
COMPLETION_INITIALIZER_ONSTACK(fwork.done),
|
|
|
|
};
|
|
|
|
|
2016-10-12 04:55:20 +08:00
|
|
|
kthread_queue_work(worker, &fwork.work);
|
2010-06-29 16:07:09 +08:00
|
|
|
wait_for_completion(&fwork.done);
|
|
|
|
}
|
2016-10-12 04:55:20 +08:00
|
|
|
EXPORT_SYMBOL_GPL(kthread_flush_worker);
|
2016-10-12 04:55:33 +08:00
|
|
|
|
|
|
|
/**
|
|
|
|
* kthread_destroy_worker - destroy a kthread worker
|
|
|
|
* @worker: worker to be destroyed
|
|
|
|
*
|
|
|
|
* Flush and destroy @worker. The simple flush is enough because the kthread
|
|
|
|
* worker API is used only in trivial scenarios. There are no multi-step state
|
|
|
|
* machines needed.
|
|
|
|
*/
|
|
|
|
void kthread_destroy_worker(struct kthread_worker *worker)
|
|
|
|
{
|
|
|
|
struct task_struct *task;
|
|
|
|
|
|
|
|
task = worker->task;
|
|
|
|
if (WARN_ON(!task))
|
|
|
|
return;
|
|
|
|
|
|
|
|
kthread_flush_worker(worker);
|
|
|
|
kthread_stop(task);
|
|
|
|
WARN_ON(!list_empty(&worker->work_list));
|
|
|
|
kfree(worker);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(kthread_destroy_worker);
|