2005-04-16 15:20:36 -07:00
|
|
|
/*
|
|
|
|
* linux/kernel/workqueue.c
|
|
|
|
*
|
|
|
|
* Generic mechanism for defining kernel helper threads for running
|
|
|
|
* arbitrary tasks in process context.
|
|
|
|
*
|
|
|
|
* Started by Ingo Molnar, Copyright (C) 2002
|
|
|
|
*
|
|
|
|
* Derived from the taskqueue/keventd code by:
|
|
|
|
*
|
|
|
|
* David Woodhouse <dwmw2@infradead.org>
|
|
|
|
* Andrew Morton <andrewm@uow.edu.au>
|
|
|
|
* Kai Petzke <wpp@marie.physik.tu-berlin.de>
|
|
|
|
* Theodore Ts'o <tytso@mit.edu>
|
2005-10-30 16:01:59 -07:00
|
|
|
*
|
|
|
|
* Made to use alloc_percpu by Christoph Lameter <clameter@sgi.com>.
|
2005-04-16 15:20:36 -07:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/module.h>
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/sched.h>
|
|
|
|
#include <linux/init.h>
|
|
|
|
#include <linux/signal.h>
|
|
|
|
#include <linux/completion.h>
|
|
|
|
#include <linux/workqueue.h>
|
|
|
|
#include <linux/slab.h>
|
|
|
|
#include <linux/cpu.h>
|
|
|
|
#include <linux/notifier.h>
|
|
|
|
#include <linux/kthread.h>
|
2006-02-23 11:43:43 -07:00
|
|
|
#include <linux/hardirq.h>
|
2006-10-11 01:21:26 -07:00
|
|
|
#include <linux/mempolicy.h>
|
2006-12-06 21:34:49 -07:00
|
|
|
#include <linux/freezer.h>
|
2006-12-06 21:37:26 -07:00
|
|
|
#include <linux/kallsyms.h>
|
|
|
|
#include <linux/debug_locks.h>
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
/*
|
2006-01-08 02:05:12 -07:00
|
|
|
* The per-CPU workqueue (if single thread, we always use the first
|
|
|
|
* possible cpu).
|
2005-04-16 15:20:36 -07:00
|
|
|
*/
|
|
|
|
struct cpu_workqueue_struct {
|
|
|
|
|
|
|
|
spinlock_t lock;
|
|
|
|
|
|
|
|
struct list_head worklist;
|
|
|
|
wait_queue_head_t more_work;
|
|
|
|
|
|
|
|
struct workqueue_struct *wq;
|
2006-07-03 00:25:41 -07:00
|
|
|
struct task_struct *thread;
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
struct work_struct *current_work;
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
int run_depth; /* Detect run_workqueue() recursion depth */
|
2006-12-06 21:34:49 -07:00
|
|
|
|
|
|
|
int freezeable; /* Freeze the thread during suspend */
|
2005-04-16 15:20:36 -07:00
|
|
|
} ____cacheline_aligned;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* The externally visible workqueue abstraction is an array of
|
|
|
|
* per-CPU workqueues:
|
|
|
|
*/
|
|
|
|
struct workqueue_struct {
|
2005-10-30 16:01:59 -07:00
|
|
|
struct cpu_workqueue_struct *cpu_wq;
|
2005-04-16 15:20:36 -07:00
|
|
|
const char *name;
|
|
|
|
struct list_head list; /* Empty if single thread */
|
|
|
|
};
|
|
|
|
|
|
|
|
/* All the per-cpu workqueues on the system, for hotplug cpu to add/remove
|
|
|
|
threads to each one as cpus come/go. */
|
2006-08-13 23:24:26 -07:00
|
|
|
static DEFINE_MUTEX(workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
static LIST_HEAD(workqueues);
|
|
|
|
|
2006-01-08 02:05:12 -07:00
|
|
|
static int singlethread_cpu;
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
/* If it's single threaded, it isn't in the list of workqueues. */
|
|
|
|
static inline int is_single_threaded(struct workqueue_struct *wq)
|
|
|
|
{
|
|
|
|
return list_empty(&wq->list);
|
|
|
|
}
|
|
|
|
|
[PATCH] WorkStruct: Use direct assignment rather than cmpxchg()
Use direct assignment rather than cmpxchg() as the latter is unavailable
and unimplementable on some platforms and is actually unnecessary.
The use of cmpxchg() was to guard against two possibilities, neither of
which can actually occur:
(1) The pending flag may have been unset or may be cleared. However, given
where it's called, the pending flag is _always_ set. I don't think it
can be unset whilst we're in set_wq_data().
Once the work is enqueued to be actually run, the only way off the queue
is for it to be actually run.
If it's a delayed work item, then the bit can't be cleared by the timer
because we haven't started the timer yet. Also, the pending bit can't be
cleared by cancelling the delayed work _until_ the work item has had its
timer started.
(2) The workqueue pointer might change. This can only happen in two cases:
(a) The work item has just been queued to actually run, and so we're
protected by the appropriate workqueue spinlock.
(b) A delayed work item is being queued, and so the timer hasn't been
started yet, and so no one else knows about the work item or can
access it (the pending bit protects us).
Besides, set_wq_data() _sets_ the workqueue pointer unconditionally, so
it can be assigned instead.
So, replacing the set_wq_data() with a straight assignment would be okay
in most cases.
The problem is where we end up tangling with test_and_set_bit() emulated
using spinlocks, and even then it's not a problem _provided_
test_and_set_bit() doesn't attempt to modify the word if the bit was
set.
If that's a problem, then a bitops-proofed assignment will be required -
equivalent to atomic_set() vs other atomic_xxx() ops.
Signed-off-by: David Howells <dhowells@redhat.com>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-12-07 04:33:26 -07:00
|
|
|
/*
|
|
|
|
* Set the workqueue on which a work item is to be run
|
|
|
|
* - Must *only* be called if the pending flag is set
|
|
|
|
*/
|
2006-11-22 07:54:49 -07:00
|
|
|
static inline void set_wq_data(struct work_struct *work, void *wq)
|
|
|
|
{
|
[PATCH] WorkStruct: Use direct assignment rather than cmpxchg()
Use direct assignment rather than cmpxchg() as the latter is unavailable
and unimplementable on some platforms and is actually unnecessary.
The use of cmpxchg() was to guard against two possibilities, neither of
which can actually occur:
(1) The pending flag may have been unset or may be cleared. However, given
where it's called, the pending flag is _always_ set. I don't think it
can be unset whilst we're in set_wq_data().
Once the work is enqueued to be actually run, the only way off the queue
is for it to be actually run.
If it's a delayed work item, then the bit can't be cleared by the timer
because we haven't started the timer yet. Also, the pending bit can't be
cleared by cancelling the delayed work _until_ the work item has had its
timer started.
(2) The workqueue pointer might change. This can only happen in two cases:
(a) The work item has just been queued to actually run, and so we're
protected by the appropriate workqueue spinlock.
(b) A delayed work item is being queued, and so the timer hasn't been
started yet, and so no one else knows about the work item or can
access it (the pending bit protects us).
Besides, set_wq_data() _sets_ the workqueue pointer unconditionally, so
it can be assigned instead.
So, replacing the set_wq_data() with a straight assignment would be okay
in most cases.
The problem is where we end up tangling with test_and_set_bit() emulated
using spinlocks, and even then it's not a problem _provided_
test_and_set_bit() doesn't attempt to modify the word if the bit was
set.
If that's a problem, then a bitops-proofed assignment will be required -
equivalent to atomic_set() vs other atomic_xxx() ops.
Signed-off-by: David Howells <dhowells@redhat.com>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-12-07 04:33:26 -07:00
|
|
|
unsigned long new;
|
|
|
|
|
|
|
|
BUG_ON(!work_pending(work));
|
2006-11-22 07:54:49 -07:00
|
|
|
|
|
|
|
new = (unsigned long) wq | (1UL << WORK_STRUCT_PENDING);
|
2006-12-16 10:53:50 -07:00
|
|
|
new |= WORK_STRUCT_FLAG_MASK & *work_data_bits(work);
|
|
|
|
atomic_long_set(&work->data, new);
|
2006-11-22 07:54:49 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
static inline void *get_wq_data(struct work_struct *work)
|
|
|
|
{
|
2006-12-16 10:53:50 -07:00
|
|
|
return (void *) (atomic_long_read(&work->data) & WORK_STRUCT_WQ_DATA_MASK);
|
2006-11-22 07:54:49 -07:00
|
|
|
}
|
|
|
|
|
2006-12-07 10:28:19 -07:00
|
|
|
static int __run_work(struct cpu_workqueue_struct *cwq, struct work_struct *work)
|
|
|
|
{
|
|
|
|
int ret = 0;
|
|
|
|
unsigned long flags;
|
|
|
|
|
|
|
|
spin_lock_irqsave(&cwq->lock, flags);
|
|
|
|
/*
|
|
|
|
* We need to re-validate the work info after we've gotten
|
|
|
|
* the cpu_workqueue lock. We can run the work now iff:
|
|
|
|
*
|
|
|
|
* - the wq_data still matches the cpu_workqueue_struct
|
|
|
|
* - AND the work is still marked pending
|
|
|
|
* - AND the work is still on a list (which will be this
|
|
|
|
* workqueue_struct list)
|
|
|
|
*
|
|
|
|
* All these conditions are important, because we
|
|
|
|
* need to protect against the work being run right
|
|
|
|
* now on another CPU (all but the last one might be
|
|
|
|
* true if it's currently running and has not been
|
|
|
|
* released yet, for example).
|
|
|
|
*/
|
|
|
|
if (get_wq_data(work) == cwq
|
|
|
|
&& work_pending(work)
|
|
|
|
&& !list_empty(&work->entry)) {
|
|
|
|
work_func_t f = work->func;
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
cwq->current_work = work;
|
2006-12-07 10:28:19 -07:00
|
|
|
list_del_init(&work->entry);
|
|
|
|
spin_unlock_irqrestore(&cwq->lock, flags);
|
|
|
|
|
2006-12-16 10:53:50 -07:00
|
|
|
if (!test_bit(WORK_STRUCT_NOAUTOREL, work_data_bits(work)))
|
2006-12-07 10:28:19 -07:00
|
|
|
work_release(work);
|
|
|
|
f(work);
|
|
|
|
|
|
|
|
spin_lock_irqsave(&cwq->lock, flags);
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
cwq->current_work = NULL;
|
2006-12-07 10:28:19 -07:00
|
|
|
ret = 1;
|
|
|
|
}
|
|
|
|
spin_unlock_irqrestore(&cwq->lock, flags);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* run_scheduled_work - run scheduled work synchronously
|
|
|
|
* @work: work to run
|
|
|
|
*
|
|
|
|
* This checks if the work was pending, and runs it
|
|
|
|
* synchronously if so. It returns a boolean to indicate
|
|
|
|
* whether it had any scheduled work to run or not.
|
|
|
|
*
|
|
|
|
* NOTE! This _only_ works for normal work_structs. You
|
|
|
|
* CANNOT use this for delayed work, because the wq data
|
|
|
|
* for delayed work will not point properly to the per-
|
|
|
|
* CPU workqueue struct, but will change!
|
|
|
|
*/
|
|
|
|
int fastcall run_scheduled_work(struct work_struct *work)
|
|
|
|
{
|
|
|
|
for (;;) {
|
|
|
|
struct cpu_workqueue_struct *cwq;
|
|
|
|
|
|
|
|
if (!work_pending(work))
|
|
|
|
return 0;
|
|
|
|
if (list_empty(&work->entry))
|
|
|
|
return 0;
|
|
|
|
/* NOTE! This depends intimately on __queue_work! */
|
|
|
|
cwq = get_wq_data(work);
|
|
|
|
if (!cwq)
|
|
|
|
return 0;
|
|
|
|
if (__run_work(cwq, work))
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(run_scheduled_work);
|
|
|
|
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
static void insert_work(struct cpu_workqueue_struct *cwq,
|
|
|
|
struct work_struct *work, int tail)
|
|
|
|
{
|
|
|
|
set_wq_data(work, cwq);
|
|
|
|
if (tail)
|
|
|
|
list_add_tail(&work->entry, &cwq->worklist);
|
|
|
|
else
|
|
|
|
list_add(&work->entry, &cwq->worklist);
|
|
|
|
wake_up(&cwq->more_work);
|
|
|
|
}
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
/* Preempt must be disabled. */
|
|
|
|
static void __queue_work(struct cpu_workqueue_struct *cwq,
|
|
|
|
struct work_struct *work)
|
|
|
|
{
|
|
|
|
unsigned long flags;
|
|
|
|
|
|
|
|
spin_lock_irqsave(&cwq->lock, flags);
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
insert_work(cwq, work, 1);
|
2005-04-16 15:20:36 -07:00
|
|
|
spin_unlock_irqrestore(&cwq->lock, flags);
|
|
|
|
}
|
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
|
|
|
* queue_work - queue work on a workqueue
|
|
|
|
* @wq: workqueue to use
|
|
|
|
* @work: work to queue
|
|
|
|
*
|
2006-10-28 10:38:58 -07:00
|
|
|
* Returns 0 if @work was already on a queue, non-zero otherwise.
|
2005-04-16 15:20:36 -07:00
|
|
|
*
|
|
|
|
* We queue the work to the CPU it was submitted, but there is no
|
|
|
|
* guarantee that it will be processed by that CPU.
|
|
|
|
*/
|
|
|
|
int fastcall queue_work(struct workqueue_struct *wq, struct work_struct *work)
|
|
|
|
{
|
|
|
|
int ret = 0, cpu = get_cpu();
|
|
|
|
|
2006-12-16 10:53:50 -07:00
|
|
|
if (!test_and_set_bit(WORK_STRUCT_PENDING, work_data_bits(work))) {
|
2005-04-16 15:20:36 -07:00
|
|
|
if (unlikely(is_single_threaded(wq)))
|
2006-01-08 02:05:12 -07:00
|
|
|
cpu = singlethread_cpu;
|
2005-04-16 15:20:36 -07:00
|
|
|
BUG_ON(!list_empty(&work->entry));
|
2005-10-30 16:01:59 -07:00
|
|
|
__queue_work(per_cpu_ptr(wq->cpu_wq, cpu), work);
|
2005-04-16 15:20:36 -07:00
|
|
|
ret = 1;
|
|
|
|
}
|
|
|
|
put_cpu();
|
|
|
|
return ret;
|
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL_GPL(queue_work);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
[PATCH] Add debugging feature /proc/timer_stat
Add /proc/timer_stats support: debugging feature to profile timer expiration.
Both the starting site, process/PID and the expiration function is captured.
This allows the quick identification of timer event sources in a system.
Sample output:
# echo 1 > /proc/timer_stats
# cat /proc/timer_stats
Timer Stats Version: v0.1
Sample period: 4.010 s
24, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
11, 0 swapper sk_reset_timer (tcp_delack_timer)
6, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
17, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
4, 2050 pcscd do_nanosleep (hrtimer_wakeup)
5, 4179 sshd sk_reset_timer (tcp_write_timer)
4, 2248 yum-updatesd schedule_timeout (process_timeout)
18, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
3, 0 swapper sk_reset_timer (tcp_delack_timer)
1, 1 swapper neigh_table_init_no_netlink (neigh_periodic_timer)
2, 1 swapper e1000_up (e1000_watchdog)
1, 1 init schedule_timeout (process_timeout)
100 total events, 25.24 events/sec
[ cleanups and hrtimers support from Thomas Gleixner <tglx@linutronix.de> ]
[bunk@stusta.de: nr_entries can become static]
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Cc: john stultz <johnstul@us.ibm.com>
Cc: Roman Zippel <zippel@linux-m68k.org>
Cc: Andi Kleen <ak@suse.de>
Signed-off-by: Adrian Bunk <bunk@stusta.de>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-02-16 02:28:13 -07:00
|
|
|
void delayed_work_timer_fn(unsigned long __data)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
2006-11-22 07:54:01 -07:00
|
|
|
struct delayed_work *dwork = (struct delayed_work *)__data;
|
2006-11-22 07:54:49 -07:00
|
|
|
struct workqueue_struct *wq = get_wq_data(&dwork->work);
|
2005-04-16 15:20:36 -07:00
|
|
|
int cpu = smp_processor_id();
|
|
|
|
|
|
|
|
if (unlikely(is_single_threaded(wq)))
|
2006-01-08 02:05:12 -07:00
|
|
|
cpu = singlethread_cpu;
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-11-22 07:54:01 -07:00
|
|
|
__queue_work(per_cpu_ptr(wq->cpu_wq, cpu), &dwork->work);
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
|
|
|
* queue_delayed_work - queue work on a workqueue after delay
|
|
|
|
* @wq: workqueue to use
|
2006-12-22 02:06:52 -07:00
|
|
|
* @dwork: delayable work to queue
|
2006-07-30 03:03:42 -07:00
|
|
|
* @delay: number of jiffies to wait before queueing
|
|
|
|
*
|
2006-10-28 10:38:58 -07:00
|
|
|
* Returns 0 if @work was already on a queue, non-zero otherwise.
|
2006-07-30 03:03:42 -07:00
|
|
|
*/
|
2005-04-16 15:20:36 -07:00
|
|
|
int fastcall queue_delayed_work(struct workqueue_struct *wq,
|
2006-11-22 07:54:01 -07:00
|
|
|
struct delayed_work *dwork, unsigned long delay)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
|
|
|
int ret = 0;
|
2006-11-22 07:54:01 -07:00
|
|
|
struct timer_list *timer = &dwork->timer;
|
|
|
|
struct work_struct *work = &dwork->work;
|
|
|
|
|
[PATCH] Add debugging feature /proc/timer_stat
Add /proc/timer_stats support: debugging feature to profile timer expiration.
Both the starting site, process/PID and the expiration function is captured.
This allows the quick identification of timer event sources in a system.
Sample output:
# echo 1 > /proc/timer_stats
# cat /proc/timer_stats
Timer Stats Version: v0.1
Sample period: 4.010 s
24, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
11, 0 swapper sk_reset_timer (tcp_delack_timer)
6, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
17, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
4, 2050 pcscd do_nanosleep (hrtimer_wakeup)
5, 4179 sshd sk_reset_timer (tcp_write_timer)
4, 2248 yum-updatesd schedule_timeout (process_timeout)
18, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
3, 0 swapper sk_reset_timer (tcp_delack_timer)
1, 1 swapper neigh_table_init_no_netlink (neigh_periodic_timer)
2, 1 swapper e1000_up (e1000_watchdog)
1, 1 init schedule_timeout (process_timeout)
100 total events, 25.24 events/sec
[ cleanups and hrtimers support from Thomas Gleixner <tglx@linutronix.de> ]
[bunk@stusta.de: nr_entries can become static]
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Cc: john stultz <johnstul@us.ibm.com>
Cc: Roman Zippel <zippel@linux-m68k.org>
Cc: Andi Kleen <ak@suse.de>
Signed-off-by: Adrian Bunk <bunk@stusta.de>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-02-16 02:28:13 -07:00
|
|
|
timer_stats_timer_set_start_info(timer);
|
2006-11-22 07:54:01 -07:00
|
|
|
if (delay == 0)
|
|
|
|
return queue_work(wq, work);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-12-16 10:53:50 -07:00
|
|
|
if (!test_and_set_bit(WORK_STRUCT_PENDING, work_data_bits(work))) {
|
2005-04-16 15:20:36 -07:00
|
|
|
BUG_ON(timer_pending(timer));
|
|
|
|
BUG_ON(!list_empty(&work->entry));
|
|
|
|
|
|
|
|
/* This stores wq for the moment, for the timer_fn */
|
2006-11-22 07:54:49 -07:00
|
|
|
set_wq_data(work, wq);
|
2005-04-16 15:20:36 -07:00
|
|
|
timer->expires = jiffies + delay;
|
2006-11-22 07:54:01 -07:00
|
|
|
timer->data = (unsigned long)dwork;
|
2005-04-16 15:20:36 -07:00
|
|
|
timer->function = delayed_work_timer_fn;
|
|
|
|
add_timer(timer);
|
|
|
|
ret = 1;
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL_GPL(queue_delayed_work);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
|
|
|
* queue_delayed_work_on - queue work on specific CPU after delay
|
|
|
|
* @cpu: CPU number to execute work on
|
|
|
|
* @wq: workqueue to use
|
2006-12-22 02:06:52 -07:00
|
|
|
* @dwork: work to queue
|
2006-07-30 03:03:42 -07:00
|
|
|
* @delay: number of jiffies to wait before queueing
|
|
|
|
*
|
2006-10-28 10:38:58 -07:00
|
|
|
* Returns 0 if @work was already on a queue, non-zero otherwise.
|
2006-07-30 03:03:42 -07:00
|
|
|
*/
|
2006-06-28 13:50:33 -07:00
|
|
|
int queue_delayed_work_on(int cpu, struct workqueue_struct *wq,
|
2006-11-22 07:54:01 -07:00
|
|
|
struct delayed_work *dwork, unsigned long delay)
|
2006-06-28 13:50:33 -07:00
|
|
|
{
|
|
|
|
int ret = 0;
|
2006-11-22 07:54:01 -07:00
|
|
|
struct timer_list *timer = &dwork->timer;
|
|
|
|
struct work_struct *work = &dwork->work;
|
2006-06-28 13:50:33 -07:00
|
|
|
|
2006-12-16 10:53:50 -07:00
|
|
|
if (!test_and_set_bit(WORK_STRUCT_PENDING, work_data_bits(work))) {
|
2006-06-28 13:50:33 -07:00
|
|
|
BUG_ON(timer_pending(timer));
|
|
|
|
BUG_ON(!list_empty(&work->entry));
|
|
|
|
|
|
|
|
/* This stores wq for the moment, for the timer_fn */
|
2006-11-22 07:54:49 -07:00
|
|
|
set_wq_data(work, wq);
|
2006-06-28 13:50:33 -07:00
|
|
|
timer->expires = jiffies + delay;
|
2006-11-22 07:54:01 -07:00
|
|
|
timer->data = (unsigned long)dwork;
|
2006-06-28 13:50:33 -07:00
|
|
|
timer->function = delayed_work_timer_fn;
|
|
|
|
add_timer_on(timer, cpu);
|
|
|
|
ret = 1;
|
|
|
|
}
|
|
|
|
return ret;
|
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL_GPL(queue_delayed_work_on);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-01-14 14:20:43 -07:00
|
|
|
static void run_workqueue(struct cpu_workqueue_struct *cwq)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
|
|
|
unsigned long flags;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Keep taking off work from the queue until
|
|
|
|
* done.
|
|
|
|
*/
|
|
|
|
spin_lock_irqsave(&cwq->lock, flags);
|
|
|
|
cwq->run_depth++;
|
|
|
|
if (cwq->run_depth > 3) {
|
|
|
|
/* morton gets to eat his hat */
|
|
|
|
printk("%s: recursion depth exceeded: %d\n",
|
|
|
|
__FUNCTION__, cwq->run_depth);
|
|
|
|
dump_stack();
|
|
|
|
}
|
|
|
|
while (!list_empty(&cwq->worklist)) {
|
|
|
|
struct work_struct *work = list_entry(cwq->worklist.next,
|
|
|
|
struct work_struct, entry);
|
2006-11-22 07:54:45 -07:00
|
|
|
work_func_t f = work->func;
|
2005-04-16 15:20:36 -07:00
|
|
|
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
cwq->current_work = work;
|
2005-04-16 15:20:36 -07:00
|
|
|
list_del_init(cwq->worklist.next);
|
|
|
|
spin_unlock_irqrestore(&cwq->lock, flags);
|
|
|
|
|
2006-11-22 07:54:49 -07:00
|
|
|
BUG_ON(get_wq_data(work) != cwq);
|
2006-12-16 10:53:50 -07:00
|
|
|
if (!test_bit(WORK_STRUCT_NOAUTOREL, work_data_bits(work)))
|
2006-11-22 07:55:48 -07:00
|
|
|
work_release(work);
|
|
|
|
f(work);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-12-06 21:37:26 -07:00
|
|
|
if (unlikely(in_atomic() || lockdep_depth(current) > 0)) {
|
|
|
|
printk(KERN_ERR "BUG: workqueue leaked lock or atomic: "
|
|
|
|
"%s/0x%08x/%d\n",
|
|
|
|
current->comm, preempt_count(),
|
|
|
|
current->pid);
|
|
|
|
printk(KERN_ERR " last function: ");
|
|
|
|
print_symbol("%s\n", (unsigned long)f);
|
|
|
|
debug_show_held_locks(current);
|
|
|
|
dump_stack();
|
|
|
|
}
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
spin_lock_irqsave(&cwq->lock, flags);
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
cwq->current_work = NULL;
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
|
|
|
cwq->run_depth--;
|
|
|
|
spin_unlock_irqrestore(&cwq->lock, flags);
|
|
|
|
}
|
|
|
|
|
|
|
|
static int worker_thread(void *__cwq)
|
|
|
|
{
|
|
|
|
struct cpu_workqueue_struct *cwq = __cwq;
|
|
|
|
DECLARE_WAITQUEUE(wait, current);
|
|
|
|
struct k_sigaction sa;
|
|
|
|
sigset_t blocked;
|
|
|
|
|
2006-12-06 21:34:49 -07:00
|
|
|
if (!cwq->freezeable)
|
|
|
|
current->flags |= PF_NOFREEZE;
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
set_user_nice(current, -5);
|
|
|
|
|
|
|
|
/* Block and flush all signals */
|
|
|
|
sigfillset(&blocked);
|
|
|
|
sigprocmask(SIG_BLOCK, &blocked, NULL);
|
|
|
|
flush_signals(current);
|
|
|
|
|
2006-10-11 01:21:26 -07:00
|
|
|
/*
|
|
|
|
* We inherited MPOL_INTERLEAVE from the booting kernel.
|
|
|
|
* Set MPOL_DEFAULT to insure node local allocations.
|
|
|
|
*/
|
|
|
|
numa_default_policy();
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
/* SIG_IGN makes children autoreap: see do_notify_parent(). */
|
|
|
|
sa.sa.sa_handler = SIG_IGN;
|
|
|
|
sa.sa.sa_flags = 0;
|
|
|
|
siginitset(&sa.sa.sa_mask, sigmask(SIGCHLD));
|
|
|
|
do_sigaction(SIGCHLD, &sa, (struct k_sigaction *)0);
|
|
|
|
|
|
|
|
set_current_state(TASK_INTERRUPTIBLE);
|
|
|
|
while (!kthread_should_stop()) {
|
2006-12-06 21:34:49 -07:00
|
|
|
if (cwq->freezeable)
|
|
|
|
try_to_freeze();
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
add_wait_queue(&cwq->more_work, &wait);
|
|
|
|
if (list_empty(&cwq->worklist))
|
|
|
|
schedule();
|
|
|
|
else
|
|
|
|
__set_current_state(TASK_RUNNING);
|
|
|
|
remove_wait_queue(&cwq->more_work, &wait);
|
|
|
|
|
|
|
|
if (!list_empty(&cwq->worklist))
|
|
|
|
run_workqueue(cwq);
|
|
|
|
set_current_state(TASK_INTERRUPTIBLE);
|
|
|
|
}
|
|
|
|
__set_current_state(TASK_RUNNING);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2007-05-09 02:33:51 -07:00
|
|
|
struct wq_barrier {
|
|
|
|
struct work_struct work;
|
|
|
|
struct completion done;
|
|
|
|
};
|
|
|
|
|
|
|
|
static void wq_barrier_func(struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct wq_barrier *barr = container_of(work, struct wq_barrier, work);
|
|
|
|
complete(&barr->done);
|
|
|
|
}
|
|
|
|
|
2007-05-09 02:33:54 -07:00
|
|
|
static void insert_wq_barrier(struct cpu_workqueue_struct *cwq,
|
|
|
|
struct wq_barrier *barr, int tail)
|
2007-05-09 02:33:51 -07:00
|
|
|
{
|
|
|
|
INIT_WORK(&barr->work, wq_barrier_func);
|
|
|
|
__set_bit(WORK_STRUCT_PENDING, work_data_bits(&barr->work));
|
|
|
|
|
|
|
|
init_completion(&barr->done);
|
2007-05-09 02:33:54 -07:00
|
|
|
|
|
|
|
insert_work(cwq, &barr->work, tail);
|
2007-05-09 02:33:51 -07:00
|
|
|
}
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
static void flush_cpu_workqueue(struct cpu_workqueue_struct *cwq)
|
|
|
|
{
|
|
|
|
if (cwq->thread == current) {
|
|
|
|
/*
|
|
|
|
* Probably keventd trying to flush its own queue. So simply run
|
|
|
|
* it by hand rather than deadlocking.
|
|
|
|
*/
|
2007-05-09 02:33:53 -07:00
|
|
|
preempt_enable();
|
|
|
|
/*
|
|
|
|
* We can still touch *cwq here because we are keventd, and
|
|
|
|
* hot-unplug will be waiting us to exit.
|
|
|
|
*/
|
2005-04-16 15:20:36 -07:00
|
|
|
run_workqueue(cwq);
|
2007-05-09 02:33:53 -07:00
|
|
|
preempt_disable();
|
2005-04-16 15:20:36 -07:00
|
|
|
} else {
|
2007-05-09 02:33:51 -07:00
|
|
|
struct wq_barrier barr;
|
2007-05-09 02:33:54 -07:00
|
|
|
int active = 0;
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2007-05-09 02:33:54 -07:00
|
|
|
spin_lock_irq(&cwq->lock);
|
|
|
|
if (!list_empty(&cwq->worklist) || cwq->current_work != NULL) {
|
|
|
|
insert_wq_barrier(cwq, &barr, 1);
|
|
|
|
active = 1;
|
|
|
|
}
|
|
|
|
spin_unlock_irq(&cwq->lock);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2007-05-09 02:33:54 -07:00
|
|
|
if (active) {
|
|
|
|
preempt_enable();
|
|
|
|
wait_for_completion(&barr.done);
|
|
|
|
preempt_disable();
|
|
|
|
}
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
2005-04-16 15:20:36 -07:00
|
|
|
* flush_workqueue - ensure that any scheduled work has run to completion.
|
2006-07-30 03:03:42 -07:00
|
|
|
* @wq: workqueue to flush
|
2005-04-16 15:20:36 -07:00
|
|
|
*
|
|
|
|
* Forces execution of the workqueue and blocks until its completion.
|
|
|
|
* This is typically used in driver shutdown handlers.
|
|
|
|
*
|
2007-05-09 02:33:51 -07:00
|
|
|
* We sleep until all works which were queued on entry have been handled,
|
|
|
|
* but we are not livelocked by new incoming ones.
|
2005-04-16 15:20:36 -07:00
|
|
|
*
|
|
|
|
* This function used to run the workqueues itself. Now we just wait for the
|
|
|
|
* helper threads to do it.
|
|
|
|
*/
|
|
|
|
void fastcall flush_workqueue(struct workqueue_struct *wq)
|
|
|
|
{
|
2007-05-09 02:33:53 -07:00
|
|
|
preempt_disable(); /* CPU hotplug */
|
2005-04-16 15:20:36 -07:00
|
|
|
if (is_single_threaded(wq)) {
|
2005-11-28 14:43:56 -07:00
|
|
|
/* Always use first cpu's area. */
|
2006-01-08 02:05:12 -07:00
|
|
|
flush_cpu_workqueue(per_cpu_ptr(wq->cpu_wq, singlethread_cpu));
|
2005-04-16 15:20:36 -07:00
|
|
|
} else {
|
|
|
|
int cpu;
|
|
|
|
|
|
|
|
for_each_online_cpu(cpu)
|
2005-10-30 16:01:59 -07:00
|
|
|
flush_cpu_workqueue(per_cpu_ptr(wq->cpu_wq, cpu));
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
2007-05-09 02:33:53 -07:00
|
|
|
preempt_enable();
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL_GPL(flush_workqueue);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
static void wait_on_work(struct cpu_workqueue_struct *cwq,
|
|
|
|
struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct wq_barrier barr;
|
|
|
|
int running = 0;
|
|
|
|
|
|
|
|
spin_lock_irq(&cwq->lock);
|
|
|
|
if (unlikely(cwq->current_work == work)) {
|
2007-05-09 02:33:54 -07:00
|
|
|
insert_wq_barrier(cwq, &barr, 0);
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
running = 1;
|
|
|
|
}
|
|
|
|
spin_unlock_irq(&cwq->lock);
|
|
|
|
|
|
|
|
if (unlikely(running)) {
|
|
|
|
mutex_unlock(&workqueue_mutex);
|
|
|
|
wait_for_completion(&barr.done);
|
|
|
|
mutex_lock(&workqueue_mutex);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* flush_work - block until a work_struct's callback has terminated
|
|
|
|
* @wq: the workqueue on which the work is queued
|
|
|
|
* @work: the work which is to be flushed
|
|
|
|
*
|
|
|
|
* flush_work() will attempt to cancel the work if it is queued. If the work's
|
|
|
|
* callback appears to be running, flush_work() will block until it has
|
|
|
|
* completed.
|
|
|
|
*
|
|
|
|
* flush_work() is designed to be used when the caller is tearing down data
|
|
|
|
* structures which the callback function operates upon. It is expected that,
|
|
|
|
* prior to calling flush_work(), the caller has arranged for the work to not
|
|
|
|
* be requeued.
|
|
|
|
*/
|
|
|
|
void flush_work(struct workqueue_struct *wq, struct work_struct *work)
|
|
|
|
{
|
|
|
|
struct cpu_workqueue_struct *cwq;
|
|
|
|
|
|
|
|
mutex_lock(&workqueue_mutex);
|
|
|
|
cwq = get_wq_data(work);
|
|
|
|
/* Was it ever queued ? */
|
|
|
|
if (!cwq)
|
|
|
|
goto out;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This work can't be re-queued, and the lock above protects us
|
|
|
|
* from take_over_work(), no need to re-check that get_wq_data()
|
|
|
|
* is still the same when we take cwq->lock.
|
|
|
|
*/
|
|
|
|
spin_lock_irq(&cwq->lock);
|
|
|
|
list_del_init(&work->entry);
|
|
|
|
work_release(work);
|
|
|
|
spin_unlock_irq(&cwq->lock);
|
|
|
|
|
|
|
|
if (is_single_threaded(wq)) {
|
|
|
|
/* Always use first cpu's area. */
|
|
|
|
wait_on_work(per_cpu_ptr(wq->cpu_wq, singlethread_cpu), work);
|
|
|
|
} else {
|
|
|
|
int cpu;
|
|
|
|
|
|
|
|
for_each_online_cpu(cpu)
|
|
|
|
wait_on_work(per_cpu_ptr(wq->cpu_wq, cpu), work);
|
|
|
|
}
|
|
|
|
out:
|
|
|
|
mutex_unlock(&workqueue_mutex);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(flush_work);
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
static struct task_struct *create_workqueue_thread(struct workqueue_struct *wq,
|
2006-12-06 21:34:49 -07:00
|
|
|
int cpu, int freezeable)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
2005-10-30 16:01:59 -07:00
|
|
|
struct cpu_workqueue_struct *cwq = per_cpu_ptr(wq->cpu_wq, cpu);
|
2005-04-16 15:20:36 -07:00
|
|
|
struct task_struct *p;
|
|
|
|
|
|
|
|
spin_lock_init(&cwq->lock);
|
|
|
|
cwq->wq = wq;
|
|
|
|
cwq->thread = NULL;
|
2006-12-06 21:34:49 -07:00
|
|
|
cwq->freezeable = freezeable;
|
2005-04-16 15:20:36 -07:00
|
|
|
INIT_LIST_HEAD(&cwq->worklist);
|
|
|
|
init_waitqueue_head(&cwq->more_work);
|
|
|
|
|
|
|
|
if (is_single_threaded(wq))
|
|
|
|
p = kthread_create(worker_thread, cwq, "%s", wq->name);
|
|
|
|
else
|
|
|
|
p = kthread_create(worker_thread, cwq, "%s/%d", wq->name, cpu);
|
|
|
|
if (IS_ERR(p))
|
|
|
|
return NULL;
|
|
|
|
cwq->thread = p;
|
|
|
|
return p;
|
|
|
|
}
|
|
|
|
|
|
|
|
struct workqueue_struct *__create_workqueue(const char *name,
|
2006-12-06 21:34:49 -07:00
|
|
|
int singlethread, int freezeable)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
|
|
|
int cpu, destroy = 0;
|
|
|
|
struct workqueue_struct *wq;
|
|
|
|
struct task_struct *p;
|
|
|
|
|
2005-09-06 15:18:31 -07:00
|
|
|
wq = kzalloc(sizeof(*wq), GFP_KERNEL);
|
2005-04-16 15:20:36 -07:00
|
|
|
if (!wq)
|
|
|
|
return NULL;
|
|
|
|
|
2005-10-30 16:01:59 -07:00
|
|
|
wq->cpu_wq = alloc_percpu(struct cpu_workqueue_struct);
|
2006-01-08 02:03:04 -07:00
|
|
|
if (!wq->cpu_wq) {
|
|
|
|
kfree(wq);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
wq->name = name;
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_lock(&workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
if (singlethread) {
|
|
|
|
INIT_LIST_HEAD(&wq->list);
|
2006-12-06 21:34:49 -07:00
|
|
|
p = create_workqueue_thread(wq, singlethread_cpu, freezeable);
|
2005-04-16 15:20:36 -07:00
|
|
|
if (!p)
|
|
|
|
destroy = 1;
|
|
|
|
else
|
|
|
|
wake_up_process(p);
|
|
|
|
} else {
|
|
|
|
list_add(&wq->list, &workqueues);
|
|
|
|
for_each_online_cpu(cpu) {
|
2006-12-06 21:34:49 -07:00
|
|
|
p = create_workqueue_thread(wq, cpu, freezeable);
|
2005-04-16 15:20:36 -07:00
|
|
|
if (p) {
|
|
|
|
kthread_bind(p, cpu);
|
|
|
|
wake_up_process(p);
|
|
|
|
} else
|
|
|
|
destroy = 1;
|
|
|
|
}
|
|
|
|
}
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_unlock(&workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Was there any error during startup? If yes then clean up:
|
|
|
|
*/
|
|
|
|
if (destroy) {
|
|
|
|
destroy_workqueue(wq);
|
|
|
|
wq = NULL;
|
|
|
|
}
|
|
|
|
return wq;
|
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL_GPL(__create_workqueue);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
static void cleanup_workqueue_thread(struct workqueue_struct *wq, int cpu)
|
|
|
|
{
|
|
|
|
struct cpu_workqueue_struct *cwq;
|
|
|
|
unsigned long flags;
|
|
|
|
struct task_struct *p;
|
|
|
|
|
2005-10-30 16:01:59 -07:00
|
|
|
cwq = per_cpu_ptr(wq->cpu_wq, cpu);
|
2005-04-16 15:20:36 -07:00
|
|
|
spin_lock_irqsave(&cwq->lock, flags);
|
|
|
|
p = cwq->thread;
|
|
|
|
cwq->thread = NULL;
|
|
|
|
spin_unlock_irqrestore(&cwq->lock, flags);
|
|
|
|
if (p)
|
|
|
|
kthread_stop(p);
|
|
|
|
}
|
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
|
|
|
* destroy_workqueue - safely terminate a workqueue
|
|
|
|
* @wq: target workqueue
|
|
|
|
*
|
|
|
|
* Safely destroy a workqueue. All work currently pending will be done first.
|
|
|
|
*/
|
2005-04-16 15:20:36 -07:00
|
|
|
void destroy_workqueue(struct workqueue_struct *wq)
|
|
|
|
{
|
|
|
|
int cpu;
|
|
|
|
|
|
|
|
flush_workqueue(wq);
|
|
|
|
|
|
|
|
/* We don't need the distraction of CPUs appearing and vanishing. */
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_lock(&workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
if (is_single_threaded(wq))
|
2006-01-08 02:05:12 -07:00
|
|
|
cleanup_workqueue_thread(wq, singlethread_cpu);
|
2005-04-16 15:20:36 -07:00
|
|
|
else {
|
|
|
|
for_each_online_cpu(cpu)
|
|
|
|
cleanup_workqueue_thread(wq, cpu);
|
|
|
|
list_del(&wq->list);
|
|
|
|
}
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_unlock(&workqueue_mutex);
|
2005-10-30 16:01:59 -07:00
|
|
|
free_percpu(wq->cpu_wq);
|
2005-04-16 15:20:36 -07:00
|
|
|
kfree(wq);
|
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL_GPL(destroy_workqueue);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
static struct workqueue_struct *keventd_wq;
|
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
|
|
|
* schedule_work - put work task in global workqueue
|
|
|
|
* @work: job to be done
|
|
|
|
*
|
|
|
|
* This puts a job in the kernel-global workqueue.
|
|
|
|
*/
|
2005-04-16 15:20:36 -07:00
|
|
|
int fastcall schedule_work(struct work_struct *work)
|
|
|
|
{
|
|
|
|
return queue_work(keventd_wq, work);
|
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL(schedule_work);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
|
|
|
* schedule_delayed_work - put work task in global workqueue after delay
|
2006-11-22 07:54:01 -07:00
|
|
|
* @dwork: job to be done
|
|
|
|
* @delay: number of jiffies to wait or 0 for immediate execution
|
2006-07-30 03:03:42 -07:00
|
|
|
*
|
|
|
|
* After waiting for a given time this puts a job in the kernel-global
|
|
|
|
* workqueue.
|
|
|
|
*/
|
[PATCH] Add debugging feature /proc/timer_stat
Add /proc/timer_stats support: debugging feature to profile timer expiration.
Both the starting site, process/PID and the expiration function is captured.
This allows the quick identification of timer event sources in a system.
Sample output:
# echo 1 > /proc/timer_stats
# cat /proc/timer_stats
Timer Stats Version: v0.1
Sample period: 4.010 s
24, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
11, 0 swapper sk_reset_timer (tcp_delack_timer)
6, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
17, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
4, 2050 pcscd do_nanosleep (hrtimer_wakeup)
5, 4179 sshd sk_reset_timer (tcp_write_timer)
4, 2248 yum-updatesd schedule_timeout (process_timeout)
18, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
3, 0 swapper sk_reset_timer (tcp_delack_timer)
1, 1 swapper neigh_table_init_no_netlink (neigh_periodic_timer)
2, 1 swapper e1000_up (e1000_watchdog)
1, 1 init schedule_timeout (process_timeout)
100 total events, 25.24 events/sec
[ cleanups and hrtimers support from Thomas Gleixner <tglx@linutronix.de> ]
[bunk@stusta.de: nr_entries can become static]
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Cc: john stultz <johnstul@us.ibm.com>
Cc: Roman Zippel <zippel@linux-m68k.org>
Cc: Andi Kleen <ak@suse.de>
Signed-off-by: Adrian Bunk <bunk@stusta.de>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-02-16 02:28:13 -07:00
|
|
|
int fastcall schedule_delayed_work(struct delayed_work *dwork,
|
|
|
|
unsigned long delay)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
[PATCH] Add debugging feature /proc/timer_stat
Add /proc/timer_stats support: debugging feature to profile timer expiration.
Both the starting site, process/PID and the expiration function is captured.
This allows the quick identification of timer event sources in a system.
Sample output:
# echo 1 > /proc/timer_stats
# cat /proc/timer_stats
Timer Stats Version: v0.1
Sample period: 4.010 s
24, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
11, 0 swapper sk_reset_timer (tcp_delack_timer)
6, 0 swapper hrtimer_stop_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
17, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
2, 1 swapper queue_delayed_work_on (delayed_work_timer_fn)
4, 2050 pcscd do_nanosleep (hrtimer_wakeup)
5, 4179 sshd sk_reset_timer (tcp_write_timer)
4, 2248 yum-updatesd schedule_timeout (process_timeout)
18, 0 swapper hrtimer_restart_sched_tick (hrtimer_sched_tick)
3, 0 swapper sk_reset_timer (tcp_delack_timer)
1, 1 swapper neigh_table_init_no_netlink (neigh_periodic_timer)
2, 1 swapper e1000_up (e1000_watchdog)
1, 1 init schedule_timeout (process_timeout)
100 total events, 25.24 events/sec
[ cleanups and hrtimers support from Thomas Gleixner <tglx@linutronix.de> ]
[bunk@stusta.de: nr_entries can become static]
Signed-off-by: Ingo Molnar <mingo@elte.hu>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Cc: john stultz <johnstul@us.ibm.com>
Cc: Roman Zippel <zippel@linux-m68k.org>
Cc: Andi Kleen <ak@suse.de>
Signed-off-by: Adrian Bunk <bunk@stusta.de>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-02-16 02:28:13 -07:00
|
|
|
timer_stats_timer_set_start_info(&dwork->timer);
|
2006-11-22 07:54:01 -07:00
|
|
|
return queue_delayed_work(keventd_wq, dwork, delay);
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL(schedule_delayed_work);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-07-30 03:03:42 -07:00
|
|
|
/**
|
|
|
|
* schedule_delayed_work_on - queue work in global workqueue on CPU after delay
|
|
|
|
* @cpu: cpu to use
|
2006-11-22 07:54:01 -07:00
|
|
|
* @dwork: job to be done
|
2006-07-30 03:03:42 -07:00
|
|
|
* @delay: number of jiffies to wait
|
|
|
|
*
|
|
|
|
* After waiting for a given time this puts a job in the kernel-global
|
|
|
|
* workqueue on the specified CPU.
|
|
|
|
*/
|
2005-04-16 15:20:36 -07:00
|
|
|
int schedule_delayed_work_on(int cpu,
|
2006-11-22 07:54:01 -07:00
|
|
|
struct delayed_work *dwork, unsigned long delay)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
2006-11-22 07:54:01 -07:00
|
|
|
return queue_delayed_work_on(cpu, keventd_wq, dwork, delay);
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL(schedule_delayed_work_on);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
2006-06-25 05:47:49 -07:00
|
|
|
/**
|
|
|
|
* schedule_on_each_cpu - call a function on each online CPU from keventd
|
|
|
|
* @func: the function to call
|
|
|
|
*
|
|
|
|
* Returns zero on success.
|
|
|
|
* Returns -ve errno on failure.
|
|
|
|
*
|
|
|
|
* Appears to be racy against CPU hotplug.
|
|
|
|
*
|
|
|
|
* schedule_on_each_cpu() is very slow.
|
|
|
|
*/
|
2006-11-22 07:55:48 -07:00
|
|
|
int schedule_on_each_cpu(work_func_t func)
|
2006-01-08 02:00:43 -07:00
|
|
|
{
|
|
|
|
int cpu;
|
2006-06-25 05:47:49 -07:00
|
|
|
struct work_struct *works;
|
2006-01-08 02:00:43 -07:00
|
|
|
|
2006-06-25 05:47:49 -07:00
|
|
|
works = alloc_percpu(struct work_struct);
|
|
|
|
if (!works)
|
2006-01-08 02:00:43 -07:00
|
|
|
return -ENOMEM;
|
2006-06-25 05:47:49 -07:00
|
|
|
|
2007-05-09 02:33:50 -07:00
|
|
|
preempt_disable(); /* CPU hotplug */
|
2006-01-08 02:00:43 -07:00
|
|
|
for_each_online_cpu(cpu) {
|
2006-12-18 12:05:09 -07:00
|
|
|
struct work_struct *work = per_cpu_ptr(works, cpu);
|
|
|
|
|
|
|
|
INIT_WORK(work, func);
|
|
|
|
set_bit(WORK_STRUCT_PENDING, work_data_bits(work));
|
|
|
|
__queue_work(per_cpu_ptr(keventd_wq->cpu_wq, cpu), work);
|
2006-01-08 02:00:43 -07:00
|
|
|
}
|
2007-05-09 02:33:50 -07:00
|
|
|
preempt_enable();
|
2006-01-08 02:00:43 -07:00
|
|
|
flush_workqueue(keventd_wq);
|
2006-06-25 05:47:49 -07:00
|
|
|
free_percpu(works);
|
2006-01-08 02:00:43 -07:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
void flush_scheduled_work(void)
|
|
|
|
{
|
|
|
|
flush_workqueue(keventd_wq);
|
|
|
|
}
|
2006-06-29 22:40:45 -07:00
|
|
|
EXPORT_SYMBOL(flush_scheduled_work);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
implement flush_work()
A basic problem with flush_scheduled_work() is that it blocks behind _all_
presently-queued works, rather than just the work whcih the caller wants to
flush. If the caller holds some lock, and if one of the queued work happens
to want that lock as well then accidental deadlocks can occur.
One example of this is the phy layer: it wants to flush work while holding
rtnl_lock(). But if a linkwatch event happens to be queued, the phy code will
deadlock because the linkwatch callback function takes rtnl_lock.
So we implement a new function which will flush a *single* work - just the one
which the caller wants to free up. Thus we avoid the accidental deadlocks
which can arise from unrelated subsystems' callbacks taking shared locks.
flush_work() non-blockingly dequeues the work_struct which we want to kill,
then it waits for its handler to complete on all CPUs.
Add ->current_work to the "struct cpu_workqueue_struct", it points to
currently running "struct work_struct". When flush_work(work) detects
->current_work == work, it inserts a barrier at the _head_ of ->worklist
(and thus right _after_ that work) and waits for completition. This means
that the next work fired on that CPU will be this barrier, or another
barrier queued by concurrent flush_work(), so the caller of flush_work()
will be woken before any "regular" work has a chance to run.
When wait_on_work() unlocks workqueue_mutex (or whatever we choose to protect
against CPU hotplug), CPU may go away. But in that case take_over_work() will
move a barrier we queued to another CPU, it will be fired sometime, and
wait_on_work() will be woken.
Actually, we are doing cleanup_workqueue_thread()->kthread_stop() before
take_over_work(), so cwq->thread should complete its ->worklist (and thus
the barrier), because currently we don't check kthread_should_stop() in
run_workqueue(). But even if we did, everything should be ok.
[akpm@osdl.org: cleanup]
[akpm@osdl.org: add flush_work_keventd() wrapper]
Signed-off-by: Oleg Nesterov <oleg@tv-sign.ru>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 02:33:52 -07:00
|
|
|
void flush_work_keventd(struct work_struct *work)
|
|
|
|
{
|
|
|
|
flush_work(keventd_wq, work);
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(flush_work_keventd);
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
/**
|
2007-02-10 02:45:59 -07:00
|
|
|
* cancel_rearming_delayed_workqueue - reliably kill off a delayed work whose handler rearms the delayed work.
|
2005-04-16 15:20:36 -07:00
|
|
|
* @wq: the controlling workqueue structure
|
2006-11-22 07:54:01 -07:00
|
|
|
* @dwork: the delayed work struct
|
2005-04-16 15:20:36 -07:00
|
|
|
*/
|
2005-04-16 15:23:59 -07:00
|
|
|
void cancel_rearming_delayed_workqueue(struct workqueue_struct *wq,
|
2006-11-22 07:54:01 -07:00
|
|
|
struct delayed_work *dwork)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
2006-11-22 07:54:01 -07:00
|
|
|
while (!cancel_delayed_work(dwork))
|
2005-04-16 15:20:36 -07:00
|
|
|
flush_workqueue(wq);
|
|
|
|
}
|
2005-04-16 15:23:59 -07:00
|
|
|
EXPORT_SYMBOL(cancel_rearming_delayed_workqueue);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
/**
|
2007-02-10 02:45:59 -07:00
|
|
|
* cancel_rearming_delayed_work - reliably kill off a delayed keventd work whose handler rearms the delayed work.
|
2006-11-22 07:54:01 -07:00
|
|
|
* @dwork: the delayed work struct
|
2005-04-16 15:20:36 -07:00
|
|
|
*/
|
2006-11-22 07:54:01 -07:00
|
|
|
void cancel_rearming_delayed_work(struct delayed_work *dwork)
|
2005-04-16 15:20:36 -07:00
|
|
|
{
|
2006-11-22 07:54:01 -07:00
|
|
|
cancel_rearming_delayed_workqueue(keventd_wq, dwork);
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
|
|
|
EXPORT_SYMBOL(cancel_rearming_delayed_work);
|
|
|
|
|
2006-02-23 11:43:43 -07:00
|
|
|
/**
|
|
|
|
* execute_in_process_context - reliably execute the routine with user context
|
|
|
|
* @fn: the function to execute
|
|
|
|
* @ew: guaranteed storage for the execute work structure (must
|
|
|
|
* be available when the work executes)
|
|
|
|
*
|
|
|
|
* Executes the function immediately if process context is available,
|
|
|
|
* otherwise schedules the function for delayed execution.
|
|
|
|
*
|
|
|
|
* Returns: 0 - function was executed
|
|
|
|
* 1 - function was scheduled for execution
|
|
|
|
*/
|
2006-11-22 07:55:48 -07:00
|
|
|
int execute_in_process_context(work_func_t fn, struct execute_work *ew)
|
2006-02-23 11:43:43 -07:00
|
|
|
{
|
|
|
|
if (!in_interrupt()) {
|
2006-11-22 07:55:48 -07:00
|
|
|
fn(&ew->work);
|
2006-02-23 11:43:43 -07:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2006-11-22 07:55:48 -07:00
|
|
|
INIT_WORK(&ew->work, fn);
|
2006-02-23 11:43:43 -07:00
|
|
|
schedule_work(&ew->work);
|
|
|
|
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
EXPORT_SYMBOL_GPL(execute_in_process_context);
|
|
|
|
|
2005-04-16 15:20:36 -07:00
|
|
|
int keventd_up(void)
|
|
|
|
{
|
|
|
|
return keventd_wq != NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
int current_is_keventd(void)
|
|
|
|
{
|
|
|
|
struct cpu_workqueue_struct *cwq;
|
|
|
|
int cpu = smp_processor_id(); /* preempt-safe: keventd is per-cpu */
|
|
|
|
int ret = 0;
|
|
|
|
|
|
|
|
BUG_ON(!keventd_wq);
|
|
|
|
|
2005-10-30 16:01:59 -07:00
|
|
|
cwq = per_cpu_ptr(keventd_wq->cpu_wq, cpu);
|
2005-04-16 15:20:36 -07:00
|
|
|
if (current == cwq->thread)
|
|
|
|
ret = 1;
|
|
|
|
|
|
|
|
return ret;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Take the work from this (downed) CPU. */
|
|
|
|
static void take_over_work(struct workqueue_struct *wq, unsigned int cpu)
|
|
|
|
{
|
2005-10-30 16:01:59 -07:00
|
|
|
struct cpu_workqueue_struct *cwq = per_cpu_ptr(wq->cpu_wq, cpu);
|
2006-06-23 02:05:55 -07:00
|
|
|
struct list_head list;
|
2005-04-16 15:20:36 -07:00
|
|
|
struct work_struct *work;
|
|
|
|
|
|
|
|
spin_lock_irq(&cwq->lock);
|
2006-06-23 02:05:55 -07:00
|
|
|
list_replace_init(&cwq->worklist, &list);
|
2005-04-16 15:20:36 -07:00
|
|
|
|
|
|
|
while (!list_empty(&list)) {
|
|
|
|
printk("Taking work for %s\n", wq->name);
|
|
|
|
work = list_entry(list.next,struct work_struct,entry);
|
|
|
|
list_del(&work->entry);
|
2005-10-30 16:01:59 -07:00
|
|
|
__queue_work(per_cpu_ptr(wq->cpu_wq, smp_processor_id()), work);
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
|
|
|
spin_unlock_irq(&cwq->lock);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* We're holding the cpucontrol mutex here */
|
2006-06-27 02:54:07 -07:00
|
|
|
static int __devinit workqueue_cpu_callback(struct notifier_block *nfb,
|
2005-04-16 15:20:36 -07:00
|
|
|
unsigned long action,
|
|
|
|
void *hcpu)
|
|
|
|
{
|
|
|
|
unsigned int hotcpu = (unsigned long)hcpu;
|
|
|
|
struct workqueue_struct *wq;
|
|
|
|
|
|
|
|
switch (action) {
|
|
|
|
case CPU_UP_PREPARE:
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_lock(&workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
/* Create a new workqueue thread for it. */
|
|
|
|
list_for_each_entry(wq, &workqueues, list) {
|
2006-12-06 21:34:49 -07:00
|
|
|
if (!create_workqueue_thread(wq, hotcpu, 0)) {
|
2005-04-16 15:20:36 -07:00
|
|
|
printk("workqueue for %i failed\n", hotcpu);
|
|
|
|
return NOTIFY_BAD;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
case CPU_ONLINE:
|
|
|
|
/* Kick off worker threads. */
|
|
|
|
list_for_each_entry(wq, &workqueues, list) {
|
2005-10-30 16:01:59 -07:00
|
|
|
struct cpu_workqueue_struct *cwq;
|
|
|
|
|
|
|
|
cwq = per_cpu_ptr(wq->cpu_wq, hotcpu);
|
|
|
|
kthread_bind(cwq->thread, hotcpu);
|
|
|
|
wake_up_process(cwq->thread);
|
2005-04-16 15:20:36 -07:00
|
|
|
}
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_unlock(&workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case CPU_UP_CANCELED:
|
|
|
|
list_for_each_entry(wq, &workqueues, list) {
|
2006-06-25 05:49:10 -07:00
|
|
|
if (!per_cpu_ptr(wq->cpu_wq, hotcpu)->thread)
|
|
|
|
continue;
|
2005-04-16 15:20:36 -07:00
|
|
|
/* Unbind so it can run. */
|
2005-10-30 16:01:59 -07:00
|
|
|
kthread_bind(per_cpu_ptr(wq->cpu_wq, hotcpu)->thread,
|
2005-11-07 01:58:38 -07:00
|
|
|
any_online_cpu(cpu_online_map));
|
2005-04-16 15:20:36 -07:00
|
|
|
cleanup_workqueue_thread(wq, hotcpu);
|
|
|
|
}
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_unlock(&workqueue_mutex);
|
|
|
|
break;
|
|
|
|
|
|
|
|
case CPU_DOWN_PREPARE:
|
|
|
|
mutex_lock(&workqueue_mutex);
|
|
|
|
break;
|
|
|
|
|
|
|
|
case CPU_DOWN_FAILED:
|
|
|
|
mutex_unlock(&workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
break;
|
|
|
|
|
|
|
|
case CPU_DEAD:
|
|
|
|
list_for_each_entry(wq, &workqueues, list)
|
|
|
|
cleanup_workqueue_thread(wq, hotcpu);
|
|
|
|
list_for_each_entry(wq, &workqueues, list)
|
|
|
|
take_over_work(wq, hotcpu);
|
2006-08-13 23:24:26 -07:00
|
|
|
mutex_unlock(&workqueue_mutex);
|
2005-04-16 15:20:36 -07:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
return NOTIFY_OK;
|
|
|
|
}
|
|
|
|
|
|
|
|
void init_workqueues(void)
|
|
|
|
{
|
2006-01-08 02:05:12 -07:00
|
|
|
singlethread_cpu = first_cpu(cpu_possible_map);
|
2005-04-16 15:20:36 -07:00
|
|
|
hotcpu_notifier(workqueue_cpu_callback, 0);
|
|
|
|
keventd_wq = create_workqueue("events");
|
|
|
|
BUG_ON(!keventd_wq);
|
|
|
|
}
|
|
|
|
|