Blame - kernel/workqueue.c - kernel/msm-4.9

blob: c462cd60c3743b58cf4fb15920d50d5fd5f2e23c [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	2	* kernel/workqueue.c - generic async execution with shared worker pool
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	4	* Copyright (C) 2002 Ingo Molnar
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	5	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	6	* Derived from the taskqueue/keventd code by:
				7	* David Woodhouse <dwmw2@infradead.org>
				8	* Andrew Morton
				9	* Kai Petzke <wpp@marie.physik.tu-berlin.de>
				10	* Theodore Ts'o <tytso@mit.edu>
Christoph Lameter	89ada67	2005-10-30 15:01:59 -0800	[diff] [blame]	11	*
Christoph Lameter	cde5353	2008-07-04 09:59:22 -0700	[diff] [blame]	12	* Made to use alloc_percpu by Christoph Lameter.
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	13	*
				14	* Copyright (C) 2010 SUSE Linux Products GmbH
				15	* Copyright (C) 2010 Tejun Heo <tj@kernel.org>
				16	*
				17	* This is the generic async execution mechanism. Work items are
				18	* executed in process context. The worker pool is shared and
				19	* automatically managed. There is one worker pool for each CPU and
				20	* one extra for works which are better served by workers which are
				21	* not bound to any specific CPU.
				22	*
				23	* Please read Documentation/workqueue.txt for details.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	24	*/
				25
Paul Gortmaker	9984de1	2011-05-23 14:51:41 -0400	[diff] [blame]	26	#include <linux/export.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	27	#include <linux/kernel.h>
				28	#include <linux/sched.h>
				29	#include <linux/init.h>
				30	#include <linux/signal.h>
				31	#include <linux/completion.h>
				32	#include <linux/workqueue.h>
				33	#include <linux/slab.h>
				34	#include <linux/cpu.h>
				35	#include <linux/notifier.h>
				36	#include <linux/kthread.h>
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	37	#include <linux/hardirq.h>
Christoph Lameter	4693402	2006-10-11 01:21:26 -0700	[diff] [blame]	38	#include <linux/mempolicy.h>
Rafael J. Wysocki	341a595	2006-12-06 20:34:49 -0800	[diff] [blame]	39	#include <linux/freezer.h>
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	40	#include <linux/kallsyms.h>
				41	#include <linux/debug_locks.h>
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	42	#include <linux/lockdep.h>
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	43	#include <linux/idr.h>
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	44
				45	#include "workqueue_sched.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	46
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	47	enum {
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	48	/*
				49	* global_cwq flags
				50	*
				51	* A bound gcwq is either associated or disassociated with its CPU.
				52	* While associated (!DISASSOCIATED), all workers are bound to the
				53	* CPU and none has %WORKER_UNBOUND set and concurrency management
				54	* is in effect.
				55	*
				56	* While DISASSOCIATED, the cpu may be offline and all workers have
				57	* %WORKER_UNBOUND set and concurrency management disabled, and may
				58	* be executing on any CPU. The gcwq behaves as an unbound one.
				59	*
				60	* Note that DISASSOCIATED can be flipped only while holding
				61	* managership of all pools on the gcwq to avoid changing binding
				62	* state while create_worker() is in progress.
				63	*/
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	64	GCWQ_DISASSOCIATED = 1 << 0, /* cpu can't serve workers */
				65	GCWQ_FREEZING = 1 << 1, /* freeze in progress */
				66
				67	/* pool flags */
				68	POOL_MANAGE_WORKERS = 1 << 0, /* need to manage workers */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	69
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	70	/* worker flags */
				71	WORKER_STARTED = 1 << 0, /* started */
				72	WORKER_DIE = 1 << 1, /* die die die */
				73	WORKER_IDLE = 1 << 2, /* is idle */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	74	WORKER_PREP = 1 << 3, /* preparing to run works */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	75	WORKER_REBIND = 1 << 5, /* mom is home, come back */
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	76	WORKER_CPU_INTENSIVE = 1 << 6, /* cpu intensive */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	77	WORKER_UNBOUND = 1 << 7, /* worker is unbound */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	78
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	79	WORKER_NOT_RUNNING = WORKER_PREP \| WORKER_REBIND \| WORKER_UNBOUND \|
				80	WORKER_CPU_INTENSIVE,
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	81
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	82	NR_WORKER_POOLS = 2, /* # worker pools per gcwq */
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	83
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	84	BUSY_WORKER_HASH_ORDER = 6, /* 64 pointers */
				85	BUSY_WORKER_HASH_SIZE = 1 << BUSY_WORKER_HASH_ORDER,
				86	BUSY_WORKER_HASH_MASK = BUSY_WORKER_HASH_SIZE - 1,
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	87
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	88	MAX_IDLE_WORKERS_RATIO = 4, /* 1/4 of busy can be idle */
				89	IDLE_WORKER_TIMEOUT = 300 * HZ, /* keep idle ones for 5 mins */
				90
Tejun Heo	3233cdb	2011-02-16 18:10:19 +0100	[diff] [blame]	91	MAYDAY_INITIAL_TIMEOUT = HZ / 100 >= 2 ? HZ / 100 : 2,
				92	/* call for help after 10ms
				93	(min two ticks) */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	94	MAYDAY_INTERVAL = HZ / 10, /* and then every 100ms */
				95	CREATE_COOLDOWN = HZ, /* time to breath after fail */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	96
				97	/*
				98	* Rescue workers are used only on emergencies and shared by
				99	* all cpus. Give -20.
				100	*/
				101	RESCUER_NICE_LEVEL = -20,
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	102	HIGHPRI_NICE_LEVEL = -20,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	103	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	104
				105	/*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	106	* Structure fields follow one of the following exclusion rules.
				107	*
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	108	* I: Modifiable by initialization/destruction paths and read-only for
				109	* everyone else.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	110	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	111	* P: Preemption protected. Disabling preemption is enough and should
				112	* only be modified and accessed from the local cpu.
				113	*
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	114	* L: gcwq->lock protected. Access with gcwq->lock held.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	115	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	116	* X: During normal operation, modification requires gcwq->lock and
				117	* should be done only from local cpu. Either disabling preemption
				118	* on local cpu or grabbing gcwq->lock is enough for read access.
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	119	* If GCWQ_DISASSOCIATED is set, it's identical to L.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	120	*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	121	* F: wq->flush_mutex protected.
				122	*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	123	* W: workqueue_lock protected.
				124	*/
				125
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	126	struct global_cwq;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	127	struct worker_pool;
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	128	struct idle_rebind;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	129
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	130	/*
				131	* The poor guys doing the actual heavy lifting. All on-duty workers
				132	* are either serving the manager role, on idle list or on busy hash.
				133	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	134	struct worker {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	135	/* on idle list while idle, on busy hash table while busy */
				136	union {
				137	struct list_head entry; /* L: while idle */
				138	struct hlist_node hentry; /* L: while busy */
				139	};
				140
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	141	struct work_struct current_work; / L: work being processed */
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	142	struct cpu_workqueue_struct current_cwq; / L: current_work's cwq */
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	143	struct list_head scheduled; /* L: scheduled works */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	144	struct task_struct task; / I: worker task */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	145	struct worker_pool pool; / I: the associated pool */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	146	/* 64 bytes boundary on 64bit, 32 on 32bit */
				147	unsigned long last_active; /* L: last active timestamp */
				148	unsigned int flags; /* X: flags */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	149	int id; /* I: worker id */
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	150
				151	/* for rebinding worker to CPU */
				152	struct idle_rebind idle_rebind; / L: for idle worker */
				153	struct work_struct rebind_work; /* L: for busy worker */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	154	};
				155
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	156	struct worker_pool {
				157	struct global_cwq gcwq; / I: the owning gcwq */
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	158	unsigned int flags; /* X: flags */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	159
				160	struct list_head worklist; /* L: list of pending works */
				161	int nr_workers; /* L: total number of workers */
				162	int nr_idle; /* L: currently idle ones */
				163
				164	struct list_head idle_list; /* X: list of idle workers */
				165	struct timer_list idle_timer; /* L: worker idle timeout */
				166	struct timer_list mayday_timer; /* L: SOS timer for workers */
				167
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	168	struct mutex manager_mutex; /* mutex manager should hold */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	169	struct ida worker_ida; /* L: for worker IDs */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	170	};
				171
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	172	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	173	* Global per-cpu workqueue. There's one and only one for each cpu
				174	* and all works are queued and processed here regardless of their
				175	* target workqueues.
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	176	*/
				177	struct global_cwq {
				178	spinlock_t lock; /* the gcwq lock */
				179	unsigned int cpu; /* I: the associated cpu */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	180	unsigned int flags; /* L: GCWQ_* flags */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	181
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	182	/* workers are chained either in busy_hash or pool idle_list */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	183	struct hlist_head busy_hash[BUSY_WORKER_HASH_SIZE];
				184	/* L: hash of busy workers */
				185
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	186	struct worker_pool pools[2]; /* normal and highpri pools */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	187
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	188	wait_queue_head_t rebind_hold; /* rebind hold wait */
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	189	} ____cacheline_aligned_in_smp;
				190
				191	/*
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	192	* The per-CPU workqueue. The lower WORK_STRUCT_FLAG_BITS of
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	193	* work_struct->data are used for flags and thus cwqs need to be
				194	* aligned at two's power of the number of flag bits.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	195	*/
				196	struct cpu_workqueue_struct {
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	197	struct worker_pool pool; / I: the associated pool */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	198	struct workqueue_struct wq; / I: the owning workqueue */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	199	int work_color; /* L: current color */
				200	int flush_color; /* L: flushing color */
				201	int nr_in_flight[WORK_NR_COLORS];
				202	/* L: nr of in_flight works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	203	int nr_active; /* L: nr of active works */
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	204	int max_active; /* L: max active works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	205	struct list_head delayed_works; /* L: delayed works */
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	206	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	207
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	208	/*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	209	* Structure used to wait for workqueue flush.
				210	*/
				211	struct wq_flusher {
				212	struct list_head list; /* F: list of flushers */
				213	int flush_color; /* F: flush color waiting for */
				214	struct completion done; /* flush completion */
				215	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	216
/*
 * All cpumasks are assumed to be always set on UP and thus can't be
 * used to determine whether there's something to be done.
 *
 * The mayday mask is therefore a cpumask_var_t on SMP and a plain
 * unsigned long of which only bit 0 is used otherwise.
 */
#ifdef CONFIG_SMP
typedef cpumask_var_t mayday_mask_t;
#define mayday_test_and_set_cpu(cpu, mask)	cpumask_test_and_set_cpu((cpu), (mask))
#define mayday_clear_cpu(cpu, mask)		cpumask_clear_cpu((cpu), (mask))
#define for_each_mayday_cpu(cpu, mask)		for_each_cpu((cpu), (mask))
#define alloc_mayday_mask(maskp, gfp)		zalloc_cpumask_var((maskp), (gfp))
#define free_mayday_mask(mask)			free_cpumask_var((mask))
#else	/* !CONFIG_SMP */
typedef unsigned long mayday_mask_t;
#define mayday_test_and_set_cpu(cpu, mask)	test_and_set_bit(0, &(mask))
#define mayday_clear_cpu(cpu, mask)		clear_bit(0, &(mask))
/* single pass with cpu forced to 0, taken only when the mask is non-zero */
#define for_each_mayday_cpu(cpu, mask)		if ((cpu) = 0, (mask))
#define alloc_mayday_mask(maskp, gfp)		true
#define free_mayday_mask(mask)			do { } while (0)
#endif	/* CONFIG_SMP */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	237
				238	/*
				239	* The externally visible workqueue abstraction is an array of
				240	* per-CPU workqueues:
				241	*/
				242	struct workqueue_struct {
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	243	unsigned int flags; /* W: WQ_* flags */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	244	union {
				245	struct cpu_workqueue_struct __percpu *pcpu;
				246	struct cpu_workqueue_struct *single;
				247	unsigned long v;
				248	} cpu_wq; /* I: cwq's */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	249	struct list_head list; /* W: list of all workqueues */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	250
				251	struct mutex flush_mutex; /* protects wq flushing */
				252	int work_color; /* F: current work color */
				253	int flush_color; /* F: current flush color */
				254	atomic_t nr_cwqs_to_flush; /* flush in progress */
				255	struct wq_flusher first_flusher; / F: first flusher */
				256	struct list_head flusher_queue; /* F: flush waiters */
				257	struct list_head flusher_overflow; /* F: flush overflow list */
				258
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	259	mayday_mask_t mayday_mask; /* cpus requesting rescue */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	260	struct worker rescuer; / I: rescue worker */
				261
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	262	int nr_drainers; /* W: drain in progress */
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	263	int saved_max_active; /* W: saved cwq max_active */
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	264	#ifdef CONFIG_LOCKDEP
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	265	struct lockdep_map lockdep_map;
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	266	#endif
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	267	char name[]; /* I: workqueue name */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	268	};
				269
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	270	struct workqueue_struct *system_wq __read_mostly;
				271	struct workqueue_struct *system_long_wq __read_mostly;
				272	struct workqueue_struct *system_nrt_wq __read_mostly;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	273	struct workqueue_struct *system_unbound_wq __read_mostly;
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	274	struct workqueue_struct *system_freezable_wq __read_mostly;
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	275	struct workqueue_struct *system_nrt_freezable_wq __read_mostly;
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	276	EXPORT_SYMBOL_GPL(system_wq);
				277	EXPORT_SYMBOL_GPL(system_long_wq);
				278	EXPORT_SYMBOL_GPL(system_nrt_wq);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	279	EXPORT_SYMBOL_GPL(system_unbound_wq);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	280	EXPORT_SYMBOL_GPL(system_freezable_wq);
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	281	EXPORT_SYMBOL_GPL(system_nrt_freezable_wq);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	282
Tejun Heo	97bd234	2010-10-05 10:41:14 +0200	[diff] [blame]	283	#define CREATE_TRACE_POINTS
				284	#include <trace/events/workqueue.h>
				285
/* Walk @pool over every element of @gcwq->pools[], in index order. */
#define for_each_worker_pool(pool, gcwq)				\
	for ((pool) = (gcwq)->pools;					\
	     (pool) < (gcwq)->pools + NR_WORKER_POOLS;			\
	     (pool)++)
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	289
/*
 * Visit every worker hashed in @gcwq->busy_hash[].  @i is the bucket
 * index and @pos the hlist cursor handed to hlist_for_each_entry().
 * @i and @gcwq are parenthesized so that expression arguments expand
 * safely.
 */
#define for_each_busy_worker(worker, i, pos, gcwq)			\
	for ((i) = 0; (i) < BUSY_WORKER_HASH_SIZE; (i)++)		\
		hlist_for_each_entry(worker, pos,			\
				     &(gcwq)->busy_hash[(i)], hentry)
				293
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	294	static inline int __next_gcwq_cpu(int cpu, const struct cpumask *mask,
				295	unsigned int sw)
				296	{
				297	if (cpu < nr_cpu_ids) {
				298	if (sw & 1) {
				299	cpu = cpumask_next(cpu, mask);
				300	if (cpu < nr_cpu_ids)
				301	return cpu;
				302	}
				303	if (sw & 2)
				304	return WORK_CPU_UNBOUND;
				305	}
				306	return WORK_CPU_NONE;
				307	}
				308
				309	static inline int __next_wq_cpu(int cpu, const struct cpumask *mask,
				310	struct workqueue_struct *wq)
				311	{
				312	return __next_gcwq_cpu(cpu, mask, !(wq->flags & WQ_UNBOUND) ? 1 : 2);
				313	}
				314
/*
 * CPU iterators
 *
 * An extra gcwq is defined for an invalid cpu number
 * (WORK_CPU_UNBOUND) to host workqueues which are not bound to any
 * specific CPU.  The following iterators are similar to
 * for_each_*_cpu() iterators but also consider the unbound gcwq.
 *
 * for_each_gcwq_cpu()		: possible CPUs + WORK_CPU_UNBOUND
 * for_each_online_gcwq_cpu()	: online CPUs + WORK_CPU_UNBOUND
 * for_each_cwq_cpu()		: possible CPUs for bound workqueues,
 *				  WORK_CPU_UNBOUND for unbound workqueues
 *
 * All three start from -1 and stop once the step function returns
 * WORK_CPU_NONE.
 */
#define for_each_gcwq_cpu(cpu)						\
	for ((cpu) = __next_gcwq_cpu(-1, cpu_possible_mask, 3);	\
	     (cpu) < WORK_CPU_NONE;					\
	     (cpu) = __next_gcwq_cpu((cpu), cpu_possible_mask, 3))

#define for_each_online_gcwq_cpu(cpu)					\
	for ((cpu) = __next_gcwq_cpu(-1, cpu_online_mask, 3);		\
	     (cpu) < WORK_CPU_NONE;					\
	     (cpu) = __next_gcwq_cpu((cpu), cpu_online_mask, 3))

#define for_each_cwq_cpu(cpu, wq)					\
	for ((cpu) = __next_wq_cpu(-1, cpu_possible_mask, (wq));	\
	     (cpu) < WORK_CPU_NONE;					\
	     (cpu) = __next_wq_cpu((cpu), cpu_possible_mask, (wq)))
				342
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	343	#ifdef CONFIG_DEBUG_OBJECTS_WORK
				344
				345	static struct debug_obj_descr work_debug_descr;
				346
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	347	static void work_debug_hint(void addr)
				348	{
				349	return ((struct work_struct *) addr)->func;
				350	}
				351
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	352	/*
				353	* fixup_init is called when:
				354	* - an active object is initialized
				355	*/
				356	static int work_fixup_init(void *addr, enum debug_obj_state state)
				357	{
				358	struct work_struct *work = addr;
				359
				360	switch (state) {
				361	case ODEBUG_STATE_ACTIVE:
				362	cancel_work_sync(work);
				363	debug_object_init(work, &work_debug_descr);
				364	return 1;
				365	default:
				366	return 0;
				367	}
				368	}
				369
				370	/*
				371	* fixup_activate is called when:
				372	* - an active object is activated
				373	* - an unknown object is activated (might be a statically initialized object)
				374	*/
				375	static int work_fixup_activate(void *addr, enum debug_obj_state state)
				376	{
				377	struct work_struct *work = addr;
				378
				379	switch (state) {
				380
				381	case ODEBUG_STATE_NOTAVAILABLE:
				382	/*
				383	* This is not really a fixup. The work struct was
				384	* statically initialized. We just make sure that it
				385	* is tracked in the object tracker.
				386	*/
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	387	if (test_bit(WORK_STRUCT_STATIC_BIT, work_data_bits(work))) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	388	debug_object_init(work, &work_debug_descr);
				389	debug_object_activate(work, &work_debug_descr);
				390	return 0;
				391	}
				392	WARN_ON_ONCE(1);
				393	return 0;
				394
				395	case ODEBUG_STATE_ACTIVE:
				396	WARN_ON(1);
				397
				398	default:
				399	return 0;
				400	}
				401	}
				402
				403	/*
				404	* fixup_free is called when:
				405	* - an active object is freed
				406	*/
				407	static int work_fixup_free(void *addr, enum debug_obj_state state)
				408	{
				409	struct work_struct *work = addr;
				410
				411	switch (state) {
				412	case ODEBUG_STATE_ACTIVE:
				413	cancel_work_sync(work);
				414	debug_object_free(work, &work_debug_descr);
				415	return 1;
				416	default:
				417	return 0;
				418	}
				419	}
				420
				421	static struct debug_obj_descr work_debug_descr = {
				422	.name = "work_struct",
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	423	.debug_hint = work_debug_hint,
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	424	.fixup_init = work_fixup_init,
				425	.fixup_activate = work_fixup_activate,
				426	.fixup_free = work_fixup_free,
				427	};
				428
				429	static inline void debug_work_activate(struct work_struct *work)
				430	{
				431	debug_object_activate(work, &work_debug_descr);
				432	}
				433
				434	static inline void debug_work_deactivate(struct work_struct *work)
				435	{
				436	debug_object_deactivate(work, &work_debug_descr);
				437	}
				438
				439	void __init_work(struct work_struct *work, int onstack)
				440	{
				441	if (onstack)
				442	debug_object_init_on_stack(work, &work_debug_descr);
				443	else
				444	debug_object_init(work, &work_debug_descr);
				445	}
				446	EXPORT_SYMBOL_GPL(__init_work);
				447
				448	void destroy_work_on_stack(struct work_struct *work)
				449	{
				450	debug_object_free(work, &work_debug_descr);
				451	}
				452	EXPORT_SYMBOL_GPL(destroy_work_on_stack);
				453
				454	#else
				455	static inline void debug_work_activate(struct work_struct *work) { }
				456	static inline void debug_work_deactivate(struct work_struct *work) { }
				457	#endif
				458
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	459	/* Serializes the accesses to the list of workqueues. */
				460	static DEFINE_SPINLOCK(workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	461	static LIST_HEAD(workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	462	static bool workqueue_freezing; /* W: have wqs started freezing? */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	463
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	464	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	465	* The almighty global cpu workqueues. nr_running is the only field
				466	* which is expected to be used frequently by other cpus via
				467	* try_to_wake_up(). Put it in a separate cacheline.
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	468	*/
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	469	static DEFINE_PER_CPU(struct global_cwq, global_cwq);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	470	static DEFINE_PER_CPU_SHARED_ALIGNED(atomic_t, pool_nr_running[NR_WORKER_POOLS]);
Nathan Lynch	f756d5e	2006-01-08 01:05:12 -0800	[diff] [blame]	471
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	472	/*
				473	* Global cpu workqueue and nr_running counter for unbound gcwq. The
				474	* gcwq is always online, has GCWQ_DISASSOCIATED set, and all its
				475	* workers have WORKER_UNBOUND set.
				476	*/
				477	static struct global_cwq unbound_global_cwq;
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	478	static atomic_t unbound_pool_nr_running[NR_WORKER_POOLS] = {
				479	[0 ... NR_WORKER_POOLS - 1] = ATOMIC_INIT(0), /* always 0 */
				480	};
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	481
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	482	static int worker_thread(void *__worker);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	483
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	484	static int worker_pool_pri(struct worker_pool *pool)
				485	{
				486	return pool - pool->gcwq->pools;
				487	}
				488
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	489	static struct global_cwq *get_gcwq(unsigned int cpu)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	490	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	491	if (cpu != WORK_CPU_UNBOUND)
				492	return &per_cpu(global_cwq, cpu);
				493	else
				494	return &unbound_global_cwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	495	}
				496
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	497	static atomic_t get_pool_nr_running(struct worker_pool pool)
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	498	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	499	int cpu = pool->gcwq->cpu;
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	500	int idx = worker_pool_pri(pool);
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	501
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	502	if (cpu != WORK_CPU_UNBOUND)
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	503	return &per_cpu(pool_nr_running, cpu)[idx];
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	504	else
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	505	return &unbound_pool_nr_running[idx];
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	506	}
				507
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	508	static struct cpu_workqueue_struct *get_cwq(unsigned int cpu,
				509	struct workqueue_struct *wq)
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	510	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	511	if (!(wq->flags & WQ_UNBOUND)) {
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	512	if (likely(cpu < nr_cpu_ids))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	513	return per_cpu_ptr(wq->cpu_wq.pcpu, cpu);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	514	} else if (likely(cpu == WORK_CPU_UNBOUND))
				515	return wq->cpu_wq.single;
				516	return NULL;
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	517	}
				518
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	519	static unsigned int work_color_to_flags(int color)
				520	{
				521	return color << WORK_STRUCT_COLOR_SHIFT;
				522	}
				523
				524	static int get_work_color(struct work_struct *work)
				525	{
				526	return (*work_data_bits(work) >> WORK_STRUCT_COLOR_SHIFT) &
				527	((1 << WORK_STRUCT_COLOR_BITS) - 1);
				528	}
				529
				530	static int work_next_color(int color)
				531	{
				532	return (color + 1) % WORK_NR_COLORS;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	533	}
				534
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	535	/*
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	536	* A work's data points to the cwq with WORK_STRUCT_CWQ set while the
				537	* work is on queue. Once execution starts, WORK_STRUCT_CWQ is
				538	* cleared and the work data contains the cpu number it was last on.
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	539	*
				540	* set_work_{cwq|cpu}() and clear_work_data() can be used to set the
				541	* cwq, cpu or clear work->data. These functions should only be
				542	* called while the work is owned - ie. while the PENDING bit is set.
				543	*
				544	* get_work_[g]cwq() can be used to obtain the gcwq or cwq
				545	* corresponding to a work. gcwq is available once the work has been
				546	* queued anywhere after initialization. cwq is available only from
				547	* queueing until execution starts.
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	548	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	549	static inline void set_work_data(struct work_struct *work, unsigned long data,
				550	unsigned long flags)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	551	{
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	552	BUG_ON(!work_pending(work));
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	553	atomic_long_set(&work->data, data \| flags \| work_static(work));
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	554	}
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	555
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	556	static void set_work_cwq(struct work_struct *work,
				557	struct cpu_workqueue_struct *cwq,
				558	unsigned long extra_flags)
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	559	{
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	560	set_work_data(work, (unsigned long)cwq,
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	561	WORK_STRUCT_PENDING \| WORK_STRUCT_CWQ \| extra_flags);
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	562	}
				563
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	564	static void set_work_cpu(struct work_struct *work, unsigned int cpu)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	565	{
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	566	set_work_data(work, cpu << WORK_STRUCT_FLAG_BITS, WORK_STRUCT_PENDING);
				567	}
				568
				569	static void clear_work_data(struct work_struct *work)
				570	{
				571	set_work_data(work, WORK_STRUCT_NO_CPU, 0);
				572	}
				573
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	574	static struct cpu_workqueue_struct get_work_cwq(struct work_struct work)
				575	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	576	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	577
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	578	if (data & WORK_STRUCT_CWQ)
				579	return (void *)(data & WORK_STRUCT_WQ_DATA_MASK);
				580	else
				581	return NULL;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	582	}
				583
				584	static struct global_cwq get_work_gcwq(struct work_struct work)
				585	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	586	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	587	unsigned int cpu;
				588
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	589	if (data & WORK_STRUCT_CWQ)
				590	return ((struct cpu_workqueue_struct *)
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	591	(data & WORK_STRUCT_WQ_DATA_MASK))->pool->gcwq;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	592
				593	cpu = data >> WORK_STRUCT_FLAG_BITS;
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	594	if (cpu == WORK_CPU_NONE)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	595	return NULL;
				596
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	597	BUG_ON(cpu >= nr_cpu_ids && cpu != WORK_CPU_UNBOUND);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	598	return get_gcwq(cpu);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	599	}
				600
				601	/*
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	602	* Policy functions. These define the policies on how the global worker
				603	* pools are managed. Unless noted otherwise, these functions assume that
				604	* they're being called with gcwq->lock held.
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	605	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	606
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	607	static bool __need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	608	{
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	609	return !atomic_read(get_pool_nr_running(pool));
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	610	}
				611
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	612	/*
				613	* Need to wake up a worker? Called from anything but currently
				614	* running workers.
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	615	*
				616	* Note that, because unbound workers never contribute to nr_running, this
				617	* function will always return %true for unbound gcwq as long as the
				618	* worklist isn't empty.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	619	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	620	static bool need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	621	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	622	return !list_empty(&pool->worklist) && __need_more_worker(pool);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	623	}
				624
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	625	/* Can I start working? Called from busy but !running workers. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	626	static bool may_start_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	627	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	628	return pool->nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	629	}
				630
				631	/* Do I need to keep working? Called from currently running workers. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	632	static bool keep_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	633	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	634	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	635
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	636	return !list_empty(&pool->worklist) && atomic_read(nr_running) <= 1;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	637	}
				638
				639	/* Do we need a new worker? Called from manager. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	640	static bool need_to_create_worker(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	641	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	642	return need_more_worker(pool) && !may_start_working(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	643	}
				644
				645	/* Do I need to be the manager? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	646	static bool need_to_manage_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	647	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	648	return need_to_create_worker(pool) \|\|
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	649	(pool->flags & POOL_MANAGE_WORKERS);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	650	}
				651
				652	/* Do we have too many workers and should some go away? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	653	static bool too_many_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	654	{
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	655	bool managing = mutex_is_locked(&pool->manager_mutex);
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	656	int nr_idle = pool->nr_idle + managing; /* manager is considered idle */
				657	int nr_busy = pool->nr_workers - nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	658
				659	return nr_idle > 2 && (nr_idle - 2) * MAX_IDLE_WORKERS_RATIO >= nr_busy;
				660	}
				661
				662	/*
				663	* Wake up functions.
				664	*/
				665
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	666	/* Return the first worker. Safe with preemption disabled */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	667	static struct worker first_worker(struct worker_pool pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	668	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	669	if (unlikely(list_empty(&pool->idle_list)))
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	670	return NULL;
				671
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	672	return list_first_entry(&pool->idle_list, struct worker, entry);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	673	}
				674
				675	/**
				676	* wake_up_worker - wake up an idle worker
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	677	* @pool: worker pool to wake worker from
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	678	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	679	* Wake up the first idle worker of @pool.
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	680	*
				681	* CONTEXT:
				682	* spin_lock_irq(gcwq->lock).
				683	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	684	static void wake_up_worker(struct worker_pool *pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	685	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	686	struct worker *worker = first_worker(pool);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	687
				688	if (likely(worker))
				689	wake_up_process(worker->task);
				690	}
				691
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	692	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	693	* wq_worker_waking_up - a worker is waking up
				694	* @task: task waking up
				695	* @cpu: CPU @task is waking up to
				696	*
				697	* This function is called during try_to_wake_up() when a worker is
				698	* being awoken.
				699	*
				700	* CONTEXT:
				701	* spin_lock_irq(rq->lock)
				702	*/
				703	void wq_worker_waking_up(struct task_struct *task, unsigned int cpu)
				704	{
				705	struct worker *worker = kthread_data(task);
				706
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	707	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	708	atomic_inc(get_pool_nr_running(worker->pool));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	709	}
				710
				711	/**
				712	* wq_worker_sleeping - a worker is going to sleep
				713	* @task: task going to sleep
				714	* @cpu: CPU in question, must be the current CPU number
				715	*
				716	* This function is called during schedule() when a busy worker is
				717	* going to sleep. Worker on the same cpu can be woken up by
				718	* returning pointer to its task.
				719	*
				720	* CONTEXT:
				721	* spin_lock_irq(rq->lock)
				722	*
				723	* RETURNS:
				724	* Worker task on @cpu to wake up, %NULL if none.
				725	*/
				726	struct task_struct wq_worker_sleeping(struct task_struct task,
				727	unsigned int cpu)
				728	{
				729	struct worker worker = kthread_data(task), to_wakeup = NULL;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	730	struct worker_pool *pool = worker->pool;
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	731	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	732
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	733	if (worker->flags & WORKER_NOT_RUNNING)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	734	return NULL;
				735
				736	/* this can only happen on the local cpu */
				737	BUG_ON(cpu != raw_smp_processor_id());
				738
				739	/*
				740	* The counterpart of the following dec_and_test, implied mb,
				741	* worklist not empty test sequence is in insert_work().
				742	* Please read comment there.
				743	*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	744	* NOT_RUNNING is clear. This means that we're bound to and
				745	* running on the local cpu w/ rq lock held and preemption
				746	* disabled, which in turn means that none else could be
				747	* manipulating idle_list, so dereferencing idle_list without gcwq
				748	* lock is safe.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	749	*/
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	750	if (atomic_dec_and_test(nr_running) && !list_empty(&pool->worklist))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	751	to_wakeup = first_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	752	return to_wakeup ? to_wakeup->task : NULL;
				753	}
				754
				755	/**
				756	* worker_set_flags - set worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	757	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	758	* @flags: flags to set
				759	* @wakeup: wakeup an idle worker if necessary
				760	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	761	* Set @flags in @worker->flags and adjust nr_running accordingly. If
				762	* nr_running becomes zero and @wakeup is %true, an idle worker is
				763	* woken up.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	764	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	765	* CONTEXT:
				766	* spin_lock_irq(gcwq->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	767	*/
				768	static inline void worker_set_flags(struct worker *worker, unsigned int flags,
				769	bool wakeup)
				770	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	771	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	772
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	773	WARN_ON_ONCE(worker->task != current);
				774
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	775	/*
				776	* If transitioning into NOT_RUNNING, adjust nr_running and
				777	* wake up an idle worker as necessary if requested by
				778	* @wakeup.
				779	*/
				780	if ((flags & WORKER_NOT_RUNNING) &&
				781	!(worker->flags & WORKER_NOT_RUNNING)) {
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	782	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	783
				784	if (wakeup) {
				785	if (atomic_dec_and_test(nr_running) &&
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	786	!list_empty(&pool->worklist))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	787	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	788	} else
				789	atomic_dec(nr_running);
				790	}
				791
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	792	worker->flags \|= flags;
				793	}
				794
				795	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	796	* worker_clr_flags - clear worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	797	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	798	* @flags: flags to clear
				799	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	800	* Clear @flags in @worker->flags and adjust nr_running accordingly.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	801	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	802	* CONTEXT:
				803	* spin_lock_irq(gcwq->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	804	*/
				805	static inline void worker_clr_flags(struct worker *worker, unsigned int flags)
				806	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	807	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	808	unsigned int oflags = worker->flags;
				809
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	810	WARN_ON_ONCE(worker->task != current);
				811
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	812	worker->flags &= ~flags;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	813
Tejun Heo	42c025f	2011-01-11 15:58:49 +0100	[diff] [blame]	814	/*
				815	* If transitioning out of NOT_RUNNING, increment nr_running. Note
				816	* that the nested NOT_RUNNING is not a noop. NOT_RUNNING is mask
				817	* of multiple flags, not a single flag.
				818	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	819	if ((flags & WORKER_NOT_RUNNING) && (oflags & WORKER_NOT_RUNNING))
				820	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	821	atomic_inc(get_pool_nr_running(pool));
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	822	}
				823
				824	/**
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	825	* busy_worker_head - return the busy hash head for a work
				826	* @gcwq: gcwq of interest
				827	* @work: work to be hashed
				828	*
				829	* Return hash head of @gcwq for @work.
				830	*
				831	* CONTEXT:
				832	* spin_lock_irq(gcwq->lock).
				833	*
				834	* RETURNS:
				835	* Pointer to the hash head.
				836	*/
				837	static struct hlist_head busy_worker_head(struct global_cwq gcwq,
				838	struct work_struct *work)
				839	{
				840	const int base_shift = ilog2(sizeof(struct work_struct));
				841	unsigned long v = (unsigned long)work;
				842
				843	/* simple shift and fold hash, do we need something better? */
				844	v >>= base_shift;
				845	v += v >> BUSY_WORKER_HASH_ORDER;
				846	v &= BUSY_WORKER_HASH_MASK;
				847
				848	return &gcwq->busy_hash[v];
				849	}
				850
				851	/**
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	852	* __find_worker_executing_work - find worker which is executing a work
				853	* @gcwq: gcwq of interest
				854	* @bwh: hash head as returned by busy_worker_head()
				855	* @work: work to find worker for
				856	*
				857	* Find a worker which is executing @work on @gcwq. @bwh should be
				858	* the hash head obtained by calling busy_worker_head() with the same
				859	* work.
				860	*
				861	* CONTEXT:
				862	* spin_lock_irq(gcwq->lock).
				863	*
				864	* RETURNS:
				865	* Pointer to worker which is executing @work if found, NULL
				866	* otherwise.
				867	*/
				868	static struct worker __find_worker_executing_work(struct global_cwq gcwq,
				869	struct hlist_head *bwh,
				870	struct work_struct *work)
				871	{
				872	struct worker *worker;
				873	struct hlist_node *tmp;
				874
				875	hlist_for_each_entry(worker, tmp, bwh, hentry)
				876	if (worker->current_work == work)
				877	return worker;
				878	return NULL;
				879	}
				880
				881	/**
				882	* find_worker_executing_work - find worker which is executing a work
				883	* @gcwq: gcwq of interest
				884	* @work: work to find worker for
				885	*
				886	* Find a worker which is executing @work on @gcwq. This function is
				887	* identical to __find_worker_executing_work() except that this
				888	* function calculates @bwh itself.
				889	*
				890	* CONTEXT:
				891	* spin_lock_irq(gcwq->lock).
				892	*
				893	* RETURNS:
				894	* Pointer to worker which is executing @work if found, NULL
				895	* otherwise.
				896	*/
				897	static struct worker find_worker_executing_work(struct global_cwq gcwq,
				898	struct work_struct *work)
				899	{
				900	return __find_worker_executing_work(gcwq, busy_worker_head(gcwq, work),
				901	work);
				902	}
				903
				904	/**
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	905	* insert_work - insert a work into gcwq
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	906	* @cwq: cwq @work belongs to
				907	* @work: work to insert
				908	* @head: insertion point
				909	* @extra_flags: extra WORK_STRUCT_* flags to set
				910	*
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	911	* Insert @work which belongs to @cwq into @gcwq after @head.
				912	* @extra_flags is or'd to work_struct flags.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	913	*
				914	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	915	* spin_lock_irq(gcwq->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	916	*/
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	917	static void insert_work(struct cpu_workqueue_struct *cwq,
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	918	struct work_struct work, struct list_head head,
				919	unsigned int extra_flags)
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	920	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	921	struct worker_pool *pool = cwq->pool;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	922
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	923	/* we own @work, set data and link */
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	924	set_work_cwq(work, cwq, extra_flags);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	925
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	926	/*
				927	* Ensure that we get the right work->data if we see the
				928	* result of list_add() below, see try_to_grab_pending().
				929	*/
				930	smp_wmb();
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	931
Oleg Nesterov	1a4d9b0	2008-07-25 01:47:47 -0700	[diff] [blame]	932	list_add_tail(&work->entry, head);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	933
				934	/*
				935	* Ensure either worker_sched_deactivated() sees the above
				936	* list_add_tail() or we see zero nr_running to avoid workers
				937	* lying around lazily while there are works to be processed.
				938	*/
				939	smp_mb();
				940
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	941	if (__need_more_worker(pool))
				942	wake_up_worker(pool);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	943	}
				944
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	945	/*
				946	* Test whether @work is being queued from another work executing on the
				947	* same workqueue. This is rather expensive and should only be used from
				948	* cold paths.
				949	*/
				950	static bool is_chained_work(struct workqueue_struct *wq)
				951	{
				952	unsigned long flags;
				953	unsigned int cpu;
				954
				955	for_each_gcwq_cpu(cpu) {
				956	struct global_cwq *gcwq = get_gcwq(cpu);
				957	struct worker *worker;
				958	struct hlist_node *pos;
				959	int i;
				960
				961	spin_lock_irqsave(&gcwq->lock, flags);
				962	for_each_busy_worker(worker, i, pos, gcwq) {
				963	if (worker->task != current)
				964	continue;
				965	spin_unlock_irqrestore(&gcwq->lock, flags);
				966	/*
				967	* I'm @worker, no locking necessary. See if @work
				968	* is headed to the same workqueue.
				969	*/
				970	return worker->current_cwq->wq == wq;
				971	}
				972	spin_unlock_irqrestore(&gcwq->lock, flags);
				973	}
				974	return false;
				975	}
				976
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	977	static void __queue_work(unsigned int cpu, struct workqueue_struct *wq,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	978	struct work_struct *work)
				979	{
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	980	struct global_cwq *gcwq;
				981	struct cpu_workqueue_struct *cwq;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	982	struct list_head *worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	983	unsigned int work_flags;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	984	unsigned long flags;
				985
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	986	debug_work_activate(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	987
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	988	/* if dying, only works from the same workqueue are allowed */
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	989	if (unlikely(wq->flags & WQ_DRAINING) &&
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	990	WARN_ON_ONCE(!is_chained_work(wq)))
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	991	return;
				992
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	993	/* determine gcwq to use */
				994	if (!(wq->flags & WQ_UNBOUND)) {
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	995	struct global_cwq *last_gcwq;
				996
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	997	if (unlikely(cpu == WORK_CPU_UNBOUND))
				998	cpu = raw_smp_processor_id();
				999
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1000	/*
				1001	* It's multi cpu. If @wq is non-reentrant and @work
				1002	* was previously on a different cpu, it might still
				1003	* be running there, in which case the work needs to
				1004	* be queued on that cpu to guarantee non-reentrance.
				1005	*/
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1006	gcwq = get_gcwq(cpu);
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1007	if (wq->flags & WQ_NON_REENTRANT &&
				1008	(last_gcwq = get_work_gcwq(work)) && last_gcwq != gcwq) {
				1009	struct worker *worker;
				1010
				1011	spin_lock_irqsave(&last_gcwq->lock, flags);
				1012
				1013	worker = find_worker_executing_work(last_gcwq, work);
				1014
				1015	if (worker && worker->current_cwq->wq == wq)
				1016	gcwq = last_gcwq;
				1017	else {
				1018	/* meh... not running there, queue here */
				1019	spin_unlock_irqrestore(&last_gcwq->lock, flags);
				1020	spin_lock_irqsave(&gcwq->lock, flags);
				1021	}
				1022	} else
				1023	spin_lock_irqsave(&gcwq->lock, flags);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1024	} else {
				1025	gcwq = get_gcwq(WORK_CPU_UNBOUND);
				1026	spin_lock_irqsave(&gcwq->lock, flags);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1027	}
				1028
				1029	/* gcwq determined, get cwq and queue */
				1030	cwq = get_cwq(gcwq->cpu, wq);
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1031	trace_workqueue_queue_work(cpu, cwq, work);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1032
Dan Carpenter	f5b2552	2012-04-13 22:06:58 +0300	[diff] [blame]	1033	if (WARN_ON(!list_empty(&work->entry))) {
				1034	spin_unlock_irqrestore(&gcwq->lock, flags);
				1035	return;
				1036	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1037
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1038	cwq->nr_in_flight[cwq->work_color]++;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1039	work_flags = work_color_to_flags(cwq->work_color);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1040
				1041	if (likely(cwq->nr_active < cwq->max_active)) {
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1042	trace_workqueue_activate_work(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1043	cwq->nr_active++;
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1044	worklist = &cwq->pool->worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1045	} else {
				1046	work_flags \|= WORK_STRUCT_DELAYED;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1047	worklist = &cwq->delayed_works;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1048	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1049
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1050	insert_work(cwq, work, worklist, work_flags);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1051
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1052	spin_unlock_irqrestore(&gcwq->lock, flags);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1053	}
				1054
/**
 * queue_work - queue work on a workqueue
 * @wq: workqueue to use
 * @work: work to queue
 *
 * Returns 0 if @work was already on a queue, non-zero otherwise.
 *
 * We queue the work to the CPU on which it was submitted, but if the CPU dies
 * it can be processed by another CPU.
 */
int queue_work(struct workqueue_struct *wq, struct work_struct *work)
{
	int ret;

	/* queue on the cpu reported by get_cpu(); the matching put_cpu() follows */
	ret = queue_work_on(get_cpu(), wq, work);
	put_cpu();

	return ret;
}
EXPORT_SYMBOL_GPL(queue_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1075
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1076	/**
				1077	* queue_work_on - queue work on specific cpu
				1078	* @cpu: CPU number to execute work on
				1079	* @wq: workqueue to use
				1080	* @work: work to queue
				1081	*
				1082	* Returns 0 if @work was already on a queue, non-zero otherwise.
				1083	*
				1084	* We queue the work to a specific CPU, the caller must ensure it
				1085	* can't go away.
				1086	*/
				1087	int
				1088	queue_work_on(int cpu, struct workqueue_struct wq, struct work_struct work)
				1089	{
				1090	int ret = 0;
				1091
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1092	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1093	__queue_work(cpu, wq, work);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1094	ret = 1;
				1095	}
				1096	return ret;
				1097	}
				1098	EXPORT_SYMBOL_GPL(queue_work_on);
				1099
Li Zefan	6d141c3	2008-02-08 04:21:09 -0800	[diff] [blame]	1100	static void delayed_work_timer_fn(unsigned long __data)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1101	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1102	struct delayed_work dwork = (struct delayed_work )__data;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1103	struct cpu_workqueue_struct *cwq = get_work_cwq(&dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1104
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1105	__queue_work(smp_processor_id(), cwq->wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1106	}
				1107
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1108	/**
				1109	* queue_delayed_work - queue work on a workqueue after delay
				1110	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1111	* @dwork: delayable work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1112	* @delay: number of jiffies to wait before queueing
				1113	*
Alan Stern	057647f	2006-10-28 10:38:58 -0700	[diff] [blame]	1114	* Returns 0 if @work was already on a queue, non-zero otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1115	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	1116	int queue_delayed_work(struct workqueue_struct *wq,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1117	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1118	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1119	if (delay == 0)
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1120	return queue_work(wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1121
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1122	return queue_delayed_work_on(-1, wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1123	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1124	EXPORT_SYMBOL_GPL(queue_delayed_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1125
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1126	/**
				1127	* queue_delayed_work_on - queue work on specific CPU after delay
				1128	* @cpu: CPU number to execute work on
				1129	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1130	* @dwork: work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1131	* @delay: number of jiffies to wait before queueing
				1132	*
Alan Stern	057647f	2006-10-28 10:38:58 -0700	[diff] [blame]	1133	* Returns 0 if @work was already on a queue, non-zero otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1134	*/
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1135	int queue_delayed_work_on(int cpu, struct workqueue_struct *wq,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1136	struct delayed_work *dwork, unsigned long delay)
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1137	{
				1138	int ret = 0;
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1139	struct timer_list *timer = &dwork->timer;
				1140	struct work_struct *work = &dwork->work;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1141
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1142	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1143	unsigned int lcpu;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1144
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1145	BUG_ON(timer_pending(timer));
				1146	BUG_ON(!list_empty(&work->entry));
				1147
Andrew Liu	8a3e77c	2008-05-01 04:35:14 -0700	[diff] [blame]	1148	timer_stats_timer_set_start_info(&dwork->timer);
				1149
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1150	/*
				1151	* This stores cwq for the moment, for the timer_fn.
				1152	* Note that the work's gcwq is preserved to allow
				1153	* reentrance detection for delayed works.
				1154	*/
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1155	if (!(wq->flags & WQ_UNBOUND)) {
				1156	struct global_cwq *gcwq = get_work_gcwq(work);
				1157
				1158	if (gcwq && gcwq->cpu != WORK_CPU_UNBOUND)
				1159	lcpu = gcwq->cpu;
				1160	else
				1161	lcpu = raw_smp_processor_id();
				1162	} else
				1163	lcpu = WORK_CPU_UNBOUND;
				1164
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1165	set_work_cwq(work, get_cwq(lcpu, wq), 0);
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1166
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1167	timer->expires = jiffies + delay;
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1168	timer->data = (unsigned long)dwork;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1169	timer->function = delayed_work_timer_fn;
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1170
				1171	if (unlikely(cpu >= 0))
				1172	add_timer_on(timer, cpu);
				1173	else
				1174	add_timer(timer);
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1175	ret = 1;
				1176	}
				1177	return ret;
				1178	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1179	EXPORT_SYMBOL_GPL(queue_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1180
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1181	/**
				1182	* worker_enter_idle - enter idle state
				1183	* @worker: worker which is entering idle state
				1184	*
				1185	* @worker is entering idle state. Update stats and idle timer if
				1186	* necessary.
				1187	*
				1188	* LOCKING:
				1189	* spin_lock_irq(gcwq->lock).
				1190	*/
				1191	static void worker_enter_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1192	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1193	struct worker_pool *pool = worker->pool;
				1194	struct global_cwq *gcwq = pool->gcwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1195
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1196	BUG_ON(worker->flags & WORKER_IDLE);
				1197	BUG_ON(!list_empty(&worker->entry) &&
				1198	(worker->hentry.next \|\| worker->hentry.pprev));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1199
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1200	/* can't use worker_set_flags(), also called from start_worker() */
				1201	worker->flags \|= WORKER_IDLE;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1202	pool->nr_idle++;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1203	worker->last_active = jiffies;
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	1204
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1205	/* idle_list is LIFO */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1206	list_add(&worker->entry, &pool->idle_list);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1207
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	1208	if (too_many_workers(pool) && !timer_pending(&pool->idle_timer))
				1209	mod_timer(&pool->idle_timer, jiffies + IDLE_WORKER_TIMEOUT);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1210
Tejun Heo	544ecf3	2012-05-14 15:04:50 -0700	[diff] [blame]	1211	/*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	1212	* Sanity check nr_running. Because gcwq_unbind_fn() releases
				1213	* gcwq->lock between setting %WORKER_UNBOUND and zapping
				1214	* nr_running, the warning may trigger spuriously. Check iff
				1215	* unbind is not in progress.
Tejun Heo	544ecf3	2012-05-14 15:04:50 -0700	[diff] [blame]	1216	*/
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	1217	WARN_ON_ONCE(!(gcwq->flags & GCWQ_DISASSOCIATED) &&
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1218	pool->nr_workers == pool->nr_idle &&
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1219	atomic_read(get_pool_nr_running(pool)));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1220	}
				1221
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1222	/**
				1223	* worker_leave_idle - leave idle state
				1224	* @worker: worker which is leaving idle state
				1225	*
				1226	* @worker is leaving idle state. Update stats.
				1227	*
				1228	* LOCKING:
				1229	* spin_lock_irq(gcwq->lock).
				1230	*/
				1231	static void worker_leave_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1232	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1233	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1234
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1235	BUG_ON(!(worker->flags & WORKER_IDLE));
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	1236	worker_clr_flags(worker, WORKER_IDLE);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1237	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1238	list_del_init(&worker->entry);
				1239	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1240
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1241	/**
				1242	* worker_maybe_bind_and_lock - bind worker to its cpu if possible and lock gcwq
				1243	* @worker: self
				1244	*
				1245	* Works which are scheduled while the cpu is online must at least be
				1246	* scheduled to a worker which is bound to the cpu so that if they are
				1247	* flushed from cpu callbacks while cpu is going down, they are
				1248	* guaranteed to execute on the cpu.
				1249	*
				1250	* This function is to be used by rogue workers and rescuers to bind
				1251	* themselves to the target cpu and may race with cpu going down or
				1252	* coming online. kthread_bind() can't be used because it may put the
				1253	* worker to already dead cpu and set_cpus_allowed_ptr() can't be used
				1254	* verbatim as it's best effort and blocking and gcwq may be
				1255	* [dis]associated in the meantime.
				1256	*
Tejun Heo	f2d5a0e	2012-07-17 12:39:26 -0700	[diff] [blame]	1257	* This function tries set_cpus_allowed() and locks gcwq and verifies the
				1258	* binding against %GCWQ_DISASSOCIATED which is set during
				1259	* %CPU_DOWN_PREPARE and cleared during %CPU_ONLINE, so if the worker
				1260	* enters idle state or fetches works without dropping lock, it can
				1261	* guarantee the scheduling requirement described in the first paragraph.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1262	*
				1263	* CONTEXT:
				1264	* Might sleep. Called without any lock but returns with gcwq->lock
				1265	* held.
				1266	*
				1267	* RETURNS:
				1268	* %true if the associated gcwq is online (@worker is successfully
				1269	* bound), %false if offline.
				1270	*/
				1271	static bool worker_maybe_bind_and_lock(struct worker *worker)
Namhyung Kim	972fa1c	2010-08-22 23:19:43 +0900	[diff] [blame]	1272	__acquires(&gcwq->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1273	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1274	struct global_cwq *gcwq = worker->pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1275	struct task_struct *task = worker->task;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1276
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1277	while (true) {
				1278	/*
				1279	* The following call may fail, succeed or succeed
				1280	* without actually migrating the task to the cpu if
				1281	* it races with cpu hotunplug operation. Verify
				1282	* against GCWQ_DISASSOCIATED.
				1283	*/
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1284	if (!(gcwq->flags & GCWQ_DISASSOCIATED))
				1285	set_cpus_allowed_ptr(task, get_cpu_mask(gcwq->cpu));
Oleg Nesterov	85f4186	2007-05-09 02:34:20 -0700	[diff] [blame]	1286
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1287	spin_lock_irq(&gcwq->lock);
				1288	if (gcwq->flags & GCWQ_DISASSOCIATED)
				1289	return false;
				1290	if (task_cpu(task) == gcwq->cpu &&
				1291	cpumask_equal(&current->cpus_allowed,
				1292	get_cpu_mask(gcwq->cpu)))
				1293	return true;
				1294	spin_unlock_irq(&gcwq->lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1295
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1296	/*
				1297	* We've raced with CPU hot[un]plug. Give it a breather
				1298	* and retry migration. cond_resched() is required here;
				1299	* otherwise, we might deadlock against cpu_stop trying to
				1300	* bring down the CPU on non-preemptive kernel.
				1301	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1302	cpu_relax();
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1303	cond_resched();
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1304	}
				1305	}
				1306
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1307	struct idle_rebind {
				1308	int cnt; /* # workers to be rebound */
				1309	struct completion done; /* all workers rebound */
				1310	};
				1311
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1312	/*
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1313	* Rebind an idle @worker to its CPU. During CPU onlining, this has to
				1314	* happen synchronously for idle workers. worker_thread() will test
				1315	* %WORKER_REBIND before leaving idle and call this function.
				1316	*/
				1317	static void idle_worker_rebind(struct worker *worker)
				1318	{
				1319	struct global_cwq *gcwq = worker->pool->gcwq;
				1320
				1321	/* CPU must be online at this point */
				1322	WARN_ON(!worker_maybe_bind_and_lock(worker));
				1323	if (!--worker->idle_rebind->cnt)
				1324	complete(&worker->idle_rebind->done);
				1325	spin_unlock_irq(&worker->pool->gcwq->lock);
				1326
				1327	/* we did our part, wait for rebind_workers() to finish up */
				1328	wait_event(gcwq->rebind_hold, !(worker->flags & WORKER_REBIND));
				1329	}
				1330
				1331	/*
				1332	* Function for @worker->rebind.work used to rebind unbound busy workers to
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	1333	* the associated cpu which is coming back online. This is scheduled by
				1334	* cpu up but can race with other cpu hotplug operations and may be
				1335	* executed twice without intervening cpu down.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1336	*/
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1337	static void busy_worker_rebind_fn(struct work_struct *work)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1338	{
				1339	struct worker *worker = container_of(work, struct worker, rebind_work);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1340	struct global_cwq *gcwq = worker->pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1341
				1342	if (worker_maybe_bind_and_lock(worker))
				1343	worker_clr_flags(worker, WORKER_REBIND);
				1344
				1345	spin_unlock_irq(&gcwq->lock);
				1346	}
				1347
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1348	/**
				1349	* rebind_workers - rebind all workers of a gcwq to the associated CPU
				1350	* @gcwq: gcwq of interest
				1351	*
				1352	* @gcwq->cpu is coming online. Rebind all workers to the CPU. Rebinding
				1353	* is different for idle and busy ones.
				1354	*
				1355	* The idle ones should be rebound synchronously and idle rebinding should
				1356	* be complete before any worker starts executing work items with
				1357	* concurrency management enabled; otherwise, scheduler may oops trying to
				1358	* wake up non-local idle worker from wq_worker_sleeping().
				1359	*
				1360	* This is achieved by repeatedly requesting rebinding until all idle
				1361	* workers are known to have been rebound under @gcwq->lock and holding all
				1362	* idle workers from becoming busy until idle rebinding is complete.
				1363	*
				1364	* Once idle workers are rebound, busy workers can be rebound as they
				1365	* finish executing their current work items. Queueing the rebind work at
				1366	* the head of their scheduled lists is enough. Note that nr_running will
				1367	* be properbly bumped as busy workers rebind.
				1368	*
				1369	* On return, all workers are guaranteed to either be bound or have rebind
				1370	* work item scheduled.
				1371	*/
				1372	static void rebind_workers(struct global_cwq *gcwq)
				1373	__releases(&gcwq->lock) __acquires(&gcwq->lock)
				1374	{
				1375	struct idle_rebind idle_rebind;
				1376	struct worker_pool *pool;
				1377	struct worker *worker;
				1378	struct hlist_node *pos;
				1379	int i;
				1380
				1381	lockdep_assert_held(&gcwq->lock);
				1382
				1383	for_each_worker_pool(pool, gcwq)
				1384	lockdep_assert_held(&pool->manager_mutex);
				1385
				1386	/*
				1387	* Rebind idle workers. Interlocked both ways. We wait for
				1388	* workers to rebind via @idle_rebind.done. Workers will wait for
				1389	* us to finish up by watching %WORKER_REBIND.
				1390	*/
				1391	init_completion(&idle_rebind.done);
				1392	retry:
				1393	idle_rebind.cnt = 1;
				1394	INIT_COMPLETION(idle_rebind.done);
				1395
				1396	/* set REBIND and kick idle ones, we'll wait for these later */
				1397	for_each_worker_pool(pool, gcwq) {
				1398	list_for_each_entry(worker, &pool->idle_list, entry) {
Lai Jiangshan	96e6530	2012-09-02 00:28:19 +0800	[diff] [blame^]	1399	unsigned long worker_flags = worker->flags;
				1400
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1401	if (worker->flags & WORKER_REBIND)
				1402	continue;
				1403
Lai Jiangshan	96e6530	2012-09-02 00:28:19 +0800	[diff] [blame^]	1404	/* morph UNBOUND to REBIND atomically */
				1405	worker_flags &= ~WORKER_UNBOUND;
				1406	worker_flags \|= WORKER_REBIND;
				1407	ACCESS_ONCE(worker->flags) = worker_flags;
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1408
				1409	idle_rebind.cnt++;
				1410	worker->idle_rebind = &idle_rebind;
				1411
				1412	/* worker_thread() will call idle_worker_rebind() */
				1413	wake_up_process(worker->task);
				1414	}
				1415	}
				1416
				1417	if (--idle_rebind.cnt) {
				1418	spin_unlock_irq(&gcwq->lock);
				1419	wait_for_completion(&idle_rebind.done);
				1420	spin_lock_irq(&gcwq->lock);
				1421	/* busy ones might have become idle while waiting, retry */
				1422	goto retry;
				1423	}
				1424
				1425	/*
				1426	* All idle workers are rebound and waiting for %WORKER_REBIND to
				1427	* be cleared inside idle_worker_rebind(). Clear and release.
				1428	* Clearing %WORKER_REBIND from this foreign context is safe
				1429	* because these workers are still guaranteed to be idle.
				1430	*/
				1431	for_each_worker_pool(pool, gcwq)
				1432	list_for_each_entry(worker, &pool->idle_list, entry)
				1433	worker->flags &= ~WORKER_REBIND;
				1434
				1435	wake_up_all(&gcwq->rebind_hold);
				1436
				1437	/* rebind busy workers */
				1438	for_each_busy_worker(worker, i, pos, gcwq) {
				1439	struct work_struct *rebind_work = &worker->rebind_work;
Lai Jiangshan	96e6530	2012-09-02 00:28:19 +0800	[diff] [blame^]	1440	unsigned long worker_flags = worker->flags;
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1441
Lai Jiangshan	96e6530	2012-09-02 00:28:19 +0800	[diff] [blame^]	1442	/* morph UNBOUND to REBIND atomically */
				1443	worker_flags &= ~WORKER_UNBOUND;
				1444	worker_flags \|= WORKER_REBIND;
				1445	ACCESS_ONCE(worker->flags) = worker_flags;
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1446
				1447	if (test_and_set_bit(WORK_STRUCT_PENDING_BIT,
				1448	work_data_bits(rebind_work)))
				1449	continue;
				1450
				1451	/* wq doesn't matter, use the default one */
				1452	debug_work_activate(rebind_work);
				1453	insert_work(get_cwq(gcwq->cpu, system_wq), rebind_work,
				1454	worker->scheduled.next,
				1455	work_color_to_flags(WORK_NO_COLOR));
				1456	}
				1457	}
				1458
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1459	static struct worker *alloc_worker(void)
				1460	{
				1461	struct worker *worker;
				1462
				1463	worker = kzalloc(sizeof(*worker), GFP_KERNEL);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1464	if (worker) {
				1465	INIT_LIST_HEAD(&worker->entry);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1466	INIT_LIST_HEAD(&worker->scheduled);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1467	INIT_WORK(&worker->rebind_work, busy_worker_rebind_fn);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1468	/* on creation a worker is in !idle && prep state */
				1469	worker->flags = WORKER_PREP;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1470	}
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1471	return worker;
				1472	}
				1473
				1474	/**
				1475	* create_worker - create a new workqueue worker
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1476	* @pool: pool the new worker will belong to
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1477	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1478	* Create a new worker which is bound to @pool. The returned worker
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1479	* can be started by calling start_worker() or destroyed using
				1480	* destroy_worker().
				1481	*
				1482	* CONTEXT:
				1483	* Might sleep. Does GFP_KERNEL allocations.
				1484	*
				1485	* RETURNS:
				1486	* Pointer to the newly created worker.
				1487	*/
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1488	static struct worker create_worker(struct worker_pool pool)
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1489	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1490	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1491	const char *pri = worker_pool_pri(pool) ? "H" : "";
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1492	struct worker *worker = NULL;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1493	int id = -1;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1494
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1495	spin_lock_irq(&gcwq->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1496	while (ida_get_new(&pool->worker_ida, &id)) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1497	spin_unlock_irq(&gcwq->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1498	if (!ida_pre_get(&pool->worker_ida, GFP_KERNEL))
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1499	goto fail;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1500	spin_lock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1501	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1502	spin_unlock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1503
				1504	worker = alloc_worker();
				1505	if (!worker)
				1506	goto fail;
				1507
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1508	worker->pool = pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1509	worker->id = id;
				1510
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1511	if (gcwq->cpu != WORK_CPU_UNBOUND)
Eric Dumazet	94dcf29	2011-03-22 16:30:45 -0700	[diff] [blame]	1512	worker->task = kthread_create_on_node(worker_thread,
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1513	worker, cpu_to_node(gcwq->cpu),
				1514	"kworker/%u:%d%s", gcwq->cpu, id, pri);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1515	else
				1516	worker->task = kthread_create(worker_thread, worker,
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1517	"kworker/u:%d%s", id, pri);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1518	if (IS_ERR(worker->task))
				1519	goto fail;
				1520
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1521	if (worker_pool_pri(pool))
				1522	set_user_nice(worker->task, HIGHPRI_NICE_LEVEL);
				1523
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1524	/*
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1525	* Determine CPU binding of the new worker depending on
				1526	* %GCWQ_DISASSOCIATED. The caller is responsible for ensuring the
				1527	* flag remains stable across this function. See the comments
				1528	* above the flag definition for details.
				1529	*
				1530	* As an unbound worker may later become a regular one if CPU comes
				1531	* online, make sure every worker has %PF_THREAD_BOUND set.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1532	*/
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1533	if (!(gcwq->flags & GCWQ_DISASSOCIATED)) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1534	kthread_bind(worker->task, gcwq->cpu);
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1535	} else {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1536	worker->task->flags \|= PF_THREAD_BOUND;
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1537	worker->flags \|= WORKER_UNBOUND;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1538	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1539
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1540	return worker;
				1541	fail:
				1542	if (id >= 0) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1543	spin_lock_irq(&gcwq->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1544	ida_remove(&pool->worker_ida, id);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1545	spin_unlock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1546	}
				1547	kfree(worker);
				1548	return NULL;
				1549	}
				1550
				1551	/**
				1552	* start_worker - start a newly created worker
				1553	* @worker: worker to start
				1554	*
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1555	* Make the gcwq aware of @worker and start it.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1556	*
				1557	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1558	* spin_lock_irq(gcwq->lock).
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1559	*/
				1560	static void start_worker(struct worker *worker)
				1561	{
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1562	worker->flags \|= WORKER_STARTED;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1563	worker->pool->nr_workers++;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1564	worker_enter_idle(worker);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1565	wake_up_process(worker->task);
				1566	}
				1567
				1568	/**
				1569	* destroy_worker - destroy a workqueue worker
				1570	* @worker: worker to be destroyed
				1571	*
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1572	* Destroy @worker and adjust @gcwq stats accordingly.
				1573	*
				1574	* CONTEXT:
				1575	* spin_lock_irq(gcwq->lock) which is released and regrabbed.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1576	*/
				1577	static void destroy_worker(struct worker *worker)
				1578	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1579	struct worker_pool *pool = worker->pool;
				1580	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1581	int id = worker->id;
				1582
				1583	/* sanity check frenzy */
				1584	BUG_ON(worker->current_work);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1585	BUG_ON(!list_empty(&worker->scheduled));
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1586
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1587	if (worker->flags & WORKER_STARTED)
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1588	pool->nr_workers--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1589	if (worker->flags & WORKER_IDLE)
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1590	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1591
				1592	list_del_init(&worker->entry);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1593	worker->flags \|= WORKER_DIE;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1594
				1595	spin_unlock_irq(&gcwq->lock);
				1596
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1597	kthread_stop(worker->task);
				1598	kfree(worker);
				1599
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1600	spin_lock_irq(&gcwq->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1601	ida_remove(&pool->worker_ida, id);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1602	}
				1603
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1604	static void idle_worker_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1605	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1606	struct worker_pool pool = (void )__pool;
				1607	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1608
				1609	spin_lock_irq(&gcwq->lock);
				1610
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1611	if (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1612	struct worker *worker;
				1613	unsigned long expires;
				1614
				1615	/* idle_list is kept in LIFO order, check the last one */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1616	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1617	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1618
				1619	if (time_before(jiffies, expires))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1620	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1621	else {
				1622	/* it's been idle for too long, wake up manager */
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	1623	pool->flags \|= POOL_MANAGE_WORKERS;
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1624	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1625	}
				1626	}
				1627
				1628	spin_unlock_irq(&gcwq->lock);
				1629	}
				1630
				1631	static bool send_mayday(struct work_struct *work)
				1632	{
				1633	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
				1634	struct workqueue_struct *wq = cwq->wq;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1635	unsigned int cpu;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1636
				1637	if (!(wq->flags & WQ_RESCUER))
				1638	return false;
				1639
				1640	/* mayday mayday mayday */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1641	cpu = cwq->pool->gcwq->cpu;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1642	/* WORK_CPU_UNBOUND can't be set in cpumask, use cpu 0 instead */
				1643	if (cpu == WORK_CPU_UNBOUND)
				1644	cpu = 0;
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	1645	if (!mayday_test_and_set_cpu(cpu, wq->mayday_mask))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1646	wake_up_process(wq->rescuer->task);
				1647	return true;
				1648	}
				1649
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1650	static void gcwq_mayday_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1651	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1652	struct worker_pool pool = (void )__pool;
				1653	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1654	struct work_struct *work;
				1655
				1656	spin_lock_irq(&gcwq->lock);
				1657
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1658	if (need_to_create_worker(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1659	/*
				1660	* We've been trying to create a new worker but
				1661	* haven't been successful. We might be hitting an
				1662	* allocation deadlock. Send distress signals to
				1663	* rescuers.
				1664	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1665	list_for_each_entry(work, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1666	send_mayday(work);
				1667	}
				1668
				1669	spin_unlock_irq(&gcwq->lock);
				1670
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1671	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INTERVAL);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1672	}
				1673
				1674	/**
				1675	* maybe_create_worker - create a new worker if necessary
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1676	* @pool: pool to create a new worker for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1677	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1678	* Create a new worker for @pool if necessary. @pool is guaranteed to
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1679	* have at least one idle worker on return from this function. If
				1680	* creating a new worker takes longer than MAYDAY_INTERVAL, mayday is
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1681	* sent to all rescuers with works scheduled on @pool to resolve
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1682	* possible allocation deadlock.
				1683	*
				1684	* On return, need_to_create_worker() is guaranteed to be false and
				1685	* may_start_working() true.
				1686	*
				1687	* LOCKING:
				1688	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1689	* multiple times. Does GFP_KERNEL allocations. Called only from
				1690	* manager.
				1691	*
				1692	* RETURNS:
				1693	* false if no action was taken and gcwq->lock stayed locked, true
				1694	* otherwise.
				1695	*/
static bool maybe_create_worker(struct worker_pool *pool)
__releases(&gcwq->lock)
__acquires(&gcwq->lock)
{
	struct global_cwq *gcwq = pool->gcwq;

	/* nothing to do: return without ever having dropped gcwq->lock */
	if (!need_to_create_worker(pool))
		return false;
restart:
	/* the lock stays dropped for the whole creation attempt below */
	spin_unlock_irq(&gcwq->lock);

	/* if we don't make progress in MAYDAY_INITIAL_TIMEOUT, call for help */
	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INITIAL_TIMEOUT);

	while (true) {
		struct worker *worker;

		worker = create_worker(pool);
		if (worker) {
			/* success: stop the mayday timer, then retake the lock */
			del_timer_sync(&pool->mayday_timer);
			spin_lock_irq(&gcwq->lock);
			start_worker(worker);
			BUG_ON(need_to_create_worker(pool));
			return true;
		}

		/* creation failed; stop trying if a worker is no longer needed */
		if (!need_to_create_worker(pool))
			break;

		/* back off for CREATE_COOLDOWN before the next attempt */
		__set_current_state(TASK_INTERRUPTIBLE);
		schedule_timeout(CREATE_COOLDOWN);

		if (!need_to_create_worker(pool))
			break;
	}

	del_timer_sync(&pool->mayday_timer);
	spin_lock_irq(&gcwq->lock);
	/* recheck with the lock held; start over if a worker is needed again */
	if (need_to_create_worker(pool))
		goto restart;
	return true;
}
				1738
				1739	/**
				1740	* maybe_destroy_worker - destroy workers which have been idle for a while
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1741	* @pool: pool to destroy workers for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1742	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1743	* Destroy @pool workers which have been idle for longer than
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1744	* IDLE_WORKER_TIMEOUT.
				1745	*
				1746	* LOCKING:
				1747	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1748	* multiple times. Called only from manager.
				1749	*
				1750	* RETURNS:
				1751	* false if no action was taken and gcwq->lock stayed locked, true
				1752	* otherwise.
				1753	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1754	static bool maybe_destroy_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1755	{
				1756	bool ret = false;
				1757
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1758	while (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1759	struct worker *worker;
				1760	unsigned long expires;
				1761
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1762	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1763	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1764
				1765	if (time_before(jiffies, expires)) {
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1766	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1767	break;
				1768	}
				1769
				1770	destroy_worker(worker);
				1771	ret = true;
				1772	}
				1773
				1774	return ret;
				1775	}
				1776
				1777	/**
				1778	* manage_workers - manage worker pool
				1779	* @worker: self
				1780	*
				1781	* Assume the manager role and manage gcwq worker pool @worker belongs
				1782	* to. At any given time, there can be only zero or one manager per
				1783	* gcwq. The exclusion is handled automatically by this function.
				1784	*
				1785	* The caller can safely start processing works on false return. On
				1786	* true return, it's guaranteed that need_to_create_worker() is false
				1787	* and may_start_working() is true.
				1788	*
				1789	* CONTEXT:
				1790	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1791	* multiple times. Does GFP_KERNEL allocations.
				1792	*
				1793	* RETURNS:
				1794	* false if no action was taken and gcwq->lock stayed locked, true if
				1795	* some action was taken.
				1796	*/
				1797	static bool manage_workers(struct worker *worker)
				1798	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1799	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1800	bool ret = false;
				1801
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	1802	if (!mutex_trylock(&pool->manager_mutex))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1803	return ret;
				1804
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	1805	pool->flags &= ~POOL_MANAGE_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1806
				1807	/*
				1808	* Destroy and then create so that may_start_working() is true
				1809	* on return.
				1810	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1811	ret \|= maybe_destroy_workers(pool);
				1812	ret \|= maybe_create_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1813
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	1814	mutex_unlock(&pool->manager_mutex);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1815	return ret;
				1816	}
				1817
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1818	/**
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1819	* move_linked_works - move linked works to a list
				1820	* @work: start of series of works to be scheduled
				1821	* @head: target list to append @work to
				1822	* @nextp: out paramter for nested worklist walking
				1823	*
				1824	* Schedule linked works starting from @work to @head. Work series to
				1825	* be scheduled starts at @work and includes any consecutive work with
				1826	* WORK_STRUCT_LINKED set in its predecessor.
				1827	*
				1828	* If @nextp is not NULL, it's updated to point to the next work of
				1829	* the last scheduled work. This allows move_linked_works() to be
				1830	* nested inside outer list_for_each_entry_safe().
				1831	*
				1832	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1833	* spin_lock_irq(gcwq->lock).
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1834	*/
				1835	static void move_linked_works(struct work_struct work, struct list_head head,
				1836	struct work_struct **nextp)
				1837	{
				1838	struct work_struct *n;
				1839
				1840	/*
				1841	* Linked worklist will always end before the end of the list,
				1842	* use NULL for list head.
				1843	*/
				1844	list_for_each_entry_safe_from(work, n, NULL, entry) {
				1845	list_move_tail(&work->entry, head);
				1846	if (!(*work_data_bits(work) & WORK_STRUCT_LINKED))
				1847	break;
				1848	}
				1849
				1850	/*
				1851	* If we're already inside safe list traversal and have moved
				1852	* multiple works to the scheduled queue, the next position
				1853	* needs to be updated.
				1854	*/
				1855	if (nextp)
				1856	*nextp = n;
				1857	}
				1858
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1859	static void cwq_activate_first_delayed(struct cpu_workqueue_struct *cwq)
				1860	{
				1861	struct work_struct *work = list_first_entry(&cwq->delayed_works,
				1862	struct work_struct, entry);
				1863
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1864	trace_workqueue_activate_work(work);
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1865	move_linked_works(work, &cwq->pool->worklist, NULL);
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1866	__clear_bit(WORK_STRUCT_DELAYED_BIT, work_data_bits(work));
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1867	cwq->nr_active++;
				1868	}
				1869
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1870	/**
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1871	* cwq_dec_nr_in_flight - decrement cwq's nr_in_flight
				1872	* @cwq: cwq of interest
				1873	* @color: color of work which left the queue
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1874	* @delayed: for a delayed work
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1875	*
				1876	* A work either has completed or is removed from pending queue,
				1877	* decrement nr_in_flight of its cwq and handle workqueue flushing.
				1878	*
				1879	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1880	* spin_lock_irq(gcwq->lock).
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1881	*/
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1882	static void cwq_dec_nr_in_flight(struct cpu_workqueue_struct *cwq, int color,
				1883	bool delayed)
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1884	{
				1885	/* ignore uncolored works */
				1886	if (color == WORK_NO_COLOR)
				1887	return;
				1888
				1889	cwq->nr_in_flight[color]--;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1890
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1891	if (!delayed) {
				1892	cwq->nr_active--;
				1893	if (!list_empty(&cwq->delayed_works)) {
				1894	/* one down, submit a delayed one */
				1895	if (cwq->nr_active < cwq->max_active)
				1896	cwq_activate_first_delayed(cwq);
				1897	}
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1898	}
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1899
				1900	/* is flush in progress and are we at the flushing tip? */
				1901	if (likely(cwq->flush_color != color))
				1902	return;
				1903
				1904	/* are there still in-flight works? */
				1905	if (cwq->nr_in_flight[color])
				1906	return;
				1907
				1908	/* this cwq is done, clear flush_color */
				1909	cwq->flush_color = -1;
				1910
				1911	/*
				1912	* If this was the last cwq, wake up the first flusher. It
				1913	* will handle the rest.
				1914	*/
				1915	if (atomic_dec_and_test(&cwq->wq->nr_cwqs_to_flush))
				1916	complete(&cwq->wq->first_flusher->done);
				1917	}
				1918
				1919	/**
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1920	* process_one_work - process single work
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1921	* @worker: self
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1922	* @work: work to process
				1923	*
				1924	* Process @work. This function contains all the logics necessary to
				1925	* process a single work including synchronization against and
				1926	* interaction with other workers on the same cpu, queueing and
				1927	* flushing. As long as context requirement is met, any worker can
				1928	* call this function to process a work.
				1929	*
				1930	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1931	* spin_lock_irq(gcwq->lock) which is released and regrabbed.
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1932	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1933	static void process_one_work(struct worker worker, struct work_struct work)
Namhyung Kim	06bd6eb	2010-08-22 23:19:42 +0900	[diff] [blame]	1934	__releases(&gcwq->lock)
				1935	__acquires(&gcwq->lock)
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1936	{
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1937	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1938	struct worker_pool *pool = worker->pool;
				1939	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1940	struct hlist_head *bwh = busy_worker_head(gcwq, work);
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1941	bool cpu_intensive = cwq->wq->flags & WQ_CPU_INTENSIVE;
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1942	work_func_t f = work->func;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1943	int work_color;
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1944	struct worker *collision;
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1945	#ifdef CONFIG_LOCKDEP
				1946	/*
				1947	* It is permissible to free the struct work_struct from
				1948	* inside the function that is called from it, this we need to
				1949	* take into account for lockdep too. To avoid bogus "held
				1950	* lock freed" warnings as well as problems when looking into
				1951	* work->lockdep_map, make a copy and use that here.
				1952	*/
Peter Zijlstra	4d82a1d	2012-05-15 08:06:19 -0700	[diff] [blame]	1953	struct lockdep_map lockdep_map;
				1954
				1955	lockdep_copy_map(&lockdep_map, &work->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1956	#endif
Tejun Heo	6fec10a	2012-07-22 10:16:34 -0700	[diff] [blame]	1957	/*
				1958	* Ensure we're on the correct CPU. DISASSOCIATED test is
				1959	* necessary to avoid spurious warnings from rescuers servicing the
				1960	* unbound or a disassociated gcwq.
				1961	*/
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1962	WARN_ON_ONCE(!(worker->flags & (WORKER_UNBOUND \| WORKER_REBIND)) &&
Tejun Heo	6fec10a	2012-07-22 10:16:34 -0700	[diff] [blame]	1963	!(gcwq->flags & GCWQ_DISASSOCIATED) &&
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1964	raw_smp_processor_id() != gcwq->cpu);
				1965
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1966	/*
				1967	* A single work shouldn't be executed concurrently by
				1968	* multiple workers on a single cpu. Check whether anyone is
				1969	* already processing the work. If so, defer the work to the
				1970	* currently executing one.
				1971	*/
				1972	collision = __find_worker_executing_work(gcwq, bwh, work);
				1973	if (unlikely(collision)) {
				1974	move_linked_works(work, &collision->scheduled, NULL);
				1975	return;
				1976	}
				1977
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1978	/* claim and process */
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1979	debug_work_deactivate(work);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1980	hlist_add_head(&worker->hentry, bwh);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1981	worker->current_work = work;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	1982	worker->current_cwq = cwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1983	work_color = get_work_color(work);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1984
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1985	/* record the current cpu number in the work data and dequeue */
				1986	set_work_cpu(work, gcwq->cpu);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1987	list_del_init(&work->entry);
				1988
Tejun Heo	649027d	2010-06-29 10:07:14 +0200	[diff] [blame]	1989	/*
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1990	* CPU intensive works don't participate in concurrency
				1991	* management. They're the scheduler's responsibility.
				1992	*/
				1993	if (unlikely(cpu_intensive))
				1994	worker_set_flags(worker, WORKER_CPU_INTENSIVE, true);
				1995
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	1996	/*
				1997	* Unbound gcwq isn't concurrency managed and work items should be
				1998	* executed ASAP. Wake up another worker if necessary.
				1999	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2000	if ((worker->flags & WORKER_UNBOUND) && need_more_worker(pool))
				2001	wake_up_worker(pool);
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	2002
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2003	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2004
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2005	work_clear_pending(work);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2006	lock_map_acquire_read(&cwq->wq->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2007	lock_map_acquire(&lockdep_map);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	2008	trace_workqueue_execute_start(work);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2009	f(work);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	2010	/*
				2011	* While we must be careful to not use "work" after this, the trace
				2012	* point will only record its address.
				2013	*/
				2014	trace_workqueue_execute_end(work);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2015	lock_map_release(&lockdep_map);
				2016	lock_map_release(&cwq->wq->lockdep_map);
				2017
				2018	if (unlikely(in_atomic() \|\| lockdep_depth(current) > 0)) {
				2019	printk(KERN_ERR "BUG: workqueue leaked lock or atomic: "
				2020	"%s/0x%08x/%d\n",
				2021	current->comm, preempt_count(), task_pid_nr(current));
				2022	printk(KERN_ERR " last function: ");
				2023	print_symbol("%s\n", (unsigned long)f);
				2024	debug_show_held_locks(current);
				2025	dump_stack();
				2026	}
				2027
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2028	spin_lock_irq(&gcwq->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2029
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	2030	/* clear cpu intensive status */
				2031	if (unlikely(cpu_intensive))
				2032	worker_clr_flags(worker, WORKER_CPU_INTENSIVE);
				2033
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2034	/* we're done with it, release */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2035	hlist_del_init(&worker->hentry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2036	worker->current_work = NULL;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	2037	worker->current_cwq = NULL;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	2038	cwq_dec_nr_in_flight(cwq, work_color, false);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2039	}
				2040
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2041	/**
				2042	* process_scheduled_works - process scheduled works
				2043	* @worker: self
				2044	*
				2045	* Process all scheduled works. Please note that the scheduled list
				2046	* may change while processing a work, so this function repeatedly
				2047	* fetches a work from the top and executes it.
				2048	*
				2049	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2050	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2051	* multiple times.
				2052	*/
				2053	static void process_scheduled_works(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2054	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2055	while (!list_empty(&worker->scheduled)) {
				2056	struct work_struct *work = list_first_entry(&worker->scheduled,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2057	struct work_struct, entry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2058	process_one_work(worker, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2059	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2060	}
				2061
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2062	/**
				2063	* worker_thread - the worker thread function
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2064	* @__worker: self
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2065	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2066	* The gcwq worker thread function. There's a single dynamic pool of
				2067	* these per each cpu. These workers process all works regardless of
				2068	* their specific target workqueue. The only exception is works which
				2069	* belong to workqueues with a rescuer which will be explained in
				2070	* rescuer_thread().
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2071	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2072	static int worker_thread(void *__worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2073	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2074	struct worker *worker = __worker;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2075	struct worker_pool *pool = worker->pool;
				2076	struct global_cwq *gcwq = pool->gcwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2077
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2078	/* tell the scheduler that this is a workqueue worker */
				2079	worker->task->flags \|= PF_WQ_WORKER;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2080	woke_up:
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2081	spin_lock_irq(&gcwq->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2082
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2083	/*
				2084	* DIE can be set only while idle and REBIND set while busy has
				2085	* @worker->rebind_work scheduled. Checking here is enough.
				2086	*/
				2087	if (unlikely(worker->flags & (WORKER_REBIND \| WORKER_DIE))) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2088	spin_unlock_irq(&gcwq->lock);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2089
				2090	if (worker->flags & WORKER_DIE) {
				2091	worker->task->flags &= ~PF_WQ_WORKER;
				2092	return 0;
				2093	}
				2094
				2095	idle_worker_rebind(worker);
				2096	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2097	}
				2098
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2099	worker_leave_idle(worker);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	2100	recheck:
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2101	/* no more worker necessary? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2102	if (!need_more_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2103	goto sleep;
				2104
				2105	/* do we need to manage? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2106	if (unlikely(!may_start_working(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2107	goto recheck;
				2108
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2109	/*
				2110	* ->scheduled list can only be filled while a worker is
				2111	* preparing to process a work or actually processing it.
				2112	* Make sure nobody diddled with it while I was sleeping.
				2113	*/
				2114	BUG_ON(!list_empty(&worker->scheduled));
				2115
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2116	/*
				2117	* When control reaches this point, we're guaranteed to have
				2118	* at least one idle worker or that someone else has already
				2119	* assumed the manager role.
				2120	*/
				2121	worker_clr_flags(worker, WORKER_PREP);
				2122
				2123	do {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2124	struct work_struct *work =
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2125	list_first_entry(&pool->worklist,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2126	struct work_struct, entry);
				2127
				2128	if (likely(!(*work_data_bits(work) & WORK_STRUCT_LINKED))) {
				2129	/* optimization path, not strictly necessary */
				2130	process_one_work(worker, work);
				2131	if (unlikely(!list_empty(&worker->scheduled)))
				2132	process_scheduled_works(worker);
				2133	} else {
				2134	move_linked_works(work, &worker->scheduled, NULL);
				2135	process_scheduled_works(worker);
				2136	}
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2137	} while (keep_working(pool));
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2138
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2139	worker_set_flags(worker, WORKER_PREP, false);
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2140	sleep:
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2141	if (unlikely(need_to_manage_workers(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2142	goto recheck;
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2143
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2144	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2145	* gcwq->lock is held and there's no work to process and no
				2146	* need to manage, sleep. Workers are woken up only while
				2147	* holding gcwq->lock or from local cpu, so setting the
				2148	* current state before releasing gcwq->lock is enough to
				2149	* prevent losing any event.
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2150	*/
				2151	worker_enter_idle(worker);
				2152	__set_current_state(TASK_INTERRUPTIBLE);
				2153	spin_unlock_irq(&gcwq->lock);
				2154	schedule();
				2155	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2156	}
				2157
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2158	/**
				2159	* rescuer_thread - the rescuer thread function
				2160	* @__wq: the associated workqueue
				2161	*
				2162	* Workqueue rescuer thread function. There's one rescuer for each
				2163	* workqueue which has WQ_RESCUER set.
				2164	*
				2165	* Regular work processing on a gcwq may block trying to create a new
				2166	* worker which uses GFP_KERNEL allocation which has slight chance of
				2167	* developing into deadlock if some works currently on the same queue
				2168	* need to be processed to satisfy the GFP_KERNEL allocation. This is
				2169	* the problem rescuer solves.
				2170	*
				2171	* When such condition is possible, the gcwq summons rescuers of all
				2172	* workqueues which have works queued on the gcwq and let them process
				2173	* those works so that forward progress can be guaranteed.
				2174	*
				2175	* This should happen rarely.
				2176	*/
				2177	static int rescuer_thread(void *__wq)
				2178	{
				2179	struct workqueue_struct *wq = __wq;
				2180	struct worker *rescuer = wq->rescuer;
				2181	struct list_head *scheduled = &rescuer->scheduled;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2182	bool is_unbound = wq->flags & WQ_UNBOUND;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2183	unsigned int cpu;
				2184
				2185	set_user_nice(current, RESCUER_NICE_LEVEL);
				2186	repeat:
				2187	set_current_state(TASK_INTERRUPTIBLE);
				2188
				2189	if (kthread_should_stop())
				2190	return 0;
				2191
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2192	/*
				2193	* See whether any cpu is asking for help. Unbounded
				2194	* workqueues use cpu 0 in mayday_mask for CPU_UNBOUND.
				2195	*/
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	2196	for_each_mayday_cpu(cpu, wq->mayday_mask) {
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2197	unsigned int tcpu = is_unbound ? WORK_CPU_UNBOUND : cpu;
				2198	struct cpu_workqueue_struct *cwq = get_cwq(tcpu, wq);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2199	struct worker_pool *pool = cwq->pool;
				2200	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2201	struct work_struct work, n;
				2202
				2203	__set_current_state(TASK_RUNNING);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	2204	mayday_clear_cpu(cpu, wq->mayday_mask);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2205
				2206	/* migrate to the target cpu if possible */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2207	rescuer->pool = pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2208	worker_maybe_bind_and_lock(rescuer);
				2209
				2210	/*
				2211	* Slurp in all works issued via this workqueue and
				2212	* process'em.
				2213	*/
				2214	BUG_ON(!list_empty(&rescuer->scheduled));
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2215	list_for_each_entry_safe(work, n, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2216	if (get_work_cwq(work) == cwq)
				2217	move_linked_works(work, scheduled, &n);
				2218
				2219	process_scheduled_works(rescuer);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2220
				2221	/*
				2222	* Leave this gcwq. If keep_working() is %true, notify a
				2223	* regular worker; otherwise, we end up with 0 concurrency
				2224	* and stalling the execution.
				2225	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2226	if (keep_working(pool))
				2227	wake_up_worker(pool);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2228
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2229	spin_unlock_irq(&gcwq->lock);
				2230	}
				2231
				2232	schedule();
				2233	goto repeat;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2234	}
				2235
/* A barrier work item paired with the completion its handler signals. */
struct wq_barrier {
	struct work_struct	work;	/* set up with wq_barrier_func as handler */
	struct completion	done;	/* completed by wq_barrier_func() */
};
				2240
				2241	static void wq_barrier_func(struct work_struct *work)
				2242	{
				2243	struct wq_barrier *barr = container_of(work, struct wq_barrier, work);
				2244	complete(&barr->done);
				2245	}
				2246
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2247	/**
				2248	* insert_wq_barrier - insert a barrier work
				2249	* @cwq: cwq to insert barrier into
				2250	* @barr: wq_barrier to insert
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2251	* @target: target work to attach @barr to
				2252	* @worker: worker currently executing @target, NULL if @target is not executing
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2253	*
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2254	* @barr is linked to @target such that @barr is completed only after
				2255	* @target finishes execution. Please note that the ordering
				2256	* guarantee is observed only with respect to @target and on the local
				2257	* cpu.
				2258	*
				2259	* Currently, a queued barrier can't be canceled. This is because
				2260	* try_to_grab_pending() can't determine whether the work to be
				2261	* grabbed is at the head of the queue and thus can't clear LINKED
				2262	* flag of the previous work while there must be a valid next work
				2263	* after a work with LINKED flag set.
				2264	*
				2265	* Note that when @worker is non-NULL, @target may be modified
				2266	* underneath us, so we can't reliably determine cwq from @target.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2267	*
				2268	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2269	* spin_lock_irq(gcwq->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2270	*/
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2271	static void insert_wq_barrier(struct cpu_workqueue_struct *cwq,
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2272	struct wq_barrier *barr,
				2273	struct work_struct target, struct worker worker)
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2274	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2275	struct list_head *head;
				2276	unsigned int linked = 0;
				2277
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2278	/*
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2279	* debugobject calls are safe here even with gcwq->lock locked
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2280	* as we know for sure that this will not trigger any of the
				2281	* checks and call back into the fixup functions where we
				2282	* might deadlock.
				2283	*/
Andrew Morton	ca1cab3	2010-10-26 14:22:34 -0700	[diff] [blame]	2284	INIT_WORK_ONSTACK(&barr->work, wq_barrier_func);
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2285	__set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(&barr->work));
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2286	init_completion(&barr->done);
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2287
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2288	/*
				2289	* If @target is currently being executed, schedule the
				2290	* barrier to the worker; otherwise, put it after @target.
				2291	*/
				2292	if (worker)
				2293	head = worker->scheduled.next;
				2294	else {
				2295	unsigned long *bits = work_data_bits(target);
				2296
				2297	head = target->entry.next;
				2298	/* there can already be other linked works, inherit and set */
				2299	linked = *bits & WORK_STRUCT_LINKED;
				2300	__set_bit(WORK_STRUCT_LINKED_BIT, bits);
				2301	}
				2302
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2303	debug_work_activate(&barr->work);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2304	insert_work(cwq, &barr->work, head,
				2305	work_color_to_flags(WORK_NO_COLOR) \| linked);
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2306	}
				2307
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2308	/**
				2309	* flush_workqueue_prep_cwqs - prepare cwqs for workqueue flushing
				2310	* @wq: workqueue being flushed
				2311	* @flush_color: new flush color, < 0 for no-op
				2312	* @work_color: new work color, < 0 for no-op
				2313	*
				2314	* Prepare cwqs for workqueue flushing.
				2315	*
				2316	* If @flush_color is non-negative, flush_color on all cwqs should be
				2317	* -1. If no cwq has in-flight commands at the specified color, all
				2318	* cwq->flush_color's stay at -1 and %false is returned. If any cwq
				2319	* has in flight commands, its cwq->flush_color is set to
				2320	* @flush_color, @wq->nr_cwqs_to_flush is updated accordingly, cwq
				2321	* wakeup logic is armed and %true is returned.
				2322	*
				2323	* The caller should have initialized @wq->first_flusher prior to
				2324	* calling this function with non-negative @flush_color. If
				2325	* @flush_color is negative, no flush color update is done and %false
				2326	* is returned.
				2327	*
				2328	* If @work_color is non-negative, all cwqs should have the same
				2329	* work_color which is previous to @work_color and all will be
				2330	* advanced to @work_color.
				2331	*
				2332	* CONTEXT:
				2333	* mutex_lock(wq->flush_mutex).
				2334	*
				2335	* RETURNS:
				2336	* %true if @flush_color >= 0 and there's something to flush. %false
				2337	* otherwise.
				2338	*/
				2339	static bool flush_workqueue_prep_cwqs(struct workqueue_struct *wq,
				2340	int flush_color, int work_color)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2341	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2342	bool wait = false;
				2343	unsigned int cpu;
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2344
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2345	if (flush_color >= 0) {
				2346	BUG_ON(atomic_read(&wq->nr_cwqs_to_flush));
				2347	atomic_set(&wq->nr_cwqs_to_flush, 1);
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2348	}
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2349
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2350	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2351	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2352	struct global_cwq *gcwq = cwq->pool->gcwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2353
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2354	spin_lock_irq(&gcwq->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2355
				2356	if (flush_color >= 0) {
				2357	BUG_ON(cwq->flush_color != -1);
				2358
				2359	if (cwq->nr_in_flight[flush_color]) {
				2360	cwq->flush_color = flush_color;
				2361	atomic_inc(&wq->nr_cwqs_to_flush);
				2362	wait = true;
				2363	}
				2364	}
				2365
				2366	if (work_color >= 0) {
				2367	BUG_ON(work_color != work_next_color(cwq->work_color));
				2368	cwq->work_color = work_color;
				2369	}
				2370
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2371	spin_unlock_irq(&gcwq->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2372	}
				2373
				2374	if (flush_color >= 0 && atomic_dec_and_test(&wq->nr_cwqs_to_flush))
				2375	complete(&wq->first_flusher->done);
				2376
				2377	return wait;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2378	}
				2379
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2380	/**
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2381	* flush_workqueue - ensure that any scheduled work has run to completion.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2382	* @wq: workqueue to flush
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2383	*
				2384	* Forces execution of the workqueue and blocks until its completion.
				2385	* This is typically used in driver shutdown handlers.
				2386	*
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2387	* We sleep until all works which were queued on entry have been handled,
				2388	* but we are not livelocked by new incoming ones.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2389	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2390	void flush_workqueue(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2391	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2392	struct wq_flusher this_flusher = {
				2393	.list = LIST_HEAD_INIT(this_flusher.list),
				2394	.flush_color = -1,
				2395	.done = COMPLETION_INITIALIZER_ONSTACK(this_flusher.done),
				2396	};
				2397	int next_color;
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	2398
Ingo Molnar	3295f0e	2008-08-11 10:30:30 +0200	[diff] [blame]	2399	lock_map_acquire(&wq->lockdep_map);
				2400	lock_map_release(&wq->lockdep_map);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2401
				2402	mutex_lock(&wq->flush_mutex);
				2403
				2404	/*
				2405	* Start-to-wait phase
				2406	*/
				2407	next_color = work_next_color(wq->work_color);
				2408
				2409	if (next_color != wq->flush_color) {
				2410	/*
				2411	* Color space is not full. The current work_color
				2412	* becomes our flush_color and work_color is advanced
				2413	* by one.
				2414	*/
				2415	BUG_ON(!list_empty(&wq->flusher_overflow));
				2416	this_flusher.flush_color = wq->work_color;
				2417	wq->work_color = next_color;
				2418
				2419	if (!wq->first_flusher) {
				2420	/* no flush in progress, become the first flusher */
				2421	BUG_ON(wq->flush_color != this_flusher.flush_color);
				2422
				2423	wq->first_flusher = &this_flusher;
				2424
				2425	if (!flush_workqueue_prep_cwqs(wq, wq->flush_color,
				2426	wq->work_color)) {
				2427	/* nothing to flush, done */
				2428	wq->flush_color = next_color;
				2429	wq->first_flusher = NULL;
				2430	goto out_unlock;
				2431	}
				2432	} else {
				2433	/* wait in queue */
				2434	BUG_ON(wq->flush_color == this_flusher.flush_color);
				2435	list_add_tail(&this_flusher.list, &wq->flusher_queue);
				2436	flush_workqueue_prep_cwqs(wq, -1, wq->work_color);
				2437	}
				2438	} else {
				2439	/*
				2440	* Oops, color space is full, wait on overflow queue.
				2441	* The next flush completion will assign us
				2442	* flush_color and transfer to flusher_queue.
				2443	*/
				2444	list_add_tail(&this_flusher.list, &wq->flusher_overflow);
				2445	}
				2446
				2447	mutex_unlock(&wq->flush_mutex);
				2448
				2449	wait_for_completion(&this_flusher.done);
				2450
				2451	/*
				2452	* Wake-up-and-cascade phase
				2453	*
				2454	* First flushers are responsible for cascading flushes and
				2455	* handling overflow. Non-first flushers can simply return.
				2456	*/
				2457	if (wq->first_flusher != &this_flusher)
				2458	return;
				2459
				2460	mutex_lock(&wq->flush_mutex);
				2461
Tejun Heo	4ce48b3	2010-07-02 10:03:51 +0200	[diff] [blame]	2462	/* we might have raced, check again with mutex held */
				2463	if (wq->first_flusher != &this_flusher)
				2464	goto out_unlock;
				2465
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2466	wq->first_flusher = NULL;
				2467
				2468	BUG_ON(!list_empty(&this_flusher.list));
				2469	BUG_ON(wq->flush_color != this_flusher.flush_color);
				2470
				2471	while (true) {
				2472	struct wq_flusher next, tmp;
				2473
				2474	/* complete all the flushers sharing the current flush color */
				2475	list_for_each_entry_safe(next, tmp, &wq->flusher_queue, list) {
				2476	if (next->flush_color != wq->flush_color)
				2477	break;
				2478	list_del_init(&next->list);
				2479	complete(&next->done);
				2480	}
				2481
				2482	BUG_ON(!list_empty(&wq->flusher_overflow) &&
				2483	wq->flush_color != work_next_color(wq->work_color));
				2484
				2485	/* this flush_color is finished, advance by one */
				2486	wq->flush_color = work_next_color(wq->flush_color);
				2487
				2488	/* one color has been freed, handle overflow queue */
				2489	if (!list_empty(&wq->flusher_overflow)) {
				2490	/*
				2491	* Assign the same color to all overflowed
				2492	* flushers, advance work_color and append to
				2493	* flusher_queue. This is the start-to-wait
				2494	* phase for these overflowed flushers.
				2495	*/
				2496	list_for_each_entry(tmp, &wq->flusher_overflow, list)
				2497	tmp->flush_color = wq->work_color;
				2498
				2499	wq->work_color = work_next_color(wq->work_color);
				2500
				2501	list_splice_tail_init(&wq->flusher_overflow,
				2502	&wq->flusher_queue);
				2503	flush_workqueue_prep_cwqs(wq, -1, wq->work_color);
				2504	}
				2505
				2506	if (list_empty(&wq->flusher_queue)) {
				2507	BUG_ON(wq->flush_color != wq->work_color);
				2508	break;
				2509	}
				2510
				2511	/*
				2512	* Need to flush more colors. Make the next flusher
				2513	* the new first flusher and arm cwqs.
				2514	*/
				2515	BUG_ON(wq->flush_color == wq->work_color);
				2516	BUG_ON(wq->flush_color != next->flush_color);
				2517
				2518	list_del_init(&next->list);
				2519	wq->first_flusher = next;
				2520
				2521	if (flush_workqueue_prep_cwqs(wq, wq->flush_color, -1))
				2522	break;
				2523
				2524	/*
				2525	* Meh... this color is already done, clear first
				2526	* flusher and repeat cascading.
				2527	*/
				2528	wq->first_flusher = NULL;
				2529	}
				2530
				2531	out_unlock:
				2532	mutex_unlock(&wq->flush_mutex);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2533	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2534	EXPORT_SYMBOL_GPL(flush_workqueue);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2535
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2536	/**
				2537	* drain_workqueue - drain a workqueue
				2538	* @wq: workqueue to drain
				2539	*
				2540	* Wait until the workqueue becomes empty. While draining is in progress,
				2541	* only chain queueing is allowed. IOW, only currently pending or running
				2542	* work items on @wq can queue further work items on it. @wq is flushed
				2543	* repeatedly until it becomes empty. The number of flushing is detemined
				2544	* by the depth of chaining and should be relatively short. Whine if it
				2545	* takes too long.
				2546	*/
				2547	void drain_workqueue(struct workqueue_struct *wq)
				2548	{
				2549	unsigned int flush_cnt = 0;
				2550	unsigned int cpu;
				2551
				2552	/*
				2553	* __queue_work() needs to test whether there are drainers, is much
				2554	* hotter than drain_workqueue() and already looks at @wq->flags.
				2555	* Use WQ_DRAINING so that queue doesn't have to check nr_drainers.
				2556	*/
				2557	spin_lock(&workqueue_lock);
				2558	if (!wq->nr_drainers++)
				2559	wq->flags \|= WQ_DRAINING;
				2560	spin_unlock(&workqueue_lock);
				2561	reflush:
				2562	flush_workqueue(wq);
				2563
				2564	for_each_cwq_cpu(cpu, wq) {
				2565	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2566	bool drained;
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2567
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2568	spin_lock_irq(&cwq->pool->gcwq->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2569	drained = !cwq->nr_active && list_empty(&cwq->delayed_works);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2570	spin_unlock_irq(&cwq->pool->gcwq->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2571
				2572	if (drained)
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2573	continue;
				2574
				2575	if (++flush_cnt == 10 \|\|
				2576	(flush_cnt % 100 == 0 && flush_cnt <= 1000))
				2577	pr_warning("workqueue %s: flush on destruction isn't complete after %u tries\n",
				2578	wq->name, flush_cnt);
				2579	goto reflush;
				2580	}
				2581
				2582	spin_lock(&workqueue_lock);
				2583	if (!--wq->nr_drainers)
				2584	wq->flags &= ~WQ_DRAINING;
				2585	spin_unlock(&workqueue_lock);
				2586	}
				2587	EXPORT_SYMBOL_GPL(drain_workqueue);
				2588
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2589	static bool start_flush_work(struct work_struct work, struct wq_barrier barr,
				2590	bool wait_executing)
				2591	{
				2592	struct worker *worker = NULL;
				2593	struct global_cwq *gcwq;
				2594	struct cpu_workqueue_struct *cwq;
				2595
				2596	might_sleep();
				2597	gcwq = get_work_gcwq(work);
				2598	if (!gcwq)
				2599	return false;
				2600
				2601	spin_lock_irq(&gcwq->lock);
				2602	if (!list_empty(&work->entry)) {
				2603	/*
				2604	* See the comment near try_to_grab_pending()->smp_rmb().
				2605	* If it was re-queued to a different gcwq under us, we
				2606	* are not going to wait.
				2607	*/
				2608	smp_rmb();
				2609	cwq = get_work_cwq(work);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2610	if (unlikely(!cwq \|\| gcwq != cwq->pool->gcwq))
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2611	goto already_gone;
				2612	} else if (wait_executing) {
				2613	worker = find_worker_executing_work(gcwq, work);
				2614	if (!worker)
				2615	goto already_gone;
				2616	cwq = worker->current_cwq;
				2617	} else
				2618	goto already_gone;
				2619
				2620	insert_wq_barrier(cwq, barr, work, worker);
				2621	spin_unlock_irq(&gcwq->lock);
				2622
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2623	/*
				2624	* If @max_active is 1 or rescuer is in use, flushing another work
				2625	* item on the same workqueue may lead to deadlock. Make sure the
				2626	* flusher is not running on the same workqueue by verifying write
				2627	* access.
				2628	*/
				2629	if (cwq->wq->saved_max_active == 1 \|\| cwq->wq->flags & WQ_RESCUER)
				2630	lock_map_acquire(&cwq->wq->lockdep_map);
				2631	else
				2632	lock_map_acquire_read(&cwq->wq->lockdep_map);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2633	lock_map_release(&cwq->wq->lockdep_map);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2634
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2635	return true;
				2636	already_gone:
				2637	spin_unlock_irq(&gcwq->lock);
				2638	return false;
				2639	}
				2640
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2641	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2642	* flush_work - wait for a work to finish executing the last queueing instance
				2643	* @work: the work to flush
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2644	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2645	* Wait until @work has finished execution. This function considers
				2646	* only the last queueing instance of @work. If @work has been
				2647	* enqueued across different CPUs on a non-reentrant workqueue or on
				2648	* multiple workqueues, @work might still be executing on return on
				2649	* some of the CPUs from earlier queueing.
Oleg Nesterov	a67da70	2008-07-25 01:47:52 -0700	[diff] [blame]	2650	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2651	* If @work was queued only on a non-reentrant, ordered or unbound
				2652	* workqueue, @work is guaranteed to be idle on return if it hasn't
				2653	* been requeued since flush started.
				2654	*
				2655	* RETURNS:
				2656	* %true if flush_work() waited for the work to finish execution,
				2657	* %false if it was already idle.
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2658	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2659	bool flush_work(struct work_struct *work)
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2660	{
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2661	struct wq_barrier barr;
				2662
Stephen Boyd	0976dfc	2012-04-20 17:28:50 -0700	[diff] [blame]	2663	lock_map_acquire(&work->lockdep_map);
				2664	lock_map_release(&work->lockdep_map);
				2665
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2666	if (start_flush_work(work, &barr, true)) {
				2667	wait_for_completion(&barr.done);
				2668	destroy_work_on_stack(&barr.work);
				2669	return true;
				2670	} else
				2671	return false;
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2672	}
				2673	EXPORT_SYMBOL_GPL(flush_work);
				2674
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2675	static bool wait_on_cpu_work(struct global_cwq gcwq, struct work_struct work)
				2676	{
				2677	struct wq_barrier barr;
				2678	struct worker *worker;
				2679
				2680	spin_lock_irq(&gcwq->lock);
				2681
				2682	worker = find_worker_executing_work(gcwq, work);
				2683	if (unlikely(worker))
				2684	insert_wq_barrier(worker->current_cwq, &barr, work, worker);
				2685
				2686	spin_unlock_irq(&gcwq->lock);
				2687
				2688	if (unlikely(worker)) {
				2689	wait_for_completion(&barr.done);
				2690	destroy_work_on_stack(&barr.work);
				2691	return true;
				2692	} else
				2693	return false;
				2694	}
				2695
				2696	static bool wait_on_work(struct work_struct *work)
				2697	{
				2698	bool ret = false;
				2699	int cpu;
				2700
				2701	might_sleep();
				2702
				2703	lock_map_acquire(&work->lockdep_map);
				2704	lock_map_release(&work->lockdep_map);
				2705
				2706	for_each_gcwq_cpu(cpu)
				2707	ret \|= wait_on_cpu_work(get_gcwq(cpu), work);
				2708	return ret;
				2709	}
				2710
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2711	/**
				2712	* flush_work_sync - wait until a work has finished execution
				2713	* @work: the work to flush
				2714	*
				2715	* Wait until @work has finished execution. On return, it's
				2716	* guaranteed that all queueing instances of @work which happened
				2717	* before this function is called are finished. In other words, if
				2718	* @work hasn't been requeued since this function was called, @work is
				2719	* guaranteed to be idle on return.
				2720	*
				2721	* RETURNS:
				2722	* %true if flush_work_sync() waited for the work to finish execution,
				2723	* %false if it was already idle.
				2724	*/
				2725	bool flush_work_sync(struct work_struct *work)
				2726	{
				2727	struct wq_barrier barr;
				2728	bool pending, waited;
				2729
				2730	/* we'll wait for executions separately, queue barr only if pending */
				2731	pending = start_flush_work(work, &barr, false);
				2732
				2733	/* wait for executions to finish */
				2734	waited = wait_on_work(work);
				2735
				2736	/* wait for the pending one */
				2737	if (pending) {
				2738	wait_for_completion(&barr.done);
				2739	destroy_work_on_stack(&barr.work);
				2740	}
				2741
				2742	return pending \|\| waited;
				2743	}
				2744	EXPORT_SYMBOL_GPL(flush_work_sync);
				2745
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2746	/*
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2747	* Upon a successful return (>= 0), the caller "owns" WORK_STRUCT_PENDING bit,
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2748	* so this work can't be re-armed in any way.
				2749	*/
				2750	static int try_to_grab_pending(struct work_struct *work)
				2751	{
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2752	struct global_cwq *gcwq;
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2753	int ret = -1;
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2754
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2755	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work)))
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2756	return 0;
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2757
				2758	/*
				2759	* The queueing is in progress, or it is already queued. Try to
				2760	* steal it from ->worklist without clearing WORK_STRUCT_PENDING.
				2761	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2762	gcwq = get_work_gcwq(work);
				2763	if (!gcwq)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2764	return ret;
				2765
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2766	spin_lock_irq(&gcwq->lock);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2767	if (!list_empty(&work->entry)) {
				2768	/*
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2769	* This work is queued, but perhaps we locked the wrong gcwq.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2770	* In that case we must see the new value after rmb(), see
				2771	* insert_work()->wmb().
				2772	*/
				2773	smp_rmb();
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2774	if (gcwq == get_work_gcwq(work)) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2775	debug_work_deactivate(work);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2776	list_del_init(&work->entry);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2777	cwq_dec_nr_in_flight(get_work_cwq(work),
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	2778	get_work_color(work),
				2779	*work_data_bits(work) & WORK_STRUCT_DELAYED);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2780	ret = 1;
				2781	}
				2782	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2783	spin_unlock_irq(&gcwq->lock);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2784
				2785	return ret;
				2786	}
				2787
/*
 * Common backend of cancel_work_sync() and cancel_delayed_work_sync().
 *
 * Repeatedly try to deactivate @timer (when one is given) or grab the
 * pending bit of @work, waiting for running instances of @work after
 * each attempt, until the attempt does not fail.  The work data is then
 * cleared.  The result of the last attempt is returned as a bool.
 */
static bool __cancel_work_timer(struct work_struct *work,
				struct timer_list *timer)
{
	int grabbed;

	do {
		if (timer && likely(del_timer(timer)))
			grabbed = 1;
		else
			grabbed = try_to_grab_pending(work);
		wait_on_work(work);
	} while (unlikely(grabbed < 0));

	clear_work_data(work);
	return grabbed;
}
				2803
/**
 * cancel_work_sync - cancel a work and wait for it to finish
 * @work: the work to cancel
 *
 * Cancel @work and wait for its execution to finish.  This works even
 * when the work re-queues itself or migrates to another workqueue.
 * Once this function returns, @work is guaranteed to be not pending
 * or executing on any CPU.
 *
 * Do not call cancel_work_sync(&delayed_work->work) on a delayed_work;
 * use cancel_delayed_work_sync() for those.
 *
 * The caller must ensure that the workqueue on which @work was last
 * queued can't be destroyed before this function returns.
 *
 * RETURNS:
 * %true if @work was pending, %false otherwise.
 */
bool cancel_work_sync(struct work_struct *work)
{
	/* plain work items have no timer to deactivate */
	return __cancel_work_timer(work, NULL);
}
EXPORT_SYMBOL_GPL(cancel_work_sync);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2827
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2828	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2829	* flush_delayed_work - wait for a dwork to finish executing the last queueing
				2830	* @dwork: the delayed work to flush
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2831	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2832	* Delayed timer is cancelled and the pending work is queued for
				2833	* immediate execution. Like flush_work(), this function only
				2834	* considers the last queueing instance of @dwork.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2835	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2836	* RETURNS:
				2837	* %true if flush_work() waited for the work to finish execution,
				2838	* %false if it was already idle.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2839	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2840	bool flush_delayed_work(struct delayed_work *dwork)
				2841	{
				2842	if (del_timer_sync(&dwork->timer))
				2843	__queue_work(raw_smp_processor_id(),
				2844	get_work_cwq(&dwork->work)->wq, &dwork->work);
				2845	return flush_work(&dwork->work);
				2846	}
				2847	EXPORT_SYMBOL(flush_delayed_work);
				2848
				2849	/**
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2850	* flush_delayed_work_sync - wait for a dwork to finish
				2851	* @dwork: the delayed work to flush
				2852	*
				2853	* Delayed timer is cancelled and the pending work is queued for
				2854	* execution immediately. Other than timer handling, its behavior
				2855	* is identical to flush_work_sync().
				2856	*
				2857	* RETURNS:
				2858	* %true if flush_work_sync() waited for the work to finish execution,
				2859	* %false if it was already idle.
				2860	*/
				2861	bool flush_delayed_work_sync(struct delayed_work *dwork)
				2862	{
				2863	if (del_timer_sync(&dwork->timer))
				2864	__queue_work(raw_smp_processor_id(),
				2865	get_work_cwq(&dwork->work)->wq, &dwork->work);
				2866	return flush_work_sync(&dwork->work);
				2867	}
				2868	EXPORT_SYMBOL(flush_delayed_work_sync);
				2869
				2870	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2871	* cancel_delayed_work_sync - cancel a delayed work and wait for it to finish
				2872	* @dwork: the delayed work cancel
				2873	*
				2874	* This is cancel_work_sync() for delayed works.
				2875	*
				2876	* RETURNS:
				2877	* %true if @dwork was pending, %false otherwise.
				2878	*/
				2879	bool cancel_delayed_work_sync(struct delayed_work *dwork)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2880	{
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2881	return __cancel_work_timer(&dwork->work, &dwork->timer);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2882	}
Oleg Nesterov	f5a421a	2007-07-15 23:41:44 -0700	[diff] [blame]	2883	EXPORT_SYMBOL(cancel_delayed_work_sync);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2884
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2885	/**
				2886	* schedule_work - put work task in global workqueue
				2887	* @work: job to be done
				2888	*
Bart Van Assche	5b0f437d	2009-07-30 19:00:53 +0200	[diff] [blame]	2889	* Returns zero if @work was already on the kernel-global workqueue and
				2890	* non-zero otherwise.
				2891	*
				2892	* This puts a job in the kernel-global workqueue if it was not already
				2893	* queued and leaves it in the same position on the kernel-global
				2894	* workqueue otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2895	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2896	int schedule_work(struct work_struct *work)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2897	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2898	return queue_work(system_wq, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2899	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2900	EXPORT_SYMBOL(schedule_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2901
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	2902	/*
				2903	* schedule_work_on - put work task on a specific cpu
				2904	* @cpu: cpu to put the work task on
				2905	* @work: job to be done
				2906	*
				2907	* This puts a job on a specific cpu
				2908	*/
				2909	int schedule_work_on(int cpu, struct work_struct *work)
				2910	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2911	return queue_work_on(cpu, system_wq, work);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	2912	}
				2913	EXPORT_SYMBOL(schedule_work_on);
				2914
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2915	/**
				2916	* schedule_delayed_work - put work task in global workqueue after delay
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2917	* @dwork: job to be done
				2918	* @delay: number of jiffies to wait or 0 for immediate execution
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2919	*
				2920	* After waiting for a given time this puts a job in the kernel-global
				2921	* workqueue.
				2922	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2923	int schedule_delayed_work(struct delayed_work *dwork,
Ingo Molnar	82f67cd	2007-02-16 01:28:13 -0800	[diff] [blame]	2924	unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2925	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2926	return queue_delayed_work(system_wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2927	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2928	EXPORT_SYMBOL(schedule_delayed_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2929
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2930	/**
				2931	* schedule_delayed_work_on - queue work in global workqueue on CPU after delay
				2932	* @cpu: cpu to use
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2933	* @dwork: job to be done
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2934	* @delay: number of jiffies to wait
				2935	*
				2936	* After waiting for a given time this puts a job in the kernel-global
				2937	* workqueue on the specified CPU.
				2938	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2939	int schedule_delayed_work_on(int cpu,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2940	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2941	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2942	return queue_delayed_work_on(cpu, system_wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2943	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2944	EXPORT_SYMBOL(schedule_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2945
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2946	/**
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2947	* schedule_on_each_cpu - execute a function synchronously on each online CPU
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2948	* @func: the function to call
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2949	*
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2950	* schedule_on_each_cpu() executes @func on each online CPU using the
				2951	* system workqueue and blocks until all CPUs have completed.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2952	* schedule_on_each_cpu() is very slow.
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2953	*
				2954	* RETURNS:
				2955	* 0 on success, -errno on failure.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2956	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2957	int schedule_on_each_cpu(work_func_t func)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2958	{
				2959	int cpu;
Namhyung Kim	38f5156	2010-08-08 14:24:09 +0200	[diff] [blame]	2960	struct work_struct __percpu *works;
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2961
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2962	works = alloc_percpu(struct work_struct);
				2963	if (!works)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2964	return -ENOMEM;
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2965
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	2966	get_online_cpus();
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2967
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2968	for_each_online_cpu(cpu) {
Ingo Molnar	9bfb183	2006-12-18 20:05:09 +0100	[diff] [blame]	2969	struct work_struct *work = per_cpu_ptr(works, cpu);
				2970
				2971	INIT_WORK(work, func);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2972	schedule_work_on(cpu, work);
Andi Kleen	65a6446	2009-10-14 06:22:47 +0200	[diff] [blame]	2973	}
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2974
				2975	for_each_online_cpu(cpu)
				2976	flush_work(per_cpu_ptr(works, cpu));
				2977
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	2978	put_online_cpus();
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2979	free_percpu(works);
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2980	return 0;
				2981	}
				2982
Alan Stern	eef6a7d	2010-02-12 17:39:21 +0900	[diff] [blame]	2983	/**
				2984	* flush_scheduled_work - ensure that any scheduled work has run to completion.
				2985	*
				2986	* Forces execution of the kernel-global workqueue and blocks until its
				2987	* completion.
				2988	*
				2989	* Think twice before calling this function! It's very easy to get into
				2990	* trouble if you don't take great care. Either of the following situations
				2991	* will lead to deadlock:
				2992	*
				2993	* One of the work items currently on the workqueue needs to acquire
				2994	* a lock held by your code or its caller.
				2995	*
				2996	* Your code is running in the context of a work routine.
				2997	*
				2998	* They will be detected by lockdep when they occur, but the first might not
				2999	* occur very often. It depends on what work items are on the workqueue and
				3000	* what locks they need, which you have no control over.
				3001	*
				3002	* In most situations flushing the entire workqueue is overkill; you merely
				3003	* need to know that a particular work item isn't queued and isn't running.
				3004	* In such cases you should use cancel_delayed_work_sync() or
				3005	* cancel_work_sync() instead.
				3006	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3007	void flush_scheduled_work(void)
				3008	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3009	flush_workqueue(system_wq);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3010	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	3011	EXPORT_SYMBOL(flush_scheduled_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3012
				3013	/**
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3014	* execute_in_process_context - reliably execute the routine with user context
				3015	* @fn: the function to execute
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3016	* @ew: guaranteed storage for the execute work structure (must
				3017	* be available when the work executes)
				3018	*
				3019	* Executes the function immediately if process context is available,
				3020	* otherwise schedules the function for delayed execution.
				3021	*
				3022	* Returns: 0 - function was executed
				3023	* 1 - function was scheduled for execution
				3024	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3025	int execute_in_process_context(work_func_t fn, struct execute_work *ew)
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3026	{
				3027	if (!in_interrupt()) {
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3028	fn(&ew->work);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3029	return 0;
				3030	}
				3031
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3032	INIT_WORK(&ew->work, fn);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3033	schedule_work(&ew->work);
				3034
				3035	return 1;
				3036	}
				3037	EXPORT_SYMBOL_GPL(execute_in_process_context);
				3038
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3039	int keventd_up(void)
				3040	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3041	return system_wq != NULL;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3042	}
				3043
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3044	static int alloc_cwqs(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3045	{
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3046	/*
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	3047	* cwqs are forced aligned according to WORK_STRUCT_FLAG_BITS.
				3048	* Make sure that the alignment isn't lower than that of
				3049	* unsigned long long.
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3050	*/
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	3051	const size_t size = sizeof(struct cpu_workqueue_struct);
				3052	const size_t align = max_t(size_t, 1 << WORK_STRUCT_FLAG_BITS,
				3053	__alignof__(unsigned long long));
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3054
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	3055	if (!(wq->flags & WQ_UNBOUND))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3056	wq->cpu_wq.pcpu = __alloc_percpu(size, align);
Tejun Heo	931ac77	2010-07-20 11:07:48 +0200	[diff] [blame]	3057	else {
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3058	void *ptr;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	3059
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3060	/*
				3061	* Allocate enough room to align cwq and put an extra
				3062	* pointer at the end pointing back to the originally
				3063	* allocated pointer which will be used for free.
				3064	*/
				3065	ptr = kzalloc(size + align + sizeof(void *), GFP_KERNEL);
				3066	if (ptr) {
				3067	wq->cpu_wq.single = PTR_ALIGN(ptr, align);
				3068	(void *)(wq->cpu_wq.single + 1) = ptr;
				3069	}
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3070	}
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3071
Tejun Heo	0415b00d1	2011-03-24 18:50:09 +0100	[diff] [blame]	3072	/* just in case, make sure it's actually aligned */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3073	BUG_ON(!IS_ALIGNED(wq->cpu_wq.v, align));
				3074	return wq->cpu_wq.v ? 0 : -ENOMEM;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3075	}
				3076
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3077	static void free_cwqs(struct workqueue_struct *wq)
Oleg Nesterov	06ba38a	2007-05-09 02:34:15 -0700	[diff] [blame]	3078	{
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	3079	if (!(wq->flags & WQ_UNBOUND))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3080	free_percpu(wq->cpu_wq.pcpu);
				3081	else if (wq->cpu_wq.single) {
				3082	/* the pointer to free is stored right after the cwq */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3083	kfree((void *)(wq->cpu_wq.single + 1));
Oleg Nesterov	06ba38a	2007-05-09 02:34:15 -0700	[diff] [blame]	3084	}
				3085	}
				3086
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3087	static int wq_clamp_max_active(int max_active, unsigned int flags,
				3088	const char *name)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3089	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3090	int lim = flags & WQ_UNBOUND ? WQ_UNBOUND_MAX_ACTIVE : WQ_MAX_ACTIVE;
				3091
				3092	if (max_active < 1 \|\| max_active > lim)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3093	printk(KERN_WARNING "workqueue: max_active %d requested for %s "
				3094	"is out of range, clamping between %d and %d\n",
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3095	max_active, name, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3096
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3097	return clamp_val(max_active, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3098	}
				3099
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3100	struct workqueue_struct __alloc_workqueue_key(const char fmt,
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3101	unsigned int flags,
				3102	int max_active,
				3103	struct lock_class_key *key,
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3104	const char *lock_name, ...)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3105	{
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3106	va_list args, args1;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3107	struct workqueue_struct *wq;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3108	unsigned int cpu;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3109	size_t namelen;
				3110
				3111	/* determine namelen, allocate wq and format name */
				3112	va_start(args, lock_name);
				3113	va_copy(args1, args);
				3114	namelen = vsnprintf(NULL, 0, fmt, args) + 1;
				3115
				3116	wq = kzalloc(sizeof(*wq) + namelen, GFP_KERNEL);
				3117	if (!wq)
				3118	goto err;
				3119
				3120	vsnprintf(wq->name, namelen, fmt, args1);
				3121	va_end(args);
				3122	va_end(args1);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3123
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3124	/*
Tejun Heo	6370a6a	2010-10-11 15:12:27 +0200	[diff] [blame]	3125	* Workqueues which may be used during memory reclaim should
				3126	* have a rescuer to guarantee forward progress.
				3127	*/
				3128	if (flags & WQ_MEM_RECLAIM)
				3129	flags \|= WQ_RESCUER;
				3130
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3131	max_active = max_active ?: WQ_DFL_ACTIVE;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3132	max_active = wq_clamp_max_active(max_active, flags, wq->name);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3133
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3134	/* init wq */
Tejun Heo	97e37d7	2010-06-29 10:07:10 +0200	[diff] [blame]	3135	wq->flags = flags;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3136	wq->saved_max_active = max_active;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3137	mutex_init(&wq->flush_mutex);
				3138	atomic_set(&wq->nr_cwqs_to_flush, 0);
				3139	INIT_LIST_HEAD(&wq->flusher_queue);
				3140	INIT_LIST_HEAD(&wq->flusher_overflow);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3141
Johannes Berg	eb13ba8	2008-01-16 09:51:58 +0100	[diff] [blame]	3142	lockdep_init_map(&wq->lockdep_map, lock_name, key, 0);
Oleg Nesterov	cce1a16	2007-05-09 02:34:13 -0700	[diff] [blame]	3143	INIT_LIST_HEAD(&wq->list);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3144
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3145	if (alloc_cwqs(wq) < 0)
				3146	goto err;
				3147
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3148	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3149	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3150	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	3151	int pool_idx = (bool)(flags & WQ_HIGHPRI);
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3152
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	3153	BUG_ON((unsigned long)cwq & WORK_STRUCT_FLAG_MASK);
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	3154	cwq->pool = &gcwq->pools[pool_idx];
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3155	cwq->wq = wq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3156	cwq->flush_color = -1;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3157	cwq->max_active = max_active;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3158	INIT_LIST_HEAD(&cwq->delayed_works);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3159	}
				3160
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3161	if (flags & WQ_RESCUER) {
				3162	struct worker *rescuer;
				3163
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3164	if (!alloc_mayday_mask(&wq->mayday_mask, GFP_KERNEL))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3165	goto err;
				3166
				3167	wq->rescuer = rescuer = alloc_worker();
				3168	if (!rescuer)
				3169	goto err;
				3170
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3171	rescuer->task = kthread_create(rescuer_thread, wq, "%s",
				3172	wq->name);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3173	if (IS_ERR(rescuer->task))
				3174	goto err;
				3175
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3176	rescuer->task->flags \|= PF_THREAD_BOUND;
				3177	wake_up_process(rescuer->task);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3178	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3179
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3180	/*
				3181	* workqueue_lock protects global freeze state and workqueues
				3182	* list. Grab it, set max_active accordingly and add the new
				3183	* workqueue to workqueues list.
				3184	*/
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3185	spin_lock(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3186
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3187	if (workqueue_freezing && wq->flags & WQ_FREEZABLE)
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3188	for_each_cwq_cpu(cpu, wq)
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3189	get_cwq(cpu, wq)->max_active = 0;
				3190
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3191	list_add(&wq->list, &workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3192
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3193	spin_unlock(&workqueue_lock);
				3194
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3195	return wq;
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3196	err:
				3197	if (wq) {
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3198	free_cwqs(wq);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3199	free_mayday_mask(wq->mayday_mask);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3200	kfree(wq->rescuer);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3201	kfree(wq);
				3202	}
				3203	return NULL;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3204	}
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3205	EXPORT_SYMBOL_GPL(__alloc_workqueue_key);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3206
				3207	/**
				3208	* destroy_workqueue - safely terminate a workqueue
				3209	* @wq: target workqueue
				3210	*
				3211	* Safely destroy a workqueue. All work currently pending will be done first.
				3212	*/
				3213	void destroy_workqueue(struct workqueue_struct *wq)
				3214	{
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3215	unsigned int cpu;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3216
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	3217	/* drain it before proceeding with destruction */
				3218	drain_workqueue(wq);
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	3219
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3220	/*
				3221	* wq list is used to freeze wq, remove from list after
				3222	* flushing is complete in case freeze races us.
				3223	*/
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3224	spin_lock(&workqueue_lock);
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	3225	list_del(&wq->list);
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3226	spin_unlock(&workqueue_lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3227
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3228	/* sanity check */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3229	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3230	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3231	int i;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3232
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3233	for (i = 0; i < WORK_NR_COLORS; i++)
				3234	BUG_ON(cwq->nr_in_flight[i]);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3235	BUG_ON(cwq->nr_active);
				3236	BUG_ON(!list_empty(&cwq->delayed_works));
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3237	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3238
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3239	if (wq->flags & WQ_RESCUER) {
				3240	kthread_stop(wq->rescuer->task);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3241	free_mayday_mask(wq->mayday_mask);
Xiaotian Feng	8d9df9f	2010-08-16 09:54:28 +0200	[diff] [blame]	3242	kfree(wq->rescuer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3243	}
				3244
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3245	free_cwqs(wq);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3246	kfree(wq);
				3247	}
				3248	EXPORT_SYMBOL_GPL(destroy_workqueue);
				3249
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3250	/**
				3251	* workqueue_set_max_active - adjust max_active of a workqueue
				3252	* @wq: target workqueue
				3253	* @max_active: new max_active value.
				3254	*
				3255	* Set max_active of @wq to @max_active.
				3256	*
				3257	* CONTEXT:
				3258	* Don't call from IRQ context.
				3259	*/
				3260	void workqueue_set_max_active(struct workqueue_struct *wq, int max_active)
				3261	{
				3262	unsigned int cpu;
				3263
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3264	max_active = wq_clamp_max_active(max_active, wq->flags, wq->name);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3265
				3266	spin_lock(&workqueue_lock);
				3267
				3268	wq->saved_max_active = max_active;
				3269
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3270	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3271	struct global_cwq *gcwq = get_gcwq(cpu);
				3272
				3273	spin_lock_irq(&gcwq->lock);
				3274
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3275	if (!(wq->flags & WQ_FREEZABLE) \|\|
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3276	!(gcwq->flags & GCWQ_FREEZING))
				3277	get_cwq(gcwq->cpu, wq)->max_active = max_active;
				3278
				3279	spin_unlock_irq(&gcwq->lock);
				3280	}
				3281
				3282	spin_unlock(&workqueue_lock);
				3283	}
				3284	EXPORT_SYMBOL_GPL(workqueue_set_max_active);
				3285
				3286	/**
				3287	* workqueue_congested - test whether a workqueue is congested
				3288	* @cpu: CPU in question
				3289	* @wq: target workqueue
				3290	*
				3291	* Test whether @wq's cpu workqueue for @cpu is congested. There is
				3292	* no synchronization around this function and the test result is
				3293	* unreliable and only useful as advisory hints or for debugging.
				3294	*
				3295	* RETURNS:
				3296	* %true if congested, %false otherwise.
				3297	*/
				3298	bool workqueue_congested(unsigned int cpu, struct workqueue_struct *wq)
				3299	{
				3300	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3301
				3302	return !list_empty(&cwq->delayed_works);
				3303	}
				3304	EXPORT_SYMBOL_GPL(workqueue_congested);
				3305
				3306	/**
				3307	* work_cpu - return the last known associated cpu for @work
				3308	* @work: the work of interest
				3309	*
				3310	* RETURNS:
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3311	* CPU number if @work was ever queued. WORK_CPU_NONE otherwise.
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3312	*/
				3313	unsigned int work_cpu(struct work_struct *work)
				3314	{
				3315	struct global_cwq *gcwq = get_work_gcwq(work);
				3316
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3317	return gcwq ? gcwq->cpu : WORK_CPU_NONE;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3318	}
				3319	EXPORT_SYMBOL_GPL(work_cpu);
				3320
				3321	/**
				3322	* work_busy - test whether a work is currently pending or running
				3323	* @work: the work to be tested
				3324	*
				3325	* Test whether @work is currently pending or running. There is no
				3326	* synchronization around this function and the test result is
				3327	* unreliable and only useful as advisory hints or for debugging.
				3328	* Especially for reentrant wqs, the pending state might hide the
				3329	* running state.
				3330	*
				3331	* RETURNS:
				3332	* OR'd bitmask of WORK_BUSY_* bits.
				3333	*/
				3334	unsigned int work_busy(struct work_struct *work)
				3335	{
				3336	struct global_cwq *gcwq = get_work_gcwq(work);
				3337	unsigned long flags;
				3338	unsigned int ret = 0;
				3339
				3340	if (!gcwq)
				3341	return false;
				3342
				3343	spin_lock_irqsave(&gcwq->lock, flags);
				3344
				3345	if (work_pending(work))
				3346	ret \|= WORK_BUSY_PENDING;
				3347	if (find_worker_executing_work(gcwq, work))
				3348	ret \|= WORK_BUSY_RUNNING;
				3349
				3350	spin_unlock_irqrestore(&gcwq->lock, flags);
				3351
				3352	return ret;
				3353	}
				3354	EXPORT_SYMBOL_GPL(work_busy);
				3355
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3356	/*
				3357	* CPU hotplug.
				3358	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3359	* There are two challenges in supporting CPU hotplug. Firstly, there
				3360	* are a lot of assumptions on strong associations among work, cwq and
				3361	* gcwq which make migrating pending and scheduled works very
				3362	* difficult to implement without impacting hot paths. Secondly,
				3363	* gcwqs serve mix of short, long and very long running works making
				3364	* blocked draining impractical.
				3365	*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	3366	* This is solved by allowing a gcwq to be disassociated from the CPU
				3367	* running as an unbound one and allowing it to be reattached later if the
				3368	* cpu comes back online.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3369	*/
				3370
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	3371	/* claim manager positions of all pools */
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3372	static void gcwq_claim_management_and_lock(struct global_cwq *gcwq)
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	3373	{
				3374	struct worker_pool *pool;
				3375
				3376	for_each_worker_pool(pool, gcwq)
				3377	mutex_lock_nested(&pool->manager_mutex, pool - gcwq->pools);
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3378	spin_lock_irq(&gcwq->lock);
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	3379	}
				3380
				3381	/* release manager positions */
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3382	static void gcwq_release_management_and_unlock(struct global_cwq *gcwq)
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	3383	{
				3384	struct worker_pool *pool;
				3385
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3386	spin_unlock_irq(&gcwq->lock);
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	3387	for_each_worker_pool(pool, gcwq)
				3388	mutex_unlock(&pool->manager_mutex);
				3389	}
				3390
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	3391	static void gcwq_unbind_fn(struct work_struct *work)
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3392	{
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	3393	struct global_cwq *gcwq = get_gcwq(smp_processor_id());
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3394	struct worker_pool *pool;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3395	struct worker *worker;
				3396	struct hlist_node *pos;
				3397	int i;
				3398
				3399	BUG_ON(gcwq->cpu != smp_processor_id());
				3400
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3401	gcwq_claim_management_and_lock(gcwq);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3402
Tejun Heo	f2d5a0e	2012-07-17 12:39:26 -0700	[diff] [blame]	3403	/*
				3404	* We've claimed all manager positions. Make all workers unbound
				3405	* and set DISASSOCIATED. Before this, all workers except for the
				3406	* ones which are still executing works from before the last CPU
				3407	* down must be on the cpu. After this, they may become diasporas.
				3408	*/
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	3409	for_each_worker_pool(pool, gcwq)
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3410	list_for_each_entry(worker, &pool->idle_list, entry)
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	3411	worker->flags \|= WORKER_UNBOUND;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3412
				3413	for_each_busy_worker(worker, i, pos, gcwq)
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	3414	worker->flags \|= WORKER_UNBOUND;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3415
Tejun Heo	f2d5a0e	2012-07-17 12:39:26 -0700	[diff] [blame]	3416	gcwq->flags \|= GCWQ_DISASSOCIATED;
				3417
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3418	gcwq_release_management_and_unlock(gcwq);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3419
				3420	/*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	3421	* Call schedule() so that we cross rq->lock and thus can guarantee
				3422	* sched callbacks see the %WORKER_UNBOUND flag. This is necessary
				3423	* as scheduler callbacks may be invoked from other cpus.
				3424	*/
				3425	schedule();
				3426
				3427	/*
				3428	* Sched callbacks are disabled now. Zap nr_running. After this,
				3429	* nr_running stays zero and need_more_worker() and keep_working()
				3430	* are always true as long as the worklist is not empty. @gcwq now
				3431	* behaves as unbound (in terms of concurrency management) gcwq
				3432	* which is served by workers tied to the CPU.
				3433	*
				3434	* On return from this function, the current worker would trigger
				3435	* unbound chain execution of pending work items if other workers
				3436	* didn't already.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3437	*/
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3438	for_each_worker_pool(pool, gcwq)
				3439	atomic_set(get_pool_nr_running(pool), 0);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3440	}
				3441
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3442	/*
				3443	* Workqueues should be brought up before normal priority CPU notifiers.
				3444	* This will be registered high priority CPU notifier.
				3445	*/
				3446	static int __devinit workqueue_cpu_up_callback(struct notifier_block *nfb,
				3447	unsigned long action,
				3448	void *hcpu)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3449	{
				3450	unsigned int cpu = (unsigned long)hcpu;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3451	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3452	struct worker_pool *pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3453
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3454	switch (action & ~CPU_TASKS_FROZEN) {
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3455	case CPU_UP_PREPARE:
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3456	for_each_worker_pool(pool, gcwq) {
Tejun Heo	3ce6337	2012-07-17 12:39:27 -0700	[diff] [blame]	3457	struct worker *worker;
				3458
				3459	if (pool->nr_workers)
				3460	continue;
				3461
				3462	worker = create_worker(pool);
				3463	if (!worker)
				3464	return NOTIFY_BAD;
				3465
				3466	spin_lock_irq(&gcwq->lock);
				3467	start_worker(worker);
				3468	spin_unlock_irq(&gcwq->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3469	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3470	break;
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	3471
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	3472	case CPU_DOWN_FAILED:
				3473	case CPU_ONLINE:
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3474	gcwq_claim_management_and_lock(gcwq);
				3475	gcwq->flags &= ~GCWQ_DISASSOCIATED;
				3476	rebind_workers(gcwq);
				3477	gcwq_release_management_and_unlock(gcwq);
				3478	break;
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	3479	}
				3480	return NOTIFY_OK;
				3481	}
				3482
				3483	/*
				3484	* Workqueues should be brought down after normal priority CPU notifiers.
				3485	* This will be registered as low priority CPU notifier.
				3486	*/
				3487	static int __devinit workqueue_cpu_down_callback(struct notifier_block *nfb,
				3488	unsigned long action,
				3489	void *hcpu)
				3490	{
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3491	unsigned int cpu = (unsigned long)hcpu;
				3492	struct work_struct unbind_work;
				3493
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	3494	switch (action & ~CPU_TASKS_FROZEN) {
				3495	case CPU_DOWN_PREPARE:
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	3496	/* unbinding should happen on the local CPU */
				3497	INIT_WORK_ONSTACK(&unbind_work, gcwq_unbind_fn);
				3498	schedule_work_on(cpu, &unbind_work);
				3499	flush_work(&unbind_work);
				3500	break;
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	3501	}
				3502	return NOTIFY_OK;
				3503	}
				3504
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3505	#ifdef CONFIG_SMP
Rusty Russell	8ccad40	2009-01-16 15:31:15 -0800	[diff] [blame]	3506
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3507	struct work_for_cpu {
Andrew Morton	6b44003e	2009-04-09 09:50:37 -0600	[diff] [blame]	3508	struct completion completion;
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3509	long (fn)(void );
				3510	void *arg;
				3511	long ret;
				3512	};
				3513
Andrew Morton	6b44003e	2009-04-09 09:50:37 -0600	[diff] [blame]	3514	static int do_work_for_cpu(void *_wfc)
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3515	{
Andrew Morton	6b44003e	2009-04-09 09:50:37 -0600	[diff] [blame]	3516	struct work_for_cpu *wfc = _wfc;
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3517	wfc->ret = wfc->fn(wfc->arg);
Andrew Morton	6b44003e	2009-04-09 09:50:37 -0600	[diff] [blame]	3518	complete(&wfc->completion);
				3519	return 0;
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3520	}
				3521
				3522	/**
				3523	* work_on_cpu - run a function in user context on a particular cpu
				3524	* @cpu: the cpu to run on
				3525	* @fn: the function to run
				3526	* @arg: the function arg
				3527	*
Rusty Russell	31ad908	2009-01-16 15:31:15 -0800	[diff] [blame]	3528	* This will return the value @fn returns.
				3529	* It is up to the caller to ensure that the cpu doesn't go offline.
Andrew Morton	6b44003e	2009-04-09 09:50:37 -0600	[diff] [blame]	3530	* The caller must not hold any locks which would prevent @fn from completing.
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3531	*/
				3532	long work_on_cpu(unsigned int cpu, long (fn)(void ), void *arg)
				3533	{
Andrew Morton	6b44003e	2009-04-09 09:50:37 -0600	[diff] [blame]	3534	struct task_struct *sub_thread;
				3535	struct work_for_cpu wfc = {
				3536	.completion = COMPLETION_INITIALIZER_ONSTACK(wfc.completion),
				3537	.fn = fn,
				3538	.arg = arg,
				3539	};
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3540
Andrew Morton	6b44003e	2009-04-09 09:50:37 -0600	[diff] [blame]	3541	sub_thread = kthread_create(do_work_for_cpu, &wfc, "work_for_cpu");
				3542	if (IS_ERR(sub_thread))
				3543	return PTR_ERR(sub_thread);
				3544	kthread_bind(sub_thread, cpu);
				3545	wake_up_process(sub_thread);
				3546	wait_for_completion(&wfc.completion);
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3547	return wfc.ret;
				3548	}
				3549	EXPORT_SYMBOL_GPL(work_on_cpu);
				3550	#endif /* CONFIG_SMP */
				3551
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3552	#ifdef CONFIG_FREEZER
Rusty Russell	e7577c5	2009-01-01 10:12:25 +1030	[diff] [blame]	3553
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3554	/**
				3555	* freeze_workqueues_begin - begin freezing workqueues
				3556	*
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3557	* Start freezing workqueues. After this function returns, all freezable
				3558	* workqueues will queue new works to their frozen_works list instead of
				3559	* gcwq->worklist.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3560	*
				3561	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3562	* Grabs and releases workqueue_lock and gcwq->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3563	*/
				3564	void freeze_workqueues_begin(void)
				3565	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3566	unsigned int cpu;
				3567
				3568	spin_lock(&workqueue_lock);
				3569
				3570	BUG_ON(workqueue_freezing);
				3571	workqueue_freezing = true;
				3572
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3573	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3574	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3575	struct workqueue_struct *wq;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3576
				3577	spin_lock_irq(&gcwq->lock);
				3578
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3579	BUG_ON(gcwq->flags & GCWQ_FREEZING);
				3580	gcwq->flags \|= GCWQ_FREEZING;
				3581
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3582	list_for_each_entry(wq, &workqueues, list) {
				3583	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3584
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3585	if (cwq && wq->flags & WQ_FREEZABLE)
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3586	cwq->max_active = 0;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3587	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3588
				3589	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3590	}
				3591
				3592	spin_unlock(&workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3593	}
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3594
				3595	/**
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3596	* freeze_workqueues_busy - are freezable workqueues still busy?
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3597	*
				3598	* Check whether freezing is complete. This function must be called
				3599	* between freeze_workqueues_begin() and thaw_workqueues().
				3600	*
				3601	* CONTEXT:
				3602	* Grabs and releases workqueue_lock.
				3603	*
				3604	* RETURNS:
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3605	* %true if some freezable workqueues are still busy. %false if freezing
				3606	* is complete.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3607	*/
				3608	bool freeze_workqueues_busy(void)
				3609	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3610	unsigned int cpu;
				3611	bool busy = false;
				3612
				3613	spin_lock(&workqueue_lock);
				3614
				3615	BUG_ON(!workqueue_freezing);
				3616
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3617	for_each_gcwq_cpu(cpu) {
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3618	struct workqueue_struct *wq;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3619	/*
				3620	* nr_active is monotonically decreasing. It's safe
				3621	* to peek without lock.
				3622	*/
				3623	list_for_each_entry(wq, &workqueues, list) {
				3624	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3625
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3626	if (!cwq \|\| !(wq->flags & WQ_FREEZABLE))
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3627	continue;
				3628
				3629	BUG_ON(cwq->nr_active < 0);
				3630	if (cwq->nr_active) {
				3631	busy = true;
				3632	goto out_unlock;
				3633	}
				3634	}
				3635	}
				3636	out_unlock:
				3637	spin_unlock(&workqueue_lock);
				3638	return busy;
				3639	}
				3640
				3641	/**
				3642	* thaw_workqueues - thaw workqueues
				3643	*
				3644	* Thaw workqueues. Normal queueing is restored and all collected
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	3645	* frozen works are transferred to their respective gcwq worklists.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3646	*
				3647	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3648	* Grabs and releases workqueue_lock and gcwq->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3649	*/
				3650	void thaw_workqueues(void)
				3651	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3652	unsigned int cpu;
				3653
				3654	spin_lock(&workqueue_lock);
				3655
				3656	if (!workqueue_freezing)
				3657	goto out_unlock;
				3658
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3659	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3660	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3661	struct worker_pool *pool;
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3662	struct workqueue_struct *wq;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3663
				3664	spin_lock_irq(&gcwq->lock);
				3665
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3666	BUG_ON(!(gcwq->flags & GCWQ_FREEZING));
				3667	gcwq->flags &= ~GCWQ_FREEZING;
				3668
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3669	list_for_each_entry(wq, &workqueues, list) {
				3670	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3671
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3672	if (!cwq \|\| !(wq->flags & WQ_FREEZABLE))
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3673	continue;
				3674
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3675	/* restore max_active and repopulate worklist */
				3676	cwq->max_active = wq->saved_max_active;
				3677
				3678	while (!list_empty(&cwq->delayed_works) &&
				3679	cwq->nr_active < cwq->max_active)
				3680	cwq_activate_first_delayed(cwq);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3681	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3682
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3683	for_each_worker_pool(pool, gcwq)
				3684	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3685
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3686	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3687	}
				3688
				3689	workqueue_freezing = false;
				3690	out_unlock:
				3691	spin_unlock(&workqueue_lock);
				3692	}
				3693	#endif /* CONFIG_FREEZER */
				3694
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3695	static int __init init_workqueues(void)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3696	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3697	unsigned int cpu;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3698	int i;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3699
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	3700	cpu_notifier(workqueue_cpu_up_callback, CPU_PRI_WORKQUEUE_UP);
				3701	cpu_notifier(workqueue_cpu_down_callback, CPU_PRI_WORKQUEUE_DOWN);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3702
				3703	/* initialize gcwqs */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3704	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3705	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3706	struct worker_pool *pool;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3707
				3708	spin_lock_init(&gcwq->lock);
				3709	gcwq->cpu = cpu;
Tejun Heo	477a3c3	2010-08-31 10:54:35 +0200	[diff] [blame]	3710	gcwq->flags \|= GCWQ_DISASSOCIATED;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3711
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3712	for (i = 0; i < BUSY_WORKER_HASH_SIZE; i++)
				3713	INIT_HLIST_HEAD(&gcwq->busy_hash[i]);
				3714
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3715	for_each_worker_pool(pool, gcwq) {
				3716	pool->gcwq = gcwq;
				3717	INIT_LIST_HEAD(&pool->worklist);
				3718	INIT_LIST_HEAD(&pool->idle_list);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3719
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3720	init_timer_deferrable(&pool->idle_timer);
				3721	pool->idle_timer.function = idle_worker_timeout;
				3722	pool->idle_timer.data = (unsigned long)pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3723
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3724	setup_timer(&pool->mayday_timer, gcwq_mayday_timeout,
				3725	(unsigned long)pool);
				3726
Tejun Heo	6037315	2012-07-17 12:39:27 -0700	[diff] [blame]	3727	mutex_init(&pool->manager_mutex);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3728	ida_init(&pool->worker_ida);
				3729	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3730
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	3731	init_waitqueue_head(&gcwq->rebind_hold);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3732	}
				3733
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3734	/* create the initial worker */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3735	for_each_online_gcwq_cpu(cpu) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3736	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3737	struct worker_pool *pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3738
Tejun Heo	477a3c3	2010-08-31 10:54:35 +0200	[diff] [blame]	3739	if (cpu != WORK_CPU_UNBOUND)
				3740	gcwq->flags &= ~GCWQ_DISASSOCIATED;
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3741
				3742	for_each_worker_pool(pool, gcwq) {
				3743	struct worker *worker;
				3744
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	3745	worker = create_worker(pool);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	3746	BUG_ON(!worker);
				3747	spin_lock_irq(&gcwq->lock);
				3748	start_worker(worker);
				3749	spin_unlock_irq(&gcwq->lock);
				3750	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3751	}
				3752
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3753	system_wq = alloc_workqueue("events", 0, 0);
				3754	system_long_wq = alloc_workqueue("events_long", 0, 0);
				3755	system_nrt_wq = alloc_workqueue("events_nrt", WQ_NON_REENTRANT, 0);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3756	system_unbound_wq = alloc_workqueue("events_unbound", WQ_UNBOUND,
				3757	WQ_UNBOUND_MAX_ACTIVE);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	3758	system_freezable_wq = alloc_workqueue("events_freezable",
				3759	WQ_FREEZABLE, 0);
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	3760	system_nrt_freezable_wq = alloc_workqueue("events_nrt_freezable",
				3761	WQ_NON_REENTRANT \| WQ_FREEZABLE, 0);
Hitoshi Mitake	e5cba24	2010-11-26 12:06:44 +0100	[diff] [blame]	3762	BUG_ON(!system_wq \|\| !system_long_wq \|\| !system_nrt_wq \|\|
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	3763	!system_unbound_wq \|\| !system_freezable_wq \|\|
				3764	!system_nrt_freezable_wq);
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3765	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3766	}
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3767	early_initcall(init_workqueues);