Blame - kernel/workqueue.c - android_kernel_htc_msm8960

blob: b5779df579f0581c16d4a60a11a5d78d81f37cf4 [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	2	* kernel/workqueue.c - generic async execution with shared worker pool
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	4	* Copyright (C) 2002 Ingo Molnar
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	5	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	6	* Derived from the taskqueue/keventd code by:
				7	* David Woodhouse <dwmw2@infradead.org>
				8	* Andrew Morton
				9	* Kai Petzke <wpp@marie.physik.tu-berlin.de>
				10	* Theodore Ts'o <tytso@mit.edu>
Christoph Lameter	89ada67	2005-10-30 15:01:59 -0800	[diff] [blame]	11	*
Christoph Lameter	cde5353	2008-07-04 09:59:22 -0700	[diff] [blame]	12	* Made to use alloc_percpu by Christoph Lameter.
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	13	*
				14	* Copyright (C) 2010 SUSE Linux Products GmbH
				15	* Copyright (C) 2010 Tejun Heo <tj@kernel.org>
				16	*
				17	* This is the generic async execution mechanism. Work items are
				18	* executed in process context. The worker pool is shared and
				19	* automatically managed. There is one worker pool for each CPU and
				20	* one extra for works which are better served by workers which are
				21	* not bound to any specific CPU.
				22	*
				23	* Please read Documentation/workqueue.txt for details.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	24	*/
				25
Paul Gortmaker	9984de1	2011-05-23 14:51:41 -0400	[diff] [blame]	26	#include <linux/export.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	27	#include <linux/kernel.h>
				28	#include <linux/sched.h>
				29	#include <linux/init.h>
				30	#include <linux/signal.h>
				31	#include <linux/completion.h>
				32	#include <linux/workqueue.h>
				33	#include <linux/slab.h>
				34	#include <linux/cpu.h>
				35	#include <linux/notifier.h>
				36	#include <linux/kthread.h>
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	37	#include <linux/hardirq.h>
Christoph Lameter	4693402	2006-10-11 01:21:26 -0700	[diff] [blame]	38	#include <linux/mempolicy.h>
Rafael J. Wysocki	341a595	2006-12-06 20:34:49 -0800	[diff] [blame]	39	#include <linux/freezer.h>
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	40	#include <linux/kallsyms.h>
				41	#include <linux/debug_locks.h>
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	42	#include <linux/lockdep.h>
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	43	#include <linux/idr.h>
Syed Rameez Mustafa	1bee7b9	2013-07-15 11:52:09 -0700	[diff] [blame]	44	#include <linux/bug.h>
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	45
				46	#include "workqueue_sched.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	47
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	48	enum {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	49	/* global_cwq flags */
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	50	GCWQ_DISASSOCIATED = 1 << 0, /* cpu can't serve workers */
				51	GCWQ_FREEZING = 1 << 1, /* freeze in progress */
				52
				53	/* pool flags */
				54	POOL_MANAGE_WORKERS = 1 << 0, /* need to manage workers */
				55	POOL_MANAGING_WORKERS = 1 << 1, /* managing workers */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	56
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	57	/* worker flags */
				58	WORKER_STARTED = 1 << 0, /* started */
				59	WORKER_DIE = 1 << 1, /* die die die */
				60	WORKER_IDLE = 1 << 2, /* is idle */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	61	WORKER_PREP = 1 << 3, /* preparing to run works */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	62	WORKER_ROGUE = 1 << 4, /* not bound to any cpu */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	63	WORKER_REBIND = 1 << 5, /* mom is home, come back */
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	64	WORKER_CPU_INTENSIVE = 1 << 6, /* cpu intensive */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	65	WORKER_UNBOUND = 1 << 7, /* worker is unbound */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	66
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	67	WORKER_NOT_RUNNING = WORKER_PREP | WORKER_ROGUE | WORKER_REBIND |
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	68	WORKER_CPU_INTENSIVE | WORKER_UNBOUND,
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	69
				70	/* gcwq->trustee_state */
				71	TRUSTEE_START = 0, /* start */
				72	TRUSTEE_IN_CHARGE = 1, /* trustee in charge of gcwq */
				73	TRUSTEE_BUTCHER = 2, /* butcher workers */
				74	TRUSTEE_RELEASE = 3, /* release workers */
				75	TRUSTEE_DONE = 4, /* trustee is done */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	76
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	77	NR_WORKER_POOLS = 2, /* # worker pools per gcwq */
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	78
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	79	BUSY_WORKER_HASH_ORDER = 6, /* 64 pointers */
				80	BUSY_WORKER_HASH_SIZE = 1 << BUSY_WORKER_HASH_ORDER,
				81	BUSY_WORKER_HASH_MASK = BUSY_WORKER_HASH_SIZE - 1,
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	82
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	83	MAX_IDLE_WORKERS_RATIO = 4, /* 1/4 of busy can be idle */
				84	IDLE_WORKER_TIMEOUT = 300 * HZ, /* keep idle ones for 5 mins */
				85
Tejun Heo	3233cdb	2011-02-16 18:10:19 +0100	[diff] [blame]	86	MAYDAY_INITIAL_TIMEOUT = HZ / 100 >= 2 ? HZ / 100 : 2,
				87	/* call for help after 10ms
				88	(min two ticks) */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	89	MAYDAY_INTERVAL = HZ / 10, /* and then every 100ms */
				90	CREATE_COOLDOWN = HZ, /* time to breathe after fail */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	91	TRUSTEE_COOLDOWN = HZ / 10, /* for trustee draining */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	92
				93	/*
				94	* Rescue workers are used only on emergencies and shared by
				95	* all cpus. Give -20.
				96	*/
				97	RESCUER_NICE_LEVEL = -20,
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	98	HIGHPRI_NICE_LEVEL = -20,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	99	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	100
				101	/*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	102	* Structure fields follow one of the following exclusion rules.
				103	*
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	104	* I: Modifiable by initialization/destruction paths and read-only for
				105	* everyone else.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	106	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	107	* P: Preemption protected. Disabling preemption is enough and should
				108	* only be modified and accessed from the local cpu.
				109	*
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	110	* L: gcwq->lock protected. Access with gcwq->lock held.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	111	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	112	* X: During normal operation, modification requires gcwq->lock and
				113	* should be done only from local cpu. Either disabling preemption
				114	* on local cpu or grabbing gcwq->lock is enough for read access.
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	115	* If GCWQ_DISASSOCIATED is set, it's identical to L.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	116	*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	117	* F: wq->flush_mutex protected.
				118	*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	119	* W: workqueue_lock protected.
				120	*/
				121
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	122	struct global_cwq;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	123	struct worker_pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	124
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	125	/*
				126	* The poor guys doing the actual heavy lifting. All on-duty workers
				127	* are either serving the manager role, on idle list or on busy hash.
				128	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	129	struct worker {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	130	/* on idle list while idle, on busy hash table while busy */
				131	union {
				132	struct list_head entry; /* L: while idle */
				133	struct hlist_node hentry; /* L: while busy */
				134	};
				135
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	136	struct work_struct *current_work; /* L: work being processed */
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	137	work_func_t current_func; /* L: current_work's fn */
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	138	struct cpu_workqueue_struct *current_cwq; /* L: current_work's cwq */
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	139	struct list_head scheduled; /* L: scheduled works */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	140	struct task_struct *task; /* I: worker task */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	141	struct worker_pool *pool; /* I: the associated pool */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	142	/* 64 bytes boundary on 64bit, 32 on 32bit */
				143	unsigned long last_active; /* L: last active timestamp */
				144	unsigned int flags; /* X: flags */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	145	int id; /* I: worker id */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	146	struct work_struct rebind_work; /* L: rebind worker to cpu */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	147	};
				148
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	149	struct worker_pool {
				150	struct global_cwq *gcwq; /* I: the owning gcwq */
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	151	unsigned int flags; /* X: flags */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	152
				153	struct list_head worklist; /* L: list of pending works */
				154	int nr_workers; /* L: total number of workers */
				155	int nr_idle; /* L: currently idle ones */
				156
				157	struct list_head idle_list; /* X: list of idle workers */
				158	struct timer_list idle_timer; /* L: worker idle timeout */
				159	struct timer_list mayday_timer; /* L: SOS timer for workers */
				160
				161	struct ida worker_ida; /* L: for worker IDs */
				162	struct worker *first_idle; /* L: first idle worker */
				163	};
				164
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	165	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	166	* Global per-cpu workqueue. There's one and only one for each cpu
				167	* and all works are queued and processed here regardless of their
				168	* target workqueues.
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	169	*/
				170	struct global_cwq {
				171	spinlock_t lock; /* the gcwq lock */
				172	unsigned int cpu; /* I: the associated cpu */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	173	unsigned int flags; /* L: GCWQ_* flags */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	174
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	175	/* workers are chained either in busy_hash or pool idle_list */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	176	struct hlist_head busy_hash[BUSY_WORKER_HASH_SIZE];
				177	/* L: hash of busy workers */
				178
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	179	struct worker_pool pools[2]; /* normal and highpri pools */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	180
				181	struct task_struct *trustee; /* L: for gcwq shutdown */
				182	unsigned int trustee_state; /* L: trustee state */
				183	wait_queue_head_t trustee_wait; /* trustee wait */
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	184	} ____cacheline_aligned_in_smp;
				185
				186	/*
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	187	* The per-CPU workqueue. The lower WORK_STRUCT_FLAG_BITS of
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	188	* work_struct->data are used for flags and thus cwqs need to be
				189	* aligned at two's power of the number of flag bits.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	190	*/
				191	struct cpu_workqueue_struct {
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	192	struct worker_pool *pool; /* I: the associated pool */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	193	struct workqueue_struct *wq; /* I: the owning workqueue */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	194	int work_color; /* L: current color */
				195	int flush_color; /* L: flushing color */
				196	int nr_in_flight[WORK_NR_COLORS];
				197	/* L: nr of in_flight works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	198	int nr_active; /* L: nr of active works */
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	199	int max_active; /* L: max active works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	200	struct list_head delayed_works; /* L: delayed works */
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	201	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	202
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	203	/*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	204	* Structure used to wait for workqueue flush.
				205	*/
				206	struct wq_flusher {
				207	struct list_head list; /* F: list of flushers */
				208	int flush_color; /* F: flush color waiting for */
				209	struct completion done; /* flush completion */
				210	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	211
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	212	/*
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	213	* All cpumasks are assumed to be always set on UP and thus can't be
				214	* used to determine whether there's something to be done.
				215	*/
				216	#ifdef CONFIG_SMP
				217	typedef cpumask_var_t mayday_mask_t;
				218	#define mayday_test_and_set_cpu(cpu, mask) \
				219	cpumask_test_and_set_cpu((cpu), (mask))
				220	#define mayday_clear_cpu(cpu, mask) cpumask_clear_cpu((cpu), (mask))
				221	#define for_each_mayday_cpu(cpu, mask) for_each_cpu((cpu), (mask))
Tejun Heo	9c37547	2010-08-31 11:18:34 +0200	[diff] [blame]	222	#define alloc_mayday_mask(maskp, gfp) zalloc_cpumask_var((maskp), (gfp))
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	223	#define free_mayday_mask(mask) free_cpumask_var((mask))
				224	#else
				225	typedef unsigned long mayday_mask_t;
				226	#define mayday_test_and_set_cpu(cpu, mask) test_and_set_bit(0, &(mask))
				227	#define mayday_clear_cpu(cpu, mask) clear_bit(0, &(mask))
				228	#define for_each_mayday_cpu(cpu, mask) if ((cpu) = 0, (mask))
				229	#define alloc_mayday_mask(maskp, gfp) true
				230	#define free_mayday_mask(mask) do { } while (0)
				231	#endif
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	232
				233	/*
				234	* The externally visible workqueue abstraction is an array of
				235	* per-CPU workqueues:
				236	*/
				237	struct workqueue_struct {
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	238	unsigned int flags; /* W: WQ_* flags */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	239	union {
				240	struct cpu_workqueue_struct __percpu *pcpu;
				241	struct cpu_workqueue_struct *single;
				242	unsigned long v;
				243	} cpu_wq; /* I: cwq's */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	244	struct list_head list; /* W: list of all workqueues */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	245
				246	struct mutex flush_mutex; /* protects wq flushing */
				247	int work_color; /* F: current work color */
				248	int flush_color; /* F: current flush color */
				249	atomic_t nr_cwqs_to_flush; /* flush in progress */
				250	struct wq_flusher *first_flusher; /* F: first flusher */
				251	struct list_head flusher_queue; /* F: flush waiters */
				252	struct list_head flusher_overflow; /* F: flush overflow list */
				253
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	254	mayday_mask_t mayday_mask; /* cpus requesting rescue */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	255	struct worker *rescuer; /* I: rescue worker */
				256
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	257	int nr_drainers; /* W: drain in progress */
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	258	int saved_max_active; /* W: saved cwq max_active */
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	259	#ifdef CONFIG_LOCKDEP
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	260	struct lockdep_map lockdep_map;
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	261	#endif
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	262	char name[]; /* I: workqueue name */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	263	};
				264
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	265	struct workqueue_struct *system_wq __read_mostly;
				266	struct workqueue_struct *system_long_wq __read_mostly;
				267	struct workqueue_struct *system_nrt_wq __read_mostly;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	268	struct workqueue_struct *system_unbound_wq __read_mostly;
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	269	struct workqueue_struct *system_freezable_wq __read_mostly;
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	270	struct workqueue_struct *system_nrt_freezable_wq __read_mostly;
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	271	EXPORT_SYMBOL_GPL(system_wq);
				272	EXPORT_SYMBOL_GPL(system_long_wq);
				273	EXPORT_SYMBOL_GPL(system_nrt_wq);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	274	EXPORT_SYMBOL_GPL(system_unbound_wq);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	275	EXPORT_SYMBOL_GPL(system_freezable_wq);
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	276	EXPORT_SYMBOL_GPL(system_nrt_freezable_wq);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	277
Tejun Heo	97bd234	2010-10-05 10:41:14 +0200	[diff] [blame]	278	#define CREATE_TRACE_POINTS
				279	#include <trace/events/workqueue.h>
				280
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	281	#define for_each_worker_pool(pool, gcwq) \
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	282	for ((pool) = &(gcwq)->pools[0]; \
				283	(pool) < &(gcwq)->pools[NR_WORKER_POOLS]; (pool)++)
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	284
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	285	#define for_each_busy_worker(worker, i, pos, gcwq) \
				286	for (i = 0; i < BUSY_WORKER_HASH_SIZE; i++) \
				287	hlist_for_each_entry(worker, pos, &gcwq->busy_hash[i], hentry)
				288
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	289	static inline int __next_gcwq_cpu(int cpu, const struct cpumask *mask,
				290	unsigned int sw)
				291	{
				292	if (cpu < nr_cpu_ids) {
				293	if (sw & 1) {
				294	cpu = cpumask_next(cpu, mask);
				295	if (cpu < nr_cpu_ids)
				296	return cpu;
				297	}
				298	if (sw & 2)
				299	return WORK_CPU_UNBOUND;
				300	}
				301	return WORK_CPU_NONE;
				302	}
				303
				304	static inline int __next_wq_cpu(int cpu, const struct cpumask *mask,
				305	struct workqueue_struct *wq)
				306	{
				307	return __next_gcwq_cpu(cpu, mask, !(wq->flags & WQ_UNBOUND) ? 1 : 2);
				308	}
				309
Tejun Heo	0988495	2010-08-01 11:50:12 +0200	[diff] [blame]	310	/*
				311	* CPU iterators
				312	*
				313	* An extra gcwq is defined for an invalid cpu number
				314	* (WORK_CPU_UNBOUND) to host workqueues which are not bound to any
				315	* specific CPU. The following iterators are similar to
				316	* for_each_*_cpu() iterators but also considers the unbound gcwq.
				317	*
				318	* for_each_gcwq_cpu() : possible CPUs + WORK_CPU_UNBOUND
				319	* for_each_online_gcwq_cpu() : online CPUs + WORK_CPU_UNBOUND
				320	* for_each_cwq_cpu() : possible CPUs for bound workqueues,
				321	* WORK_CPU_UNBOUND for unbound workqueues
				322	*/
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	323	#define for_each_gcwq_cpu(cpu) \
				324	for ((cpu) = __next_gcwq_cpu(-1, cpu_possible_mask, 3); \
				325	(cpu) < WORK_CPU_NONE; \
				326	(cpu) = __next_gcwq_cpu((cpu), cpu_possible_mask, 3))
				327
				328	#define for_each_online_gcwq_cpu(cpu) \
				329	for ((cpu) = __next_gcwq_cpu(-1, cpu_online_mask, 3); \
				330	(cpu) < WORK_CPU_NONE; \
				331	(cpu) = __next_gcwq_cpu((cpu), cpu_online_mask, 3))
				332
				333	#define for_each_cwq_cpu(cpu, wq) \
				334	for ((cpu) = __next_wq_cpu(-1, cpu_possible_mask, (wq)); \
				335	(cpu) < WORK_CPU_NONE; \
				336	(cpu) = __next_wq_cpu((cpu), cpu_possible_mask, (wq)))
				337
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	338	#ifdef CONFIG_DEBUG_OBJECTS_WORK
				339
				340	static struct debug_obj_descr work_debug_descr;
				341
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	342	static void *work_debug_hint(void *addr)
				343	{
				344	return ((struct work_struct *) addr)->func;
				345	}
				346
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	347	/*
				348	* fixup_init is called when:
				349	* - an active object is initialized
				350	*/
				351	static int work_fixup_init(void *addr, enum debug_obj_state state)
				352	{
				353	struct work_struct *work = addr;
				354
				355	switch (state) {
				356	case ODEBUG_STATE_ACTIVE:
				357	cancel_work_sync(work);
				358	debug_object_init(work, &work_debug_descr);
				359	return 1;
				360	default:
				361	return 0;
				362	}
				363	}
				364
				365	/*
				366	* fixup_activate is called when:
				367	* - an active object is activated
				368	* - an unknown object is activated (might be a statically initialized object)
				369	*/
				370	static int work_fixup_activate(void *addr, enum debug_obj_state state)
				371	{
				372	struct work_struct *work = addr;
				373
				374	switch (state) {
				375
				376	case ODEBUG_STATE_NOTAVAILABLE:
				377	/*
				378	* This is not really a fixup. The work struct was
				379	* statically initialized. We just make sure that it
				380	* is tracked in the object tracker.
				381	*/
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	382	if (test_bit(WORK_STRUCT_STATIC_BIT, work_data_bits(work))) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	383	debug_object_init(work, &work_debug_descr);
				384	debug_object_activate(work, &work_debug_descr);
				385	return 0;
				386	}
				387	WARN_ON_ONCE(1);
				388	return 0;
				389
				390	case ODEBUG_STATE_ACTIVE:
				391	WARN_ON(1);
				392
				393	default:
				394	return 0;
				395	}
				396	}
				397
				398	/*
				399	* fixup_free is called when:
				400	* - an active object is freed
				401	*/
				402	static int work_fixup_free(void *addr, enum debug_obj_state state)
				403	{
				404	struct work_struct *work = addr;
				405
				406	switch (state) {
				407	case ODEBUG_STATE_ACTIVE:
				408	cancel_work_sync(work);
				409	debug_object_free(work, &work_debug_descr);
				410	return 1;
				411	default:
				412	return 0;
				413	}
				414	}
				415
				416	static struct debug_obj_descr work_debug_descr = {
				417	.name = "work_struct",
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	418	.debug_hint = work_debug_hint,
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	419	.fixup_init = work_fixup_init,
				420	.fixup_activate = work_fixup_activate,
				421	.fixup_free = work_fixup_free,
				422	};
				423
				424	static inline void debug_work_activate(struct work_struct *work)
				425	{
				426	debug_object_activate(work, &work_debug_descr);
				427	}
				428
				429	static inline void debug_work_deactivate(struct work_struct *work)
				430	{
				431	debug_object_deactivate(work, &work_debug_descr);
				432	}
				433
				434	void __init_work(struct work_struct *work, int onstack)
				435	{
				436	if (onstack)
				437	debug_object_init_on_stack(work, &work_debug_descr);
				438	else
				439	debug_object_init(work, &work_debug_descr);
				440	}
				441	EXPORT_SYMBOL_GPL(__init_work);
				442
				443	void destroy_work_on_stack(struct work_struct *work)
				444	{
				445	debug_object_free(work, &work_debug_descr);
				446	}
				447	EXPORT_SYMBOL_GPL(destroy_work_on_stack);
				448
				449	#else
				450	static inline void debug_work_activate(struct work_struct *work) { }
				451	static inline void debug_work_deactivate(struct work_struct *work) { }
				452	#endif
				453
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	454	/* Serializes the accesses to the list of workqueues. */
				455	static DEFINE_SPINLOCK(workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	456	static LIST_HEAD(workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	457	static bool workqueue_freezing; /* W: have wqs started freezing? */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	458
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	459	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	460	* The almighty global cpu workqueues. nr_running is the only field
				461	* which is expected to be used frequently by other cpus via
				462	* try_to_wake_up(). Put it in a separate cacheline.
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	463	*/
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	464	static DEFINE_PER_CPU(struct global_cwq, global_cwq);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	465	static DEFINE_PER_CPU_SHARED_ALIGNED(atomic_t, pool_nr_running[NR_WORKER_POOLS]);
Nathan Lynch	f756d5e	2006-01-08 01:05:12 -0800	[diff] [blame]	466
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	467	/*
				468	* Global cpu workqueue and nr_running counter for unbound gcwq. The
				469	* gcwq is always online, has GCWQ_DISASSOCIATED set, and all its
				470	* workers have WORKER_UNBOUND set.
				471	*/
				472	static struct global_cwq unbound_global_cwq;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	473	static atomic_t unbound_pool_nr_running[NR_WORKER_POOLS] = {
				474	[0 ... NR_WORKER_POOLS - 1] = ATOMIC_INIT(0), /* always 0 */
				475	};
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	476
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	477	static int worker_thread(void *__worker);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	478
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	479	static int worker_pool_pri(struct worker_pool *pool)
				480	{
				481	return pool - pool->gcwq->pools;
				482	}
				483
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	484	static struct global_cwq *get_gcwq(unsigned int cpu)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	485	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	486	if (cpu != WORK_CPU_UNBOUND)
				487	return &per_cpu(global_cwq, cpu);
				488	else
				489	return &unbound_global_cwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	490	}
				491
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	492	static atomic_t *get_pool_nr_running(struct worker_pool *pool)
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	493	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	494	int cpu = pool->gcwq->cpu;
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	495	int idx = worker_pool_pri(pool);
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	496
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	497	if (cpu != WORK_CPU_UNBOUND)
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	498	return &per_cpu(pool_nr_running, cpu)[idx];
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	499	else
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	500	return &unbound_pool_nr_running[idx];
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	501	}
				502
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	503	static struct cpu_workqueue_struct *get_cwq(unsigned int cpu,
				504	struct workqueue_struct *wq)
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	505	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	506	if (!(wq->flags & WQ_UNBOUND)) {
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	507	if (likely(cpu < nr_cpu_ids))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	508	return per_cpu_ptr(wq->cpu_wq.pcpu, cpu);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	509	} else if (likely(cpu == WORK_CPU_UNBOUND))
				510	return wq->cpu_wq.single;
				511	return NULL;
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	512	}
				513
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	514	static unsigned int work_color_to_flags(int color)
				515	{
				516	return color << WORK_STRUCT_COLOR_SHIFT;
				517	}
				518
				519	static int get_work_color(struct work_struct *work)
				520	{
				521	return (*work_data_bits(work) >> WORK_STRUCT_COLOR_SHIFT) &
				522	((1 << WORK_STRUCT_COLOR_BITS) - 1);
				523	}
				524
				525	static int work_next_color(int color)
				526	{
				527	return (color + 1) % WORK_NR_COLORS;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	528	}
				529
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	530	/*
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	531	* A work's data points to the cwq with WORK_STRUCT_CWQ set while the
				532	* work is on queue. Once execution starts, WORK_STRUCT_CWQ is
				533	* cleared and the work data contains the cpu number it was last on.
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	534	*
				535	* set_work_{cwq|cpu}() and clear_work_data() can be used to set the
				536	* cwq, cpu or clear work->data. These functions should only be
				537	* called while the work is owned - ie. while the PENDING bit is set.
				538	*
				539	* get_work_[g]cwq() can be used to obtain the gcwq or cwq
				540	* corresponding to a work. gcwq is available once the work has been
				541	* queued anywhere after initialization. cwq is available only from
				542	* queueing until execution starts.
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	543	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	544	static inline void set_work_data(struct work_struct *work, unsigned long data,
				545	unsigned long flags)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	546	{
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	547	BUG_ON(!work_pending(work));
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	548	atomic_long_set(&work->data, data | flags | work_static(work));
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	549	}
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	550
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	551	static void set_work_cwq(struct work_struct *work,
				552	struct cpu_workqueue_struct *cwq,
				553	unsigned long extra_flags)
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	554	{
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	555	set_work_data(work, (unsigned long)cwq,
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	556	WORK_STRUCT_PENDING | WORK_STRUCT_CWQ | extra_flags);
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	557	}
				558
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	559	static void set_work_cpu(struct work_struct *work, unsigned int cpu)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	560	{
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	561	set_work_data(work, cpu << WORK_STRUCT_FLAG_BITS, WORK_STRUCT_PENDING);
				562	}
				563
				564	static void clear_work_data(struct work_struct *work)
				565	{
				566	set_work_data(work, WORK_STRUCT_NO_CPU, 0);
				567	}
				568
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	569	static struct cpu_workqueue_struct get_work_cwq(struct work_struct work)
				570	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	571	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	572
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	573	if (data & WORK_STRUCT_CWQ)
				574	return (void *)(data & WORK_STRUCT_WQ_DATA_MASK);
				575	else
Srinivasarao P	b6e586c	2013-09-18 14:33:45 +0530	[diff] [blame]	576	{
				577	WARN_ON_ONCE(1);
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	578	return NULL;
Srinivasarao P	b6e586c	2013-09-18 14:33:45 +0530	[diff] [blame]	579	}
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	580	}
				581
				582	static struct global_cwq get_work_gcwq(struct work_struct work)
				583	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	584	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	585	unsigned int cpu;
				586
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	587	if (data & WORK_STRUCT_CWQ)
				588	return ((struct cpu_workqueue_struct *)
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	589	(data & WORK_STRUCT_WQ_DATA_MASK))->pool->gcwq;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	590
				591	cpu = data >> WORK_STRUCT_FLAG_BITS;
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	592	if (cpu == WORK_CPU_NONE)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	593	return NULL;
				594
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	595	BUG_ON(cpu >= nr_cpu_ids && cpu != WORK_CPU_UNBOUND);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	596	return get_gcwq(cpu);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	597	}
				598
				599	/*
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	600	* Policy functions. These define the policies on how the global worker
				601	* pools are managed. Unless noted otherwise, these functions assume that
				602	* they're being called with gcwq->lock held.
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	603	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	604
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	605	static bool __need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	606	{
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	607	return !atomic_read(get_pool_nr_running(pool));
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	608	}
				609
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	610	/*
				611	* Need to wake up a worker? Called from anything but currently
				612	* running workers.
Tejun Heo	b7b5c68	2012-07-12 14:46:37 -0700	[diff] [blame]	613	*
				614	* Note that, because unbound workers never contribute to nr_running, this
				615	* function will always return %true for unbound gcwq as long as the
				616	* worklist isn't empty.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	617	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	618	static bool need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	619	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	620	return !list_empty(&pool->worklist) && __need_more_worker(pool);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	621	}
				622
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	623	/* Can I start working? Called from busy but !running workers. */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	624	static bool may_start_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	625	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	626	return pool->nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	627	}
				628
				629	/* Do I need to keep working? Called from currently running workers. */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	630	static bool keep_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	631	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	632	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	633
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	634	return !list_empty(&pool->worklist) && atomic_read(nr_running) <= 1;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	635	}
				636
				637	/* Do we need a new worker? Called from manager. */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	638	static bool need_to_create_worker(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	639	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	640	return need_more_worker(pool) && !may_start_working(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	641	}
				642
				643	/* Do I need to be the manager? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	644	static bool need_to_manage_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	645	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	646	return need_to_create_worker(pool) \|\|
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	647	(pool->flags & POOL_MANAGE_WORKERS);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	648	}
				649
				650	/* Do we have too many workers and should some go away? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	651	static bool too_many_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	652	{
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	653	bool managing = pool->flags & POOL_MANAGING_WORKERS;
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	654	int nr_idle = pool->nr_idle + managing; /* manager is considered idle */
				655	int nr_busy = pool->nr_workers - nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	656
				657	return nr_idle > 2 && (nr_idle - 2) * MAX_IDLE_WORKERS_RATIO >= nr_busy;
				658	}
				659
				660	/*
				661	* Wake up functions.
				662	*/
				663
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	664	/* Return the first worker. Safe with preemption disabled */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	665	static struct worker first_worker(struct worker_pool pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	666	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	667	if (unlikely(list_empty(&pool->idle_list)))
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	668	return NULL;
				669
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	670	return list_first_entry(&pool->idle_list, struct worker, entry);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	671	}
				672
				673	/**
				674	* wake_up_worker - wake up an idle worker
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	675	* @pool: worker pool to wake worker from
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	676	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	677	* Wake up the first idle worker of @pool.
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	678	*
				679	* CONTEXT:
				680	* spin_lock_irq(gcwq->lock).
				681	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	682	static void wake_up_worker(struct worker_pool *pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	683	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	684	struct worker *worker = first_worker(pool);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	685
				686	if (likely(worker))
				687	wake_up_process(worker->task);
				688	}
				689
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	690	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	691	* wq_worker_waking_up - a worker is waking up
				692	* @task: task waking up
				693	* @cpu: CPU @task is waking up to
				694	*
				695	* This function is called during try_to_wake_up() when a worker is
				696	* being awoken.
				697	*
				698	* CONTEXT:
				699	* spin_lock_irq(rq->lock)
				700	*/
				701	void wq_worker_waking_up(struct task_struct *task, unsigned int cpu)
				702	{
				703	struct worker *worker = kthread_data(task);
				704
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	705	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	706	atomic_inc(get_pool_nr_running(worker->pool));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	707	}
				708
				709	/**
				710	* wq_worker_sleeping - a worker is going to sleep
				711	* @task: task going to sleep
				712	* @cpu: CPU in question, must be the current CPU number
				713	*
				714	* This function is called during schedule() when a busy worker is
				715	* going to sleep. Worker on the same cpu can be woken up by
				716	* returning pointer to its task.
				717	*
				718	* CONTEXT:
				719	* spin_lock_irq(rq->lock)
				720	*
				721	* RETURNS:
				722	* Worker task on @cpu to wake up, %NULL if none.
				723	*/
				724	struct task_struct wq_worker_sleeping(struct task_struct task,
				725	unsigned int cpu)
				726	{
				727	struct worker worker = kthread_data(task), to_wakeup = NULL;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	728	struct worker_pool *pool = worker->pool;
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	729	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	730
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	731	if (worker->flags & WORKER_NOT_RUNNING)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	732	return NULL;
				733
				734	/* this can only happen on the local cpu */
				735	BUG_ON(cpu != raw_smp_processor_id());
				736
				737	/*
				738	* The counterpart of the following dec_and_test, implied mb,
				739	* worklist not empty test sequence is in insert_work().
				740	* Please read comment there.
				741	*
				742	* NOT_RUNNING is clear. This means that trustee is not in
				743	* charge and we're running on the local cpu w/ rq lock held
				744	* and preemption disabled, which in turn means that none else
				745	* could be manipulating idle_list, so dereferencing idle_list
				746	* without gcwq lock is safe.
				747	*/
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	748	if (atomic_dec_and_test(nr_running) && !list_empty(&pool->worklist))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	749	to_wakeup = first_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	750	return to_wakeup ? to_wakeup->task : NULL;
				751	}
				752
				753	/**
				754	* worker_set_flags - set worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	755	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	756	* @flags: flags to set
				757	* @wakeup: wakeup an idle worker if necessary
				758	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	759	* Set @flags in @worker->flags and adjust nr_running accordingly. If
				760	* nr_running becomes zero and @wakeup is %true, an idle worker is
				761	* woken up.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	762	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	763	* CONTEXT:
				764	* spin_lock_irq(gcwq->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	765	*/
				766	static inline void worker_set_flags(struct worker *worker, unsigned int flags,
				767	bool wakeup)
				768	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	769	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	770
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	771	WARN_ON_ONCE(worker->task != current);
				772
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	773	/*
				774	* If transitioning into NOT_RUNNING, adjust nr_running and
				775	* wake up an idle worker as necessary if requested by
				776	* @wakeup.
				777	*/
				778	if ((flags & WORKER_NOT_RUNNING) &&
				779	!(worker->flags & WORKER_NOT_RUNNING)) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	780	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	781
				782	if (wakeup) {
				783	if (atomic_dec_and_test(nr_running) &&
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	784	!list_empty(&pool->worklist))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	785	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	786	} else
				787	atomic_dec(nr_running);
				788	}
				789
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	790	worker->flags \|= flags;
				791	}
				792
				793	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	794	* worker_clr_flags - clear worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	795	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	796	* @flags: flags to clear
				797	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	798	* Clear @flags in @worker->flags and adjust nr_running accordingly.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	799	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	800	* CONTEXT:
				801	* spin_lock_irq(gcwq->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	802	*/
				803	static inline void worker_clr_flags(struct worker *worker, unsigned int flags)
				804	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	805	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	806	unsigned int oflags = worker->flags;
				807
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	808	WARN_ON_ONCE(worker->task != current);
				809
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	810	worker->flags &= ~flags;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	811
Tejun Heo	42c025f	2011-01-11 15:58:49 +0100	[diff] [blame]	812	/*
				813	* If transitioning out of NOT_RUNNING, increment nr_running. Note
				814	* that the nested NOT_RUNNING is not a noop. NOT_RUNNING is mask
				815	* of multiple flags, not a single flag.
				816	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	817	if ((flags & WORKER_NOT_RUNNING) && (oflags & WORKER_NOT_RUNNING))
				818	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	819	atomic_inc(get_pool_nr_running(pool));
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	820	}
				821
				822	/**
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	823	* busy_worker_head - return the busy hash head for a work
				824	* @gcwq: gcwq of interest
				825	* @work: work to be hashed
				826	*
				827	* Return hash head of @gcwq for @work.
				828	*
				829	* CONTEXT:
				830	* spin_lock_irq(gcwq->lock).
				831	*
				832	* RETURNS:
				833	* Pointer to the hash head.
				834	*/
				835	static struct hlist_head busy_worker_head(struct global_cwq gcwq,
				836	struct work_struct *work)
				837	{
				838	const int base_shift = ilog2(sizeof(struct work_struct));
				839	unsigned long v = (unsigned long)work;
				840
				841	/* simple shift and fold hash, do we need something better? */
				842	v >>= base_shift;
				843	v += v >> BUSY_WORKER_HASH_ORDER;
				844	v &= BUSY_WORKER_HASH_MASK;
				845
				846	return &gcwq->busy_hash[v];
				847	}
				848
				849	/**
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	850	* __find_worker_executing_work - find worker which is executing a work
				851	* @gcwq: gcwq of interest
				852	* @bwh: hash head as returned by busy_worker_head()
				853	* @work: work to find worker for
				854	*
				855	* Find a worker which is executing @work on @gcwq. @bwh should be
				856	* the hash head obtained by calling busy_worker_head() with the same
				857	* work.
				858	*
				859	* CONTEXT:
				860	* spin_lock_irq(gcwq->lock).
				861	*
				862	* RETURNS:
				863	* Pointer to worker which is executing @work if found, NULL
				864	* otherwise.
				865	*/
				866	static struct worker __find_worker_executing_work(struct global_cwq gcwq,
				867	struct hlist_head *bwh,
				868	struct work_struct *work)
				869	{
				870	struct worker *worker;
				871	struct hlist_node *tmp;
				872
				873	hlist_for_each_entry(worker, tmp, bwh, hentry)
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	874	if (worker->current_work == work &&
				875	worker->current_func == work->func)
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	876	return worker;
				877	return NULL;
				878	}
				879
				880	/**
				881	* find_worker_executing_work - find worker which is executing a work
				882	* @gcwq: gcwq of interest
				883	* @work: work to find worker for
				884	*
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	885	* Find a worker which is executing @work on @gcwq by searching
				886	* @gcwq->busy_hash which is keyed by the address of @work. For a worker
				887	* to match, its current execution should match the address of @work and
				888	* its work function. This is to avoid unwanted dependency between
				889	* unrelated work executions through a work item being recycled while still
				890	* being executed.
				891	*
				892	* This is a bit tricky. A work item may be freed once its execution
				893	* starts and nothing prevents the freed area from being recycled for
				894	* another work item. If the same work item address ends up being reused
				895	* before the original execution finishes, workqueue will identify the
				896	* recycled work item as currently executing and make it wait until the
				897	* current execution finishes, introducing an unwanted dependency.
				898	*
				899	* This function checks the work item address, work function and workqueue
				900	* to avoid false positives. Note that this isn't complete as one may
				901	* construct a work function which can introduce dependency onto itself
				902	* through a recycled work item. Well, if somebody wants to shoot oneself
				903	* in the foot that badly, there's only so much we can do, and if such
				904	* deadlock actually occurs, it should be easy to locate the culprit work
				905	* function.
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	906	*
				907	* CONTEXT:
				908	* spin_lock_irq(gcwq->lock).
				909	*
				910	* RETURNS:
				911	* Pointer to worker which is executing @work if found, NULL
				912	* otherwise.
				913	*/
				914	static struct worker find_worker_executing_work(struct global_cwq gcwq,
				915	struct work_struct *work)
				916	{
				917	return __find_worker_executing_work(gcwq, busy_worker_head(gcwq, work),
				918	work);
				919	}
				920
				921	/**
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	922	* insert_work - insert a work into gcwq
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	923	* @cwq: cwq @work belongs to
				924	* @work: work to insert
				925	* @head: insertion point
				926	* @extra_flags: extra WORK_STRUCT_* flags to set
				927	*
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	928	* Insert @work which belongs to @cwq into @gcwq after @head.
				929	* @extra_flags is or'd to work_struct flags.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	930	*
				931	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	932	* spin_lock_irq(gcwq->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	933	*/
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	934	static void insert_work(struct cpu_workqueue_struct *cwq,
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	935	struct work_struct work, struct list_head head,
				936	unsigned int extra_flags)
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	937	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	938	struct worker_pool *pool = cwq->pool;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	939
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	940	/* we own @work, set data and link */
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	941	set_work_cwq(work, cwq, extra_flags);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	942
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	943	/*
				944	* Ensure that we get the right work->data if we see the
				945	* result of list_add() below, see try_to_grab_pending().
				946	*/
				947	smp_wmb();
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	948
Oleg Nesterov	1a4d9b0	2008-07-25 01:47:47 -0700	[diff] [blame]	949	list_add_tail(&work->entry, head);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	950
				951	/*
				952	* Ensure either worker_sched_deactivated() sees the above
				953	* list_add_tail() or we see zero nr_running to avoid workers
				954	* lying around lazily while there are works to be processed.
				955	*/
				956	smp_mb();
				957
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	958	if (__need_more_worker(pool))
				959	wake_up_worker(pool);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	960	}
				961
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	962	/*
				963	* Test whether @work is being queued from another work executing on the
				964	* same workqueue. This is rather expensive and should only be used from
				965	* cold paths.
				966	*/
				967	static bool is_chained_work(struct workqueue_struct *wq)
				968	{
				969	unsigned long flags;
				970	unsigned int cpu;
				971
				972	for_each_gcwq_cpu(cpu) {
				973	struct global_cwq *gcwq = get_gcwq(cpu);
				974	struct worker *worker;
				975	struct hlist_node *pos;
				976	int i;
				977
				978	spin_lock_irqsave(&gcwq->lock, flags);
				979	for_each_busy_worker(worker, i, pos, gcwq) {
				980	if (worker->task != current)
				981	continue;
				982	spin_unlock_irqrestore(&gcwq->lock, flags);
				983	/*
				984	* I'm @worker, no locking necessary. See if @work
				985	* is headed to the same workqueue.
				986	*/
				987	return worker->current_cwq->wq == wq;
				988	}
				989	spin_unlock_irqrestore(&gcwq->lock, flags);
				990	}
				991	return false;
				992	}
				993
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	994	static void __queue_work(unsigned int cpu, struct workqueue_struct *wq,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	995	struct work_struct *work)
				996	{
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	997	struct global_cwq *gcwq;
				998	struct cpu_workqueue_struct *cwq;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	999	struct list_head *worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1000	unsigned int work_flags;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1001	unsigned long flags;
				1002
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	1003	debug_work_activate(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1004
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1005	/* if dying, only works from the same workqueue are allowed */
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	1006	if (unlikely(wq->flags & WQ_DRAINING) &&
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1007	WARN_ON_ONCE(!is_chained_work(wq)))
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	1008	return;
				1009
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1010	/* determine gcwq to use */
				1011	if (!(wq->flags & WQ_UNBOUND)) {
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1012	struct global_cwq *last_gcwq;
				1013
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1014	if (unlikely(cpu == WORK_CPU_UNBOUND))
				1015	cpu = raw_smp_processor_id();
				1016
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1017	/*
				1018	* It's multi cpu. If @wq is non-reentrant and @work
				1019	* was previously on a different cpu, it might still
				1020	* be running there, in which case the work needs to
				1021	* be queued on that cpu to guarantee non-reentrance.
				1022	*/
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1023	gcwq = get_gcwq(cpu);
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1024	if (wq->flags & WQ_NON_REENTRANT &&
				1025	(last_gcwq = get_work_gcwq(work)) && last_gcwq != gcwq) {
				1026	struct worker *worker;
				1027
				1028	spin_lock_irqsave(&last_gcwq->lock, flags);
				1029
				1030	worker = find_worker_executing_work(last_gcwq, work);
				1031
				1032	if (worker && worker->current_cwq->wq == wq)
				1033	gcwq = last_gcwq;
				1034	else {
				1035	/* meh... not running there, queue here */
				1036	spin_unlock_irqrestore(&last_gcwq->lock, flags);
				1037	spin_lock_irqsave(&gcwq->lock, flags);
				1038	}
				1039	} else
				1040	spin_lock_irqsave(&gcwq->lock, flags);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1041	} else {
				1042	gcwq = get_gcwq(WORK_CPU_UNBOUND);
				1043	spin_lock_irqsave(&gcwq->lock, flags);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1044	}
				1045
				1046	/* gcwq determined, get cwq and queue */
				1047	cwq = get_cwq(gcwq->cpu, wq);
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1048	trace_workqueue_queue_work(cpu, cwq, work);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1049
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1050	BUG_ON(!list_empty(&work->entry));
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1051
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1052	cwq->nr_in_flight[cwq->work_color]++;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1053	work_flags = work_color_to_flags(cwq->work_color);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1054
				1055	if (likely(cwq->nr_active < cwq->max_active)) {
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1056	trace_workqueue_activate_work(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1057	cwq->nr_active++;
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1058	worklist = &cwq->pool->worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1059	} else {
				1060	work_flags \|= WORK_STRUCT_DELAYED;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1061	worklist = &cwq->delayed_works;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1062	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1063
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1064	insert_work(cwq, work, worklist, work_flags);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1065
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1066	spin_unlock_irqrestore(&gcwq->lock, flags);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1067	}
				1068
/**
 * queue_work - queue work on a workqueue
 * @wq: workqueue to use
 * @work: work to queue
 *
 * Returns 0 if @work was already on a queue, non-zero otherwise.
 *
 * We queue the work to the CPU on which it was submitted, but if the CPU dies
 * it can be processed by another CPU.
 */
int queue_work(struct workqueue_struct *wq, struct work_struct *work)
{
	int ret;

	/* get_cpu()/put_cpu() bracket the call that queues on this cpu */
	ret = queue_work_on(get_cpu(), wq, work);
	put_cpu();

	return ret;
}
EXPORT_SYMBOL_GPL(queue_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1089
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1090	/**
				1091	* queue_work_on - queue work on specific cpu
				1092	* @cpu: CPU number to execute work on
				1093	* @wq: workqueue to use
				1094	* @work: work to queue
				1095	*
				1096	* Returns 0 if @work was already on a queue, non-zero otherwise.
				1097	*
				1098	* We queue the work to a specific CPU, the caller must ensure it
				1099	* can't go away.
				1100	*/
				1101	int
				1102	queue_work_on(int cpu, struct workqueue_struct wq, struct work_struct work)
				1103	{
				1104	int ret = 0;
				1105
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1106	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1107	__queue_work(cpu, wq, work);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1108	ret = 1;
				1109	}
				1110	return ret;
				1111	}
				1112	EXPORT_SYMBOL_GPL(queue_work_on);
				1113
Li Zefan	6d141c3	2008-02-08 04:21:09 -0800	[diff] [blame]	1114	static void delayed_work_timer_fn(unsigned long __data)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1115	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1116	struct delayed_work dwork = (struct delayed_work )__data;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1117	struct cpu_workqueue_struct *cwq = get_work_cwq(&dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1118
Srinivasarao P	b6e586c	2013-09-18 14:33:45 +0530	[diff] [blame]	1119	if (cwq != NULL)
				1120	__queue_work(smp_processor_id(), cwq->wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1121	}
				1122
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1123	/**
				1124	* queue_delayed_work - queue work on a workqueue after delay
				1125	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1126	* @dwork: delayable work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1127	* @delay: number of jiffies to wait before queueing
				1128	*
Alan Stern	057647f	2006-10-28 10:38:58 -0700	[diff] [blame]	1129	* Returns 0 if @work was already on a queue, non-zero otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1130	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	1131	int queue_delayed_work(struct workqueue_struct *wq,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1132	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1133	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1134	if (delay == 0)
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1135	return queue_work(wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1136
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1137	return queue_delayed_work_on(-1, wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1138	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1139	EXPORT_SYMBOL_GPL(queue_delayed_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1140
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1141	/**
				1142	* queue_delayed_work_on - queue work on specific CPU after delay
				1143	* @cpu: CPU number to execute work on
				1144	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1145	* @dwork: work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1146	* @delay: number of jiffies to wait before queueing
				1147	*
Alan Stern	057647f	2006-10-28 10:38:58 -0700	[diff] [blame]	1148	* Returns 0 if @work was already on a queue, non-zero otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1149	*/
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1150	int queue_delayed_work_on(int cpu, struct workqueue_struct *wq,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1151	struct delayed_work *dwork, unsigned long delay)
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1152	{
				1153	int ret = 0;
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1154	struct timer_list *timer = &dwork->timer;
				1155	struct work_struct *work = &dwork->work;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1156
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1157	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1158	unsigned int lcpu;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1159
Tejun Heo	4afca92	2012-12-04 07:40:39 -0800	[diff] [blame]	1160	WARN_ON_ONCE(timer_pending(timer));
				1161	WARN_ON_ONCE(!list_empty(&work->entry));
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1162
Andrew Liu	8a3e77c	2008-05-01 04:35:14 -0700	[diff] [blame]	1163	timer_stats_timer_set_start_info(&dwork->timer);
				1164
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1165	/*
				1166	* This stores cwq for the moment, for the timer_fn.
				1167	* Note that the work's gcwq is preserved to allow
				1168	* reentrance detection for delayed works.
				1169	*/
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1170	if (!(wq->flags & WQ_UNBOUND)) {
				1171	struct global_cwq *gcwq = get_work_gcwq(work);
				1172
				1173	if (gcwq && gcwq->cpu != WORK_CPU_UNBOUND)
				1174	lcpu = gcwq->cpu;
				1175	else
				1176	lcpu = raw_smp_processor_id();
				1177	} else
				1178	lcpu = WORK_CPU_UNBOUND;
				1179
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1180	set_work_cwq(work, get_cwq(lcpu, wq), 0);
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1181
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1182	timer->expires = jiffies + delay;
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1183	timer->data = (unsigned long)dwork;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1184	timer->function = delayed_work_timer_fn;
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1185
				1186	if (unlikely(cpu >= 0))
				1187	add_timer_on(timer, cpu);
				1188	else
				1189	add_timer(timer);
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1190	ret = 1;
				1191	}
				1192	return ret;
				1193	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1194	EXPORT_SYMBOL_GPL(queue_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1195
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1196	/**
				1197	* worker_enter_idle - enter idle state
				1198	* @worker: worker which is entering idle state
				1199	*
				1200	* @worker is entering idle state. Update stats and idle timer if
				1201	* necessary.
				1202	*
				1203	* LOCKING:
				1204	* spin_lock_irq(gcwq->lock).
				1205	*/
				1206	static void worker_enter_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1207	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1208	struct worker_pool *pool = worker->pool;
				1209	struct global_cwq *gcwq = pool->gcwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1210
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1211	BUG_ON(worker->flags & WORKER_IDLE);
				1212	BUG_ON(!list_empty(&worker->entry) &&
				1213	(worker->hentry.next \|\| worker->hentry.pprev));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1214
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1215	/* can't use worker_set_flags(), also called from start_worker() */
				1216	worker->flags \|= WORKER_IDLE;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1217	pool->nr_idle++;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1218	worker->last_active = jiffies;
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	1219
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1220	/* idle_list is LIFO */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1221	list_add(&worker->entry, &pool->idle_list);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1222
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1223	if (likely(!(worker->flags & WORKER_ROGUE))) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1224	if (too_many_workers(pool) && !timer_pending(&pool->idle_timer))
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1225	mod_timer(&pool->idle_timer,
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1226	jiffies + IDLE_WORKER_TIMEOUT);
				1227	} else
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1228	wake_up_all(&gcwq->trustee_wait);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1229
Tejun Heo	24312d3	2012-05-14 15:04:50 -0700	[diff] [blame]	1230	/*
				1231	* Sanity check nr_running. Because trustee releases gcwq->lock
				1232	* between setting %WORKER_ROGUE and zapping nr_running, the
				1233	* warning may trigger spuriously. Check iff trustee is idle.
				1234	*/
				1235	WARN_ON_ONCE(gcwq->trustee_state == TRUSTEE_DONE &&
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1236	pool->nr_workers == pool->nr_idle &&
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1237	atomic_read(get_pool_nr_running(pool)));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1238	}
				1239
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1240	/**
				1241	* worker_leave_idle - leave idle state
				1242	* @worker: worker which is leaving idle state
				1243	*
				1244	* @worker is leaving idle state. Update stats.
				1245	*
				1246	* LOCKING:
				1247	* spin_lock_irq(gcwq->lock).
				1248	*/
				1249	static void worker_leave_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1250	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1251	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1252
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1253	BUG_ON(!(worker->flags & WORKER_IDLE));
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	1254	worker_clr_flags(worker, WORKER_IDLE);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1255	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1256	list_del_init(&worker->entry);
				1257	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1258
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1259	/**
				1260	* worker_maybe_bind_and_lock - bind worker to its cpu if possible and lock gcwq
				1261	* @worker: self
				1262	*
				1263	* Works which are scheduled while the cpu is online must at least be
				1264	* scheduled to a worker which is bound to the cpu so that if they are
				1265	* flushed from cpu callbacks while cpu is going down, they are
				1266	* guaranteed to execute on the cpu.
				1267	*
				1268	* This function is to be used by rogue workers and rescuers to bind
				1269	* themselves to the target cpu and may race with cpu going down or
				1270	* coming online. kthread_bind() can't be used because it may put the
				1271	* worker to already dead cpu and set_cpus_allowed_ptr() can't be used
				1272	* verbatim as it's best effort and blocking and gcwq may be
				1273	* [dis]associated in the meantime.
				1274	*
				1275	* This function tries set_cpus_allowed() and locks gcwq and verifies
				1276	* the binding against GCWQ_DISASSOCIATED which is set during
				1277	* CPU_DYING and cleared during CPU_ONLINE, so if the worker enters
				1278	* idle state or fetches works without dropping lock, it can guarantee
				1279	* the scheduling requirement described in the first paragraph.
				1280	*
				1281	* CONTEXT:
				1282	* Might sleep. Called without any lock but returns with gcwq->lock
				1283	* held.
				1284	*
				1285	* RETURNS:
				1286	* %true if the associated gcwq is online (@worker is successfully
				1287	* bound), %false if offline.
				1288	*/
				1289	static bool worker_maybe_bind_and_lock(struct worker *worker)
Namhyung Kim	972fa1c	2010-08-22 23:19:43 +0900	[diff] [blame]	1290	__acquires(&gcwq->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1291	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1292	struct global_cwq *gcwq = worker->pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1293	struct task_struct *task = worker->task;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1294
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1295	while (true) {
				1296	/*
				1297	* The following call may fail, succeed or succeed
				1298	* without actually migrating the task to the cpu if
				1299	* it races with cpu hotunplug operation. Verify
				1300	* against GCWQ_DISASSOCIATED.
				1301	*/
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1302	if (!(gcwq->flags & GCWQ_DISASSOCIATED))
				1303	set_cpus_allowed_ptr(task, get_cpu_mask(gcwq->cpu));
Oleg Nesterov	85f4186	2007-05-09 02:34:20 -0700	[diff] [blame]	1304
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1305	spin_lock_irq(&gcwq->lock);
				1306	if (gcwq->flags & GCWQ_DISASSOCIATED)
				1307	return false;
				1308	if (task_cpu(task) == gcwq->cpu &&
				1309	cpumask_equal(&current->cpus_allowed,
				1310	get_cpu_mask(gcwq->cpu)))
				1311	return true;
				1312	spin_unlock_irq(&gcwq->lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1313
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1314	/*
				1315	* We've raced with CPU hot[un]plug. Give it a breather
				1316	* and retry migration. cond_resched() is required here;
				1317	* otherwise, we might deadlock against cpu_stop trying to
				1318	* bring down the CPU on non-preemptive kernel.
				1319	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1320	cpu_relax();
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1321	cond_resched();
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1322	}
				1323	}
				1324
				1325	/*
				1326	* Function for worker->rebind_work used to rebind rogue busy workers
				1327	* to the associated cpu which is coming back online. This is
				1328	* scheduled by cpu up but can race with other cpu hotplug operations
				1329	* and may be executed twice without intervening cpu down.
				1330	*/
				1331	static void worker_rebind_fn(struct work_struct *work)
				1332	{
				1333	struct worker *worker = container_of(work, struct worker, rebind_work);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1334	struct global_cwq *gcwq = worker->pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1335
				1336	if (worker_maybe_bind_and_lock(worker))
				1337	worker_clr_flags(worker, WORKER_REBIND);
				1338
				1339	spin_unlock_irq(&gcwq->lock);
				1340	}
				1341
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1342	static struct worker *alloc_worker(void)
				1343	{
				1344	struct worker *worker;
				1345
				1346	worker = kzalloc(sizeof(*worker), GFP_KERNEL);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1347	if (worker) {
				1348	INIT_LIST_HEAD(&worker->entry);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1349	INIT_LIST_HEAD(&worker->scheduled);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1350	INIT_WORK(&worker->rebind_work, worker_rebind_fn);
				1351	/* on creation a worker is in !idle && prep state */
				1352	worker->flags = WORKER_PREP;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1353	}
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1354	return worker;
				1355	}
				1356
				1357	/**
				1358	* create_worker - create a new workqueue worker
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1359	* @pool: pool the new worker will belong to
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1360	* @bind: whether to set affinity to @cpu or not
				1361	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1362	* Create a new worker which is bound to @pool. The returned worker
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1363	* can be started by calling start_worker() or destroyed using
				1364	* destroy_worker().
				1365	*
				1366	* CONTEXT:
				1367	* Might sleep. Does GFP_KERNEL allocations.
				1368	*
				1369	* RETURNS:
				1370	* Pointer to the newly created worker.
				1371	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1372	static struct worker create_worker(struct worker_pool pool, bool bind)
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1373	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1374	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1375	bool on_unbound_cpu = gcwq->cpu == WORK_CPU_UNBOUND;
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1376	const char *pri = worker_pool_pri(pool) ? "H" : "";
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1377	struct worker *worker = NULL;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1378	int id = -1;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1379
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1380	spin_lock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1381	while (ida_get_new(&pool->worker_ida, &id)) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1382	spin_unlock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1383	if (!ida_pre_get(&pool->worker_ida, GFP_KERNEL))
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1384	goto fail;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1385	spin_lock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1386	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1387	spin_unlock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1388
				1389	worker = alloc_worker();
				1390	if (!worker)
				1391	goto fail;
				1392
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1393	worker->pool = pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1394	worker->id = id;
				1395
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1396	if (!on_unbound_cpu)
Eric Dumazet	94dcf29	2011-03-22 16:30:45 -0700	[diff] [blame]	1397	worker->task = kthread_create_on_node(worker_thread,
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1398	worker, cpu_to_node(gcwq->cpu),
				1399	"kworker/%u:%d%s", gcwq->cpu, id, pri);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1400	else
				1401	worker->task = kthread_create(worker_thread, worker,
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1402	"kworker/u:%d%s", id, pri);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1403	if (IS_ERR(worker->task))
				1404	goto fail;
				1405
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1406	if (worker_pool_pri(pool))
				1407	set_user_nice(worker->task, HIGHPRI_NICE_LEVEL);
				1408
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1409	/*
				1410	* A rogue worker will become a regular one if CPU comes
				1411	* online later on. Make sure every worker has
				1412	* PF_THREAD_BOUND set.
				1413	*/
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1414	if (bind && !on_unbound_cpu)
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1415	kthread_bind(worker->task, gcwq->cpu);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1416	else {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1417	worker->task->flags \|= PF_THREAD_BOUND;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1418	if (on_unbound_cpu)
				1419	worker->flags \|= WORKER_UNBOUND;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1420	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1421
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1422	return worker;
				1423	fail:
				1424	if (id >= 0) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1425	spin_lock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1426	ida_remove(&pool->worker_ida, id);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1427	spin_unlock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1428	}
				1429	kfree(worker);
				1430	return NULL;
				1431	}
				1432
				1433	/**
				1434	* start_worker - start a newly created worker
				1435	* @worker: worker to start
				1436	*
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1437	* Make the gcwq aware of @worker and start it.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1438	*
				1439	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1440	* spin_lock_irq(gcwq->lock).
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1441	*/
				1442	static void start_worker(struct worker *worker)
				1443	{
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1444	worker->flags \|= WORKER_STARTED;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1445	worker->pool->nr_workers++;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1446	worker_enter_idle(worker);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1447	wake_up_process(worker->task);
				1448	}
				1449
				1450	/**
				1451	* destroy_worker - destroy a workqueue worker
				1452	* @worker: worker to be destroyed
				1453	*
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1454	* Destroy @worker and adjust @gcwq stats accordingly.
				1455	*
				1456	* CONTEXT:
				1457	* spin_lock_irq(gcwq->lock) which is released and regrabbed.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1458	*/
				1459	static void destroy_worker(struct worker *worker)
				1460	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1461	struct worker_pool *pool = worker->pool;
				1462	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1463	int id = worker->id;
				1464
				1465	/* sanity check frenzy */
				1466	BUG_ON(worker->current_work);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1467	BUG_ON(!list_empty(&worker->scheduled));
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1468
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1469	if (worker->flags & WORKER_STARTED)
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1470	pool->nr_workers--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1471	if (worker->flags & WORKER_IDLE)
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1472	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1473
				1474	list_del_init(&worker->entry);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1475	worker->flags \|= WORKER_DIE;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1476
				1477	spin_unlock_irq(&gcwq->lock);
				1478
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1479	kthread_stop(worker->task);
				1480	kfree(worker);
				1481
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1482	spin_lock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1483	ida_remove(&pool->worker_ida, id);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1484	}
				1485
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1486	static void idle_worker_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1487	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1488	struct worker_pool pool = (void )__pool;
				1489	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1490
				1491	spin_lock_irq(&gcwq->lock);
				1492
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1493	if (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1494	struct worker *worker;
				1495	unsigned long expires;
				1496
				1497	/* idle_list is kept in LIFO order, check the last one */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1498	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1499	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1500
				1501	if (time_before(jiffies, expires))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1502	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1503	else {
				1504	/* it's been idle for too long, wake up manager */
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1505	pool->flags \|= POOL_MANAGE_WORKERS;
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1506	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1507	}
				1508	}
				1509
				1510	spin_unlock_irq(&gcwq->lock);
				1511	}
				1512
				1513	static bool send_mayday(struct work_struct *work)
				1514	{
				1515	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
				1516	struct workqueue_struct *wq = cwq->wq;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1517	unsigned int cpu;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1518
				1519	if (!(wq->flags & WQ_RESCUER))
				1520	return false;
				1521
				1522	/* mayday mayday mayday */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1523	cpu = cwq->pool->gcwq->cpu;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1524	/* WORK_CPU_UNBOUND can't be set in cpumask, use cpu 0 instead */
				1525	if (cpu == WORK_CPU_UNBOUND)
				1526	cpu = 0;
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	1527	if (!mayday_test_and_set_cpu(cpu, wq->mayday_mask))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1528	wake_up_process(wq->rescuer->task);
				1529	return true;
				1530	}
				1531
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1532	static void gcwq_mayday_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1533	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1534	struct worker_pool pool = (void )__pool;
				1535	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1536	struct work_struct *work;
				1537
				1538	spin_lock_irq(&gcwq->lock);
				1539
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1540	if (need_to_create_worker(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1541	/*
				1542	* We've been trying to create a new worker but
				1543	* haven't been successful. We might be hitting an
				1544	* allocation deadlock. Send distress signals to
				1545	* rescuers.
				1546	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1547	list_for_each_entry(work, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1548	send_mayday(work);
				1549	}
				1550
				1551	spin_unlock_irq(&gcwq->lock);
				1552
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1553	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INTERVAL);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1554	}
				1555
				1556	/**
				1557	* maybe_create_worker - create a new worker if necessary
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1558	* @pool: pool to create a new worker for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1559	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1560	* Create a new worker for @pool if necessary. @pool is guaranteed to
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1561	* have at least one idle worker on return from this function. If
				1562	* creating a new worker takes longer than MAYDAY_INTERVAL, mayday is
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1563	* sent to all rescuers with works scheduled on @pool to resolve
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1564	* possible allocation deadlock.
				1565	*
				1566	* On return, need_to_create_worker() is guaranteed to be false and
				1567	* may_start_working() true.
				1568	*
				1569	* LOCKING:
				1570	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1571	* multiple times. Does GFP_KERNEL allocations. Called only from
				1572	* manager.
				1573	*
				1574	* RETURNS:
				1575	* false if no action was taken and gcwq->lock stayed locked, true
				1576	* otherwise.
				1577	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1578	static bool maybe_create_worker(struct worker_pool *pool)
Namhyung Kim	06bd6eb	2010-08-22 23:19:42 +0900	[diff] [blame]	1579	__releases(&gcwq->lock)
				1580	__acquires(&gcwq->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1581	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1582	struct global_cwq *gcwq = pool->gcwq;
				1583
				1584	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1585	return false;
				1586	restart:
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1587	spin_unlock_irq(&gcwq->lock);
				1588
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1589	/* if we don't make progress in MAYDAY_INITIAL_TIMEOUT, call for help */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1590	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INITIAL_TIMEOUT);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1591
				1592	while (true) {
				1593	struct worker *worker;
				1594
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1595	worker = create_worker(pool, true);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1596	if (worker) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1597	del_timer_sync(&pool->mayday_timer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1598	spin_lock_irq(&gcwq->lock);
				1599	start_worker(worker);
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1600	BUG_ON(need_to_create_worker(pool));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1601	return true;
				1602	}
				1603
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1604	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1605	break;
				1606
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1607	__set_current_state(TASK_INTERRUPTIBLE);
				1608	schedule_timeout(CREATE_COOLDOWN);
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1609
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1610	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1611	break;
				1612	}
				1613
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1614	del_timer_sync(&pool->mayday_timer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1615	spin_lock_irq(&gcwq->lock);
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1616	if (need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1617	goto restart;
				1618	return true;
				1619	}
				1620
				1621	/**
				1622	* maybe_destroy_worker - destroy workers which have been idle for a while
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1623	* @pool: pool to destroy workers for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1624	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1625	* Destroy @pool workers which have been idle for longer than
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1626	* IDLE_WORKER_TIMEOUT.
				1627	*
				1628	* LOCKING:
				1629	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1630	* multiple times. Called only from manager.
				1631	*
				1632	* RETURNS:
				1633	* false if no action was taken and gcwq->lock stayed locked, true
				1634	* otherwise.
				1635	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1636	static bool maybe_destroy_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1637	{
				1638	bool ret = false;
				1639
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1640	while (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1641	struct worker *worker;
				1642	unsigned long expires;
				1643
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1644	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1645	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1646
				1647	if (time_before(jiffies, expires)) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1648	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1649	break;
				1650	}
				1651
				1652	destroy_worker(worker);
				1653	ret = true;
				1654	}
				1655
				1656	return ret;
				1657	}
				1658
				1659	/**
				1660	* manage_workers - manage worker pool
				1661	* @worker: self
				1662	*
				1663	* Assume the manager role and manage gcwq worker pool @worker belongs
				1664	* to. At any given time, there can be only zero or one manager per
				1665	* gcwq. The exclusion is handled automatically by this function.
				1666	*
				1667	* The caller can safely start processing works on false return. On
				1668	* true return, it's guaranteed that need_to_create_worker() is false
				1669	* and may_start_working() is true.
				1670	*
				1671	* CONTEXT:
				1672	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1673	* multiple times. Does GFP_KERNEL allocations.
				1674	*
				1675	* RETURNS:
				1676	* false if no action was taken and gcwq->lock stayed locked, true if
				1677	* some action was taken.
				1678	*/
				1679	static bool manage_workers(struct worker *worker)
				1680	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1681	struct worker_pool *pool = worker->pool;
				1682	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1683	bool ret = false;
				1684
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1685	if (pool->flags & POOL_MANAGING_WORKERS)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1686	return ret;
				1687
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1688	pool->flags &= ~POOL_MANAGE_WORKERS;
				1689	pool->flags \|= POOL_MANAGING_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1690
				1691	/*
				1692	* Destroy and then create so that may_start_working() is true
				1693	* on return.
				1694	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1695	ret \|= maybe_destroy_workers(pool);
				1696	ret \|= maybe_create_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1697
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1698	pool->flags &= ~POOL_MANAGING_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1699
				1700	/*
				1701	* The trustee might be waiting to take over the manager
				1702	* position, tell it we're done.
				1703	*/
				1704	if (unlikely(gcwq->trustee))
				1705	wake_up_all(&gcwq->trustee_wait);
				1706
				1707	return ret;
				1708	}
				1709
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1710	/**
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1711	* move_linked_works - move linked works to a list
				1712	* @work: start of series of works to be scheduled
				1713	* @head: target list to append @work to
				1714	* @nextp: out paramter for nested worklist walking
				1715	*
				1716	* Schedule linked works starting from @work to @head. Work series to
				1717	* be scheduled starts at @work and includes any consecutive work with
				1718	* WORK_STRUCT_LINKED set in its predecessor.
				1719	*
				1720	* If @nextp is not NULL, it's updated to point to the next work of
				1721	* the last scheduled work. This allows move_linked_works() to be
				1722	* nested inside outer list_for_each_entry_safe().
				1723	*
				1724	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1725	* spin_lock_irq(gcwq->lock).
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1726	*/
				1727	static void move_linked_works(struct work_struct work, struct list_head head,
				1728	struct work_struct **nextp)
				1729	{
				1730	struct work_struct *n;
				1731
				1732	/*
				1733	* Linked worklist will always end before the end of the list,
				1734	* use NULL for list head.
				1735	*/
				1736	list_for_each_entry_safe_from(work, n, NULL, entry) {
				1737	list_move_tail(&work->entry, head);
				1738	if (!(*work_data_bits(work) & WORK_STRUCT_LINKED))
				1739	break;
				1740	}
				1741
				1742	/*
				1743	* If we're already inside safe list traversal and have moved
				1744	* multiple works to the scheduled queue, the next position
				1745	* needs to be updated.
				1746	*/
				1747	if (nextp)
				1748	*nextp = n;
				1749	}
				1750
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	1751	static void cwq_activate_delayed_work(struct work_struct *work)
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1752	{
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	1753	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1754
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1755	trace_workqueue_activate_work(work);
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1756	move_linked_works(work, &cwq->pool->worklist, NULL);
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1757	__clear_bit(WORK_STRUCT_DELAYED_BIT, work_data_bits(work));
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1758	cwq->nr_active++;
				1759	}
				1760
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	1761	static void cwq_activate_first_delayed(struct cpu_workqueue_struct *cwq)
				1762	{
				1763	struct work_struct *work = list_first_entry(&cwq->delayed_works,
				1764	struct work_struct, entry);
				1765
				1766	cwq_activate_delayed_work(work);
				1767	}
				1768
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1769	/**
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1770	* cwq_dec_nr_in_flight - decrement cwq's nr_in_flight
				1771	* @cwq: cwq of interest
				1772	* @color: color of work which left the queue
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1773	* @delayed: for a delayed work
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1774	*
				1775	* A work either has completed or is removed from pending queue,
				1776	* decrement nr_in_flight of its cwq and handle workqueue flushing.
				1777	*
				1778	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1779	* spin_lock_irq(gcwq->lock).
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1780	*/
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1781	static void cwq_dec_nr_in_flight(struct cpu_workqueue_struct *cwq, int color,
				1782	bool delayed)
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1783	{
				1784	/* ignore uncolored works */
				1785	if (color == WORK_NO_COLOR)
				1786	return;
				1787
				1788	cwq->nr_in_flight[color]--;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1789
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1790	if (!delayed) {
				1791	cwq->nr_active--;
				1792	if (!list_empty(&cwq->delayed_works)) {
				1793	/* one down, submit a delayed one */
				1794	if (cwq->nr_active < cwq->max_active)
				1795	cwq_activate_first_delayed(cwq);
				1796	}
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1797	}
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1798
				1799	/* is flush in progress and are we at the flushing tip? */
				1800	if (likely(cwq->flush_color != color))
				1801	return;
				1802
				1803	/* are there still in-flight works? */
				1804	if (cwq->nr_in_flight[color])
				1805	return;
				1806
				1807	/* this cwq is done, clear flush_color */
				1808	cwq->flush_color = -1;
				1809
				1810	/*
				1811	* If this was the last cwq, wake up the first flusher. It
				1812	* will handle the rest.
				1813	*/
				1814	if (atomic_dec_and_test(&cwq->wq->nr_cwqs_to_flush))
				1815	complete(&cwq->wq->first_flusher->done);
				1816	}
				1817
				1818	/**
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1819	* process_one_work - process single work
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1820	* @worker: self
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1821	* @work: work to process
				1822	*
				1823	* Process @work. This function contains all the logics necessary to
				1824	* process a single work including synchronization against and
				1825	* interaction with other workers on the same cpu, queueing and
				1826	* flushing. As long as context requirement is met, any worker can
				1827	* call this function to process a work.
				1828	*
				1829	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1830	* spin_lock_irq(gcwq->lock) which is released and regrabbed.
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1831	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1832	static void process_one_work(struct worker worker, struct work_struct work)
Namhyung Kim	06bd6eb	2010-08-22 23:19:42 +0900	[diff] [blame]	1833	__releases(&gcwq->lock)
				1834	__acquires(&gcwq->lock)
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1835	{
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1836	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1837	struct worker_pool *pool = worker->pool;
				1838	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1839	struct hlist_head *bwh = busy_worker_head(gcwq, work);
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1840	bool cpu_intensive = cwq->wq->flags & WQ_CPU_INTENSIVE;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1841	int work_color;
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1842	struct worker *collision;
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1843	#ifdef CONFIG_LOCKDEP
				1844	/*
				1845	* It is permissible to free the struct work_struct from
				1846	* inside the function that is called from it, this we need to
				1847	* take into account for lockdep too. To avoid bogus "held
				1848	* lock freed" warnings as well as problems when looking into
				1849	* work->lockdep_map, make a copy and use that here.
				1850	*/
				1851	struct lockdep_map lockdep_map = work->lockdep_map;
				1852	#endif
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1853	/*
				1854	* A single work shouldn't be executed concurrently by
				1855	* multiple workers on a single cpu. Check whether anyone is
				1856	* already processing the work. If so, defer the work to the
				1857	* currently executing one.
				1858	*/
				1859	collision = __find_worker_executing_work(gcwq, bwh, work);
				1860	if (unlikely(collision)) {
				1861	move_linked_works(work, &collision->scheduled, NULL);
				1862	return;
				1863	}
				1864
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1865	/* claim and process */
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1866	debug_work_deactivate(work);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1867	hlist_add_head(&worker->hentry, bwh);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1868	worker->current_work = work;
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1869	worker->current_func = work->func;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	1870	worker->current_cwq = cwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1871	work_color = get_work_color(work);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1872
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1873	/* record the current cpu number in the work data and dequeue */
				1874	set_work_cpu(work, gcwq->cpu);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1875	list_del_init(&work->entry);
				1876
Tejun Heo	649027d	2010-06-29 10:07:14 +0200	[diff] [blame]	1877	/*
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1878	* CPU intensive works don't participate in concurrency
				1879	* management. They're the scheduler's responsibility.
				1880	*/
				1881	if (unlikely(cpu_intensive))
				1882	worker_set_flags(worker, WORKER_CPU_INTENSIVE, true);
				1883
Tejun Heo	b7b5c68	2012-07-12 14:46:37 -0700	[diff] [blame]	1884	/*
				1885	* Unbound gcwq isn't concurrency managed and work items should be
				1886	* executed ASAP. Wake up another worker if necessary.
				1887	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1888	if ((worker->flags & WORKER_UNBOUND) && need_more_worker(pool))
				1889	wake_up_worker(pool);
Tejun Heo	b7b5c68	2012-07-12 14:46:37 -0700	[diff] [blame]	1890
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1891	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1892
Tejun Heo	66307ae	2012-08-03 10:30:45 -0700	[diff] [blame]	1893	smp_wmb(); /* paired with test_and_set_bit(PENDING) */
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1894	work_clear_pending(work);
Tejun Heo	66307ae	2012-08-03 10:30:45 -0700	[diff] [blame]	1895
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	1896	lock_map_acquire_read(&cwq->wq->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1897	lock_map_acquire(&lockdep_map);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	1898	trace_workqueue_execute_start(work);
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1899	worker->current_func(work);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	1900	/*
				1901	* While we must be careful to not use "work" after this, the trace
				1902	* point will only record its address.
				1903	*/
				1904	trace_workqueue_execute_end(work);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1905	lock_map_release(&lockdep_map);
				1906	lock_map_release(&cwq->wq->lockdep_map);
				1907
				1908	if (unlikely(in_atomic() \|\| lockdep_depth(current) > 0)) {
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1909	pr_err("BUG: workqueue leaked lock or atomic: %s/0x%08x/%d\n"
				1910	" last function: %pf\n",
				1911	current->comm, preempt_count(), task_pid_nr(current),
				1912	worker->current_func);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1913	debug_show_held_locks(current);
Syed Rameez Mustafa	1bee7b9	2013-07-15 11:52:09 -0700	[diff] [blame]	1914	BUG_ON(PANIC_CORRUPTION);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1915	dump_stack();
				1916	}
				1917
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1918	spin_lock_irq(&gcwq->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1919
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1920	/* clear cpu intensive status */
				1921	if (unlikely(cpu_intensive))
				1922	worker_clr_flags(worker, WORKER_CPU_INTENSIVE);
				1923
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1924	/* we're done with it, release */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1925	hlist_del_init(&worker->hentry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1926	worker->current_work = NULL;
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1927	worker->current_func = NULL;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	1928	worker->current_cwq = NULL;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1929	cwq_dec_nr_in_flight(cwq, work_color, false);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1930	}
				1931
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1932	/**
				1933	* process_scheduled_works - process scheduled works
				1934	* @worker: self
				1935	*
				1936	* Process all scheduled works. Please note that the scheduled list
				1937	* may change while processing a work, so this function repeatedly
				1938	* fetches a work from the top and executes it.
				1939	*
				1940	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1941	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1942	* multiple times.
				1943	*/
				1944	static void process_scheduled_works(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1945	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1946	while (!list_empty(&worker->scheduled)) {
				1947	struct work_struct *work = list_first_entry(&worker->scheduled,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1948	struct work_struct, entry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1949	process_one_work(worker, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1950	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1951	}
				1952
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1953	/**
				1954	* worker_thread - the worker thread function
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1955	* @__worker: self
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1956	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1957	* The gcwq worker thread function. There's a single dynamic pool of
				1958	* these per each cpu. These workers process all works regardless of
				1959	* their specific target workqueue. The only exception is works which
				1960	* belong to workqueues with a rescuer which will be explained in
				1961	* rescuer_thread().
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1962	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1963	static int worker_thread(void *__worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1964	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1965	struct worker *worker = __worker;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1966	struct worker_pool *pool = worker->pool;
				1967	struct global_cwq *gcwq = pool->gcwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1968
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1969	/* tell the scheduler that this is a workqueue worker */
				1970	worker->task->flags \|= PF_WQ_WORKER;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1971	woke_up:
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1972	spin_lock_irq(&gcwq->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1973
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1974	/* DIE can be set only while we're idle, checking here is enough */
				1975	if (worker->flags & WORKER_DIE) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1976	spin_unlock_irq(&gcwq->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1977	worker->task->flags &= ~PF_WQ_WORKER;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1978	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1979	}
				1980
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1981	worker_leave_idle(worker);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1982	recheck:
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1983	/* no more worker necessary? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1984	if (!need_more_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1985	goto sleep;
				1986
				1987	/* do we need to manage? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1988	if (unlikely(!may_start_working(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1989	goto recheck;
				1990
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1991	/*
				1992	* ->scheduled list can only be filled while a worker is
				1993	* preparing to process a work or actually processing it.
				1994	* Make sure nobody diddled with it while I was sleeping.
				1995	*/
				1996	BUG_ON(!list_empty(&worker->scheduled));
				1997
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1998	/*
				1999	* When control reaches this point, we're guaranteed to have
				2000	* at least one idle worker or that someone else has already
				2001	* assumed the manager role.
				2002	*/
				2003	worker_clr_flags(worker, WORKER_PREP);
				2004
				2005	do {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2006	struct work_struct *work =
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2007	list_first_entry(&pool->worklist,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2008	struct work_struct, entry);
				2009
				2010	if (likely(!(*work_data_bits(work) & WORK_STRUCT_LINKED))) {
				2011	/* optimization path, not strictly necessary */
				2012	process_one_work(worker, work);
				2013	if (unlikely(!list_empty(&worker->scheduled)))
				2014	process_scheduled_works(worker);
				2015	} else {
				2016	move_linked_works(work, &worker->scheduled, NULL);
				2017	process_scheduled_works(worker);
				2018	}
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	2019	} while (keep_working(pool));
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2020
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2021	worker_set_flags(worker, WORKER_PREP, false);
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2022	sleep:
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	2023	if (unlikely(need_to_manage_workers(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2024	goto recheck;
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2025
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2026	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2027	* gcwq->lock is held and there's no work to process and no
				2028	* need to manage, sleep. Workers are woken up only while
				2029	* holding gcwq->lock or from local cpu, so setting the
				2030	* current state before releasing gcwq->lock is enough to
				2031	* prevent losing any event.
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2032	*/
				2033	worker_enter_idle(worker);
				2034	__set_current_state(TASK_INTERRUPTIBLE);
				2035	spin_unlock_irq(&gcwq->lock);
				2036	schedule();
				2037	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2038	}
				2039
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2040	/**
				2041	* rescuer_thread - the rescuer thread function
				2042	* @__wq: the associated workqueue
				2043	*
				2044	* Workqueue rescuer thread function. There's one rescuer for each
				2045	* workqueue which has WQ_RESCUER set.
				2046	*
				2047	* Regular work processing on a gcwq may block trying to create a new
				2048	* worker which uses GFP_KERNEL allocation which has slight chance of
				2049	* developing into deadlock if some works currently on the same queue
				2050	* need to be processed to satisfy the GFP_KERNEL allocation. This is
				2051	* the problem rescuer solves.
				2052	*
				2053	* When such condition is possible, the gcwq summons rescuers of all
				2054	* workqueues which have works queued on the gcwq and let them process
				2055	* those works so that forward progress can be guaranteed.
				2056	*
				2057	* This should happen rarely.
				2058	*/
				2059	static int rescuer_thread(void *__wq)
				2060	{
				2061	struct workqueue_struct *wq = __wq;
				2062	struct worker *rescuer = wq->rescuer;
				2063	struct list_head *scheduled = &rescuer->scheduled;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2064	bool is_unbound = wq->flags & WQ_UNBOUND;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2065	unsigned int cpu;
				2066
				2067	set_user_nice(current, RESCUER_NICE_LEVEL);
				2068	repeat:
				2069	set_current_state(TASK_INTERRUPTIBLE);
				2070
Mike Galbraith	dbdd7f0	2012-11-28 07:17:18 +0100	[diff] [blame]	2071	if (kthread_should_stop()) {
				2072	__set_current_state(TASK_RUNNING);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2073	return 0;
Mike Galbraith	dbdd7f0	2012-11-28 07:17:18 +0100	[diff] [blame]	2074	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2075
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2076	/*
				2077	* See whether any cpu is asking for help. Unbounded
				2078	* workqueues use cpu 0 in mayday_mask for CPU_UNBOUND.
				2079	*/
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	2080	for_each_mayday_cpu(cpu, wq->mayday_mask) {
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2081	unsigned int tcpu = is_unbound ? WORK_CPU_UNBOUND : cpu;
				2082	struct cpu_workqueue_struct *cwq = get_cwq(tcpu, wq);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2083	struct worker_pool *pool = cwq->pool;
				2084	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2085	struct work_struct work, n;
				2086
				2087	__set_current_state(TASK_RUNNING);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	2088	mayday_clear_cpu(cpu, wq->mayday_mask);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2089
				2090	/* migrate to the target cpu if possible */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2091	rescuer->pool = pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2092	worker_maybe_bind_and_lock(rescuer);
				2093
				2094	/*
				2095	* Slurp in all works issued via this workqueue and
				2096	* process'em.
				2097	*/
				2098	BUG_ON(!list_empty(&rescuer->scheduled));
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2099	list_for_each_entry_safe(work, n, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2100	if (get_work_cwq(work) == cwq)
				2101	move_linked_works(work, scheduled, &n);
				2102
				2103	process_scheduled_works(rescuer);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2104
				2105	/*
				2106	* Leave this gcwq. If keep_working() is %true, notify a
				2107	* regular worker; otherwise, we end up with 0 concurrency
				2108	* and stalling the execution.
				2109	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	2110	if (keep_working(pool))
				2111	wake_up_worker(pool);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2112
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2113	spin_unlock_irq(&gcwq->lock);
				2114	}
				2115
				2116	schedule();
				2117	goto repeat;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2118	}
				2119
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2120	struct wq_barrier {
				2121	struct work_struct work;
				2122	struct completion done;
				2123	};
				2124
				2125	static void wq_barrier_func(struct work_struct *work)
				2126	{
				2127	struct wq_barrier *barr = container_of(work, struct wq_barrier, work);
				2128	complete(&barr->done);
				2129	}
				2130
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2131	/**
				2132	* insert_wq_barrier - insert a barrier work
				2133	* @cwq: cwq to insert barrier into
				2134	* @barr: wq_barrier to insert
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2135	* @target: target work to attach @barr to
				2136	* @worker: worker currently executing @target, NULL if @target is not executing
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2137	*
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2138	* @barr is linked to @target such that @barr is completed only after
				2139	* @target finishes execution. Please note that the ordering
				2140	* guarantee is observed only with respect to @target and on the local
				2141	* cpu.
				2142	*
				2143	* Currently, a queued barrier can't be canceled. This is because
				2144	* try_to_grab_pending() can't determine whether the work to be
				2145	* grabbed is at the head of the queue and thus can't clear LINKED
				2146	* flag of the previous work while there must be a valid next work
				2147	* after a work with LINKED flag set.
				2148	*
				2149	* Note that when @worker is non-NULL, @target may be modified
				2150	* underneath us, so we can't reliably determine cwq from @target.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2151	*
				2152	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2153	* spin_lock_irq(gcwq->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2154	*/
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2155	static void insert_wq_barrier(struct cpu_workqueue_struct *cwq,
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2156	struct wq_barrier *barr,
				2157	struct work_struct target, struct worker worker)
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2158	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2159	struct list_head *head;
				2160	unsigned int linked = 0;
				2161
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2162	/*
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2163	* debugobject calls are safe here even with gcwq->lock locked
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2164	* as we know for sure that this will not trigger any of the
				2165	* checks and call back into the fixup functions where we
				2166	* might deadlock.
				2167	*/
Andrew Morton	ca1cab3	2010-10-26 14:22:34 -0700	[diff] [blame]	2168	INIT_WORK_ONSTACK(&barr->work, wq_barrier_func);
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2169	__set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(&barr->work));
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2170	init_completion(&barr->done);
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2171
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2172	/*
				2173	* If @target is currently being executed, schedule the
				2174	* barrier to the worker; otherwise, put it after @target.
				2175	*/
				2176	if (worker)
				2177	head = worker->scheduled.next;
				2178	else {
				2179	unsigned long *bits = work_data_bits(target);
				2180
				2181	head = target->entry.next;
				2182	/* there can already be other linked works, inherit and set */
				2183	linked = *bits & WORK_STRUCT_LINKED;
				2184	__set_bit(WORK_STRUCT_LINKED_BIT, bits);
				2185	}
				2186
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2187	debug_work_activate(&barr->work);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2188	insert_work(cwq, &barr->work, head,
				2189	work_color_to_flags(WORK_NO_COLOR) \| linked);
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2190	}
				2191
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2192	/**
				2193	* flush_workqueue_prep_cwqs - prepare cwqs for workqueue flushing
				2194	* @wq: workqueue being flushed
				2195	* @flush_color: new flush color, < 0 for no-op
				2196	* @work_color: new work color, < 0 for no-op
				2197	*
				2198	* Prepare cwqs for workqueue flushing.
				2199	*
				2200	* If @flush_color is non-negative, flush_color on all cwqs should be
				2201	* -1. If no cwq has in-flight commands at the specified color, all
				2202	* cwq->flush_color's stay at -1 and %false is returned. If any cwq
				2203	* has in flight commands, its cwq->flush_color is set to
				2204	* @flush_color, @wq->nr_cwqs_to_flush is updated accordingly, cwq
				2205	* wakeup logic is armed and %true is returned.
				2206	*
				2207	* The caller should have initialized @wq->first_flusher prior to
				2208	* calling this function with non-negative @flush_color. If
				2209	* @flush_color is negative, no flush color update is done and %false
				2210	* is returned.
				2211	*
				2212	* If @work_color is non-negative, all cwqs should have the same
				2213	* work_color which is previous to @work_color and all will be
				2214	* advanced to @work_color.
				2215	*
				2216	* CONTEXT:
				2217	* mutex_lock(wq->flush_mutex).
				2218	*
				2219	* RETURNS:
				2220	* %true if @flush_color >= 0 and there's something to flush. %false
				2221	* otherwise.
				2222	*/
				2223	static bool flush_workqueue_prep_cwqs(struct workqueue_struct *wq,
				2224	int flush_color, int work_color)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2225	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2226	bool wait = false;
				2227	unsigned int cpu;
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2228
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2229	if (flush_color >= 0) {
				2230	BUG_ON(atomic_read(&wq->nr_cwqs_to_flush));
				2231	atomic_set(&wq->nr_cwqs_to_flush, 1);
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2232	}
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2233
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2234	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2235	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2236	struct global_cwq *gcwq = cwq->pool->gcwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2237
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2238	spin_lock_irq(&gcwq->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2239
				2240	if (flush_color >= 0) {
				2241	BUG_ON(cwq->flush_color != -1);
				2242
				2243	if (cwq->nr_in_flight[flush_color]) {
				2244	cwq->flush_color = flush_color;
				2245	atomic_inc(&wq->nr_cwqs_to_flush);
				2246	wait = true;
				2247	}
				2248	}
				2249
				2250	if (work_color >= 0) {
				2251	BUG_ON(work_color != work_next_color(cwq->work_color));
				2252	cwq->work_color = work_color;
				2253	}
				2254
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2255	spin_unlock_irq(&gcwq->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2256	}
				2257
				2258	if (flush_color >= 0 && atomic_dec_and_test(&wq->nr_cwqs_to_flush))
				2259	complete(&wq->first_flusher->done);
				2260
				2261	return wait;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2262	}
				2263
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2264	/**
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2265	* flush_workqueue - ensure that any scheduled work has run to completion.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2266	* @wq: workqueue to flush
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2267	*
				2268	* Forces execution of the workqueue and blocks until its completion.
				2269	* This is typically used in driver shutdown handlers.
				2270	*
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2271	* We sleep until all works which were queued on entry have been handled,
				2272	* but we are not livelocked by new incoming ones.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2273	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2274	void flush_workqueue(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2275	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2276	struct wq_flusher this_flusher = {
				2277	.list = LIST_HEAD_INIT(this_flusher.list),
				2278	.flush_color = -1,
				2279	.done = COMPLETION_INITIALIZER_ONSTACK(this_flusher.done),
				2280	};
				2281	int next_color;
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	2282
Ingo Molnar	3295f0e	2008-08-11 10:30:30 +0200	[diff] [blame]	2283	lock_map_acquire(&wq->lockdep_map);
				2284	lock_map_release(&wq->lockdep_map);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2285
				2286	mutex_lock(&wq->flush_mutex);
				2287
				2288	/*
				2289	* Start-to-wait phase
				2290	*/
				2291	next_color = work_next_color(wq->work_color);
				2292
				2293	if (next_color != wq->flush_color) {
				2294	/*
				2295	* Color space is not full. The current work_color
				2296	* becomes our flush_color and work_color is advanced
				2297	* by one.
				2298	*/
				2299	BUG_ON(!list_empty(&wq->flusher_overflow));
				2300	this_flusher.flush_color = wq->work_color;
				2301	wq->work_color = next_color;
				2302
				2303	if (!wq->first_flusher) {
				2304	/* no flush in progress, become the first flusher */
				2305	BUG_ON(wq->flush_color != this_flusher.flush_color);
				2306
				2307	wq->first_flusher = &this_flusher;
				2308
				2309	if (!flush_workqueue_prep_cwqs(wq, wq->flush_color,
				2310	wq->work_color)) {
				2311	/* nothing to flush, done */
				2312	wq->flush_color = next_color;
				2313	wq->first_flusher = NULL;
				2314	goto out_unlock;
				2315	}
				2316	} else {
				2317	/* wait in queue */
				2318	BUG_ON(wq->flush_color == this_flusher.flush_color);
				2319	list_add_tail(&this_flusher.list, &wq->flusher_queue);
				2320	flush_workqueue_prep_cwqs(wq, -1, wq->work_color);
				2321	}
				2322	} else {
				2323	/*
				2324	* Oops, color space is full, wait on overflow queue.
				2325	* The next flush completion will assign us
				2326	* flush_color and transfer to flusher_queue.
				2327	*/
				2328	list_add_tail(&this_flusher.list, &wq->flusher_overflow);
				2329	}
				2330
				2331	mutex_unlock(&wq->flush_mutex);
				2332
				2333	wait_for_completion(&this_flusher.done);
				2334
				2335	/*
				2336	* Wake-up-and-cascade phase
				2337	*
				2338	* First flushers are responsible for cascading flushes and
				2339	* handling overflow. Non-first flushers can simply return.
				2340	*/
				2341	if (wq->first_flusher != &this_flusher)
				2342	return;
				2343
				2344	mutex_lock(&wq->flush_mutex);
				2345
Tejun Heo	4ce48b3	2010-07-02 10:03:51 +0200	[diff] [blame]	2346	/* we might have raced, check again with mutex held */
				2347	if (wq->first_flusher != &this_flusher)
				2348	goto out_unlock;
				2349
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2350	wq->first_flusher = NULL;
				2351
				2352	BUG_ON(!list_empty(&this_flusher.list));
				2353	BUG_ON(wq->flush_color != this_flusher.flush_color);
				2354
				2355	while (true) {
				2356	struct wq_flusher next, tmp;
				2357
				2358	/* complete all the flushers sharing the current flush color */
				2359	list_for_each_entry_safe(next, tmp, &wq->flusher_queue, list) {
				2360	if (next->flush_color != wq->flush_color)
				2361	break;
				2362	list_del_init(&next->list);
				2363	complete(&next->done);
				2364	}
				2365
				2366	BUG_ON(!list_empty(&wq->flusher_overflow) &&
				2367	wq->flush_color != work_next_color(wq->work_color));
				2368
				2369	/* this flush_color is finished, advance by one */
				2370	wq->flush_color = work_next_color(wq->flush_color);
				2371
				2372	/* one color has been freed, handle overflow queue */
				2373	if (!list_empty(&wq->flusher_overflow)) {
				2374	/*
				2375	* Assign the same color to all overflowed
				2376	* flushers, advance work_color and append to
				2377	* flusher_queue. This is the start-to-wait
				2378	* phase for these overflowed flushers.
				2379	*/
				2380	list_for_each_entry(tmp, &wq->flusher_overflow, list)
				2381	tmp->flush_color = wq->work_color;
				2382
				2383	wq->work_color = work_next_color(wq->work_color);
				2384
				2385	list_splice_tail_init(&wq->flusher_overflow,
				2386	&wq->flusher_queue);
				2387	flush_workqueue_prep_cwqs(wq, -1, wq->work_color);
				2388	}
				2389
				2390	if (list_empty(&wq->flusher_queue)) {
				2391	BUG_ON(wq->flush_color != wq->work_color);
				2392	break;
				2393	}
				2394
				2395	/*
				2396	* Need to flush more colors. Make the next flusher
				2397	* the new first flusher and arm cwqs.
				2398	*/
				2399	BUG_ON(wq->flush_color == wq->work_color);
				2400	BUG_ON(wq->flush_color != next->flush_color);
				2401
				2402	list_del_init(&next->list);
				2403	wq->first_flusher = next;
				2404
				2405	if (flush_workqueue_prep_cwqs(wq, wq->flush_color, -1))
				2406	break;
				2407
				2408	/*
				2409	* Meh... this color is already done, clear first
				2410	* flusher and repeat cascading.
				2411	*/
				2412	wq->first_flusher = NULL;
				2413	}
				2414
				2415	out_unlock:
				2416	mutex_unlock(&wq->flush_mutex);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2417	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2418	EXPORT_SYMBOL_GPL(flush_workqueue);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2419
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2420	/**
				2421	* drain_workqueue - drain a workqueue
				2422	* @wq: workqueue to drain
				2423	*
				2424	* Wait until the workqueue becomes empty. While draining is in progress,
				2425	* only chain queueing is allowed. IOW, only currently pending or running
				2426	* work items on @wq can queue further work items on it. @wq is flushed
				2427	* repeatedly until it becomes empty. The number of flushing is detemined
				2428	* by the depth of chaining and should be relatively short. Whine if it
				2429	* takes too long.
				2430	*/
				2431	void drain_workqueue(struct workqueue_struct *wq)
				2432	{
				2433	unsigned int flush_cnt = 0;
				2434	unsigned int cpu;
				2435
				2436	/*
				2437	* __queue_work() needs to test whether there are drainers, is much
				2438	* hotter than drain_workqueue() and already looks at @wq->flags.
				2439	* Use WQ_DRAINING so that queue doesn't have to check nr_drainers.
				2440	*/
				2441	spin_lock(&workqueue_lock);
				2442	if (!wq->nr_drainers++)
				2443	wq->flags \|= WQ_DRAINING;
				2444	spin_unlock(&workqueue_lock);
				2445	reflush:
				2446	flush_workqueue(wq);
				2447
				2448	for_each_cwq_cpu(cpu, wq) {
				2449	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2450	bool drained;
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2451
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2452	spin_lock_irq(&cwq->pool->gcwq->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2453	drained = !cwq->nr_active && list_empty(&cwq->delayed_works);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2454	spin_unlock_irq(&cwq->pool->gcwq->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2455
				2456	if (drained)
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2457	continue;
				2458
				2459	if (++flush_cnt == 10 \|\|
				2460	(flush_cnt % 100 == 0 && flush_cnt <= 1000))
				2461	pr_warning("workqueue %s: flush on destruction isn't complete after %u tries\n",
				2462	wq->name, flush_cnt);
				2463	goto reflush;
				2464	}
				2465
				2466	spin_lock(&workqueue_lock);
				2467	if (!--wq->nr_drainers)
				2468	wq->flags &= ~WQ_DRAINING;
				2469	spin_unlock(&workqueue_lock);
				2470	}
				2471	EXPORT_SYMBOL_GPL(drain_workqueue);
				2472
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2473	static bool start_flush_work(struct work_struct work, struct wq_barrier barr,
				2474	bool wait_executing)
				2475	{
				2476	struct worker *worker = NULL;
				2477	struct global_cwq *gcwq;
				2478	struct cpu_workqueue_struct *cwq;
				2479
				2480	might_sleep();
				2481	gcwq = get_work_gcwq(work);
				2482	if (!gcwq)
				2483	return false;
				2484
				2485	spin_lock_irq(&gcwq->lock);
				2486	if (!list_empty(&work->entry)) {
				2487	/*
				2488	* See the comment near try_to_grab_pending()->smp_rmb().
				2489	* If it was re-queued to a different gcwq under us, we
				2490	* are not going to wait.
				2491	*/
				2492	smp_rmb();
				2493	cwq = get_work_cwq(work);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2494	if (unlikely(!cwq \|\| gcwq != cwq->pool->gcwq))
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2495	goto already_gone;
				2496	} else if (wait_executing) {
				2497	worker = find_worker_executing_work(gcwq, work);
				2498	if (!worker)
				2499	goto already_gone;
				2500	cwq = worker->current_cwq;
				2501	} else
				2502	goto already_gone;
				2503
				2504	insert_wq_barrier(cwq, barr, work, worker);
				2505	spin_unlock_irq(&gcwq->lock);
				2506
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2507	/*
				2508	* If @max_active is 1 or rescuer is in use, flushing another work
				2509	* item on the same workqueue may lead to deadlock. Make sure the
				2510	* flusher is not running on the same workqueue by verifying write
				2511	* access.
				2512	*/
				2513	if (cwq->wq->saved_max_active == 1 \|\| cwq->wq->flags & WQ_RESCUER)
				2514	lock_map_acquire(&cwq->wq->lockdep_map);
				2515	else
				2516	lock_map_acquire_read(&cwq->wq->lockdep_map);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2517	lock_map_release(&cwq->wq->lockdep_map);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2518
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2519	return true;
				2520	already_gone:
				2521	spin_unlock_irq(&gcwq->lock);
				2522	return false;
				2523	}
				2524
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2525	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2526	* flush_work - wait for a work to finish executing the last queueing instance
				2527	* @work: the work to flush
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2528	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2529	* Wait until @work has finished execution. This function considers
				2530	* only the last queueing instance of @work. If @work has been
				2531	* enqueued across different CPUs on a non-reentrant workqueue or on
				2532	* multiple workqueues, @work might still be executing on return on
				2533	* some of the CPUs from earlier queueing.
Oleg Nesterov	a67da70	2008-07-25 01:47:52 -0700	[diff] [blame]	2534	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2535	* If @work was queued only on a non-reentrant, ordered or unbound
				2536	* workqueue, @work is guaranteed to be idle on return if it hasn't
				2537	* been requeued since flush started.
				2538	*
				2539	* RETURNS:
				2540	* %true if flush_work() waited for the work to finish execution,
				2541	* %false if it was already idle.
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2542	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2543	bool flush_work(struct work_struct *work)
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2544	{
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2545	struct wq_barrier barr;
				2546
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2547	if (start_flush_work(work, &barr, true)) {
				2548	wait_for_completion(&barr.done);
				2549	destroy_work_on_stack(&barr.work);
				2550	return true;
				2551	} else
				2552	return false;
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2553	}
				2554	EXPORT_SYMBOL_GPL(flush_work);
				2555
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2556	static bool wait_on_cpu_work(struct global_cwq gcwq, struct work_struct work)
				2557	{
				2558	struct wq_barrier barr;
				2559	struct worker *worker;
				2560
				2561	spin_lock_irq(&gcwq->lock);
				2562
				2563	worker = find_worker_executing_work(gcwq, work);
				2564	if (unlikely(worker))
				2565	insert_wq_barrier(worker->current_cwq, &barr, work, worker);
				2566
				2567	spin_unlock_irq(&gcwq->lock);
				2568
				2569	if (unlikely(worker)) {
				2570	wait_for_completion(&barr.done);
				2571	destroy_work_on_stack(&barr.work);
				2572	return true;
				2573	} else
				2574	return false;
				2575	}
				2576
				2577	static bool wait_on_work(struct work_struct *work)
				2578	{
				2579	bool ret = false;
				2580	int cpu;
				2581
				2582	might_sleep();
				2583
				2584	lock_map_acquire(&work->lockdep_map);
				2585	lock_map_release(&work->lockdep_map);
				2586
				2587	for_each_gcwq_cpu(cpu)
				2588	ret \|= wait_on_cpu_work(get_gcwq(cpu), work);
				2589	return ret;
				2590	}
				2591
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2592	/**
				2593	* flush_work_sync - wait until a work has finished execution
				2594	* @work: the work to flush
				2595	*
				2596	* Wait until @work has finished execution. On return, it's
				2597	* guaranteed that all queueing instances of @work which happened
				2598	* before this function is called are finished. In other words, if
				2599	* @work hasn't been requeued since this function was called, @work is
				2600	* guaranteed to be idle on return.
				2601	*
				2602	* RETURNS:
				2603	* %true if flush_work_sync() waited for the work to finish execution,
				2604	* %false if it was already idle.
				2605	*/
				2606	bool flush_work_sync(struct work_struct *work)
				2607	{
				2608	struct wq_barrier barr;
				2609	bool pending, waited;
				2610
				2611	/* we'll wait for executions separately, queue barr only if pending */
				2612	pending = start_flush_work(work, &barr, false);
				2613
				2614	/* wait for executions to finish */
				2615	waited = wait_on_work(work);
				2616
				2617	/* wait for the pending one */
				2618	if (pending) {
				2619	wait_for_completion(&barr.done);
				2620	destroy_work_on_stack(&barr.work);
				2621	}
				2622
				2623	return pending \|\| waited;
				2624	}
				2625	EXPORT_SYMBOL_GPL(flush_work_sync);
				2626
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2627	/*
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2628	* Upon a successful return (>= 0), the caller "owns" WORK_STRUCT_PENDING bit,
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2629	* so this work can't be re-armed in any way.
				2630	*/
				2631	static int try_to_grab_pending(struct work_struct *work)
				2632	{
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2633	struct global_cwq *gcwq;
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2634	int ret = -1;
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2635
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2636	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work)))
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2637	return 0;
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2638
				2639	/*
				2640	* The queueing is in progress, or it is already queued. Try to
				2641	* steal it from ->worklist without clearing WORK_STRUCT_PENDING.
				2642	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2643	gcwq = get_work_gcwq(work);
				2644	if (!gcwq)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2645	return ret;
				2646
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2647	spin_lock_irq(&gcwq->lock);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2648	if (!list_empty(&work->entry)) {
				2649	/*
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2650	* This work is queued, but perhaps we locked the wrong gcwq.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2651	* In that case we must see the new value after rmb(), see
				2652	* insert_work()->wmb().
				2653	*/
				2654	smp_rmb();
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2655	if (gcwq == get_work_gcwq(work)) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2656	debug_work_deactivate(work);
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	2657
				2658	/*
				2659	* A delayed work item cannot be grabbed directly
				2660	* because it might have linked NO_COLOR work items
				2661	* which, if left on the delayed_list, will confuse
				2662	* cwq->nr_active management later on and cause
				2663	* stall. Make sure the work item is activated
				2664	* before grabbing.
				2665	*/
				2666	if (*work_data_bits(work) & WORK_STRUCT_DELAYED)
				2667	cwq_activate_delayed_work(work);
				2668
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2669	list_del_init(&work->entry);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2670	cwq_dec_nr_in_flight(get_work_cwq(work),
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	2671	get_work_color(work),
				2672	*work_data_bits(work) & WORK_STRUCT_DELAYED);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2673	ret = 1;
				2674	}
				2675	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2676	spin_unlock_irq(&gcwq->lock);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2677
				2678	return ret;
				2679	}
				2680
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2681	static bool __cancel_work_timer(struct work_struct *work,
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2682	struct timer_list* timer)
				2683	{
				2684	int ret;
				2685
				2686	do {
				2687	ret = (timer && likely(del_timer(timer)));
				2688	if (!ret)
				2689	ret = try_to_grab_pending(work);
				2690	wait_on_work(work);
				2691	} while (unlikely(ret < 0));
				2692
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2693	clear_work_data(work);
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2694	return ret;
				2695	}
				2696
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2697	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2698	* cancel_work_sync - cancel a work and wait for it to finish
				2699	* @work: the work to cancel
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2700	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2701	* Cancel @work and wait for its execution to finish. This function
				2702	* can be used even if the work re-queues itself or migrates to
				2703	* another workqueue. On return from this function, @work is
				2704	* guaranteed to be not pending or executing on any CPU.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2705	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2706	* cancel_work_sync(&delayed_work->work) must not be used for
				2707	* delayed_work's. Use cancel_delayed_work_sync() instead.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2708	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2709	* The caller must ensure that the workqueue on which @work was last
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2710	* queued can't be destroyed before this function returns.
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2711	*
				2712	* RETURNS:
				2713	* %true if @work was pending, %false otherwise.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2714	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2715	bool cancel_work_sync(struct work_struct *work)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2716	{
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2717	return __cancel_work_timer(work, NULL);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2718	}
Oleg Nesterov	28e53bd	2007-05-09 02:34:22 -0700	[diff] [blame]	2719	EXPORT_SYMBOL_GPL(cancel_work_sync);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2720
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2721	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2722	* flush_delayed_work - wait for a dwork to finish executing the last queueing
				2723	* @dwork: the delayed work to flush
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2724	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2725	* Delayed timer is cancelled and the pending work is queued for
				2726	* immediate execution. Like flush_work(), this function only
				2727	* considers the last queueing instance of @dwork.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2728	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2729	* RETURNS:
				2730	* %true if flush_work() waited for the work to finish execution,
				2731	* %false if it was already idle.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2732	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2733	bool flush_delayed_work(struct delayed_work *dwork)
				2734	{
				2735	if (del_timer_sync(&dwork->timer))
				2736	__queue_work(raw_smp_processor_id(),
				2737	get_work_cwq(&dwork->work)->wq, &dwork->work);
				2738	return flush_work(&dwork->work);
				2739	}
				2740	EXPORT_SYMBOL(flush_delayed_work);
				2741
				2742	/**
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2743	* flush_delayed_work_sync - wait for a dwork to finish
				2744	* @dwork: the delayed work to flush
				2745	*
				2746	* Delayed timer is cancelled and the pending work is queued for
				2747	* execution immediately. Other than timer handling, its behavior
				2748	* is identical to flush_work_sync().
				2749	*
				2750	* RETURNS:
				2751	* %true if flush_work_sync() waited for the work to finish execution,
				2752	* %false if it was already idle.
				2753	*/
				2754	bool flush_delayed_work_sync(struct delayed_work *dwork)
				2755	{
				2756	if (del_timer_sync(&dwork->timer))
				2757	__queue_work(raw_smp_processor_id(),
				2758	get_work_cwq(&dwork->work)->wq, &dwork->work);
				2759	return flush_work_sync(&dwork->work);
				2760	}
				2761	EXPORT_SYMBOL(flush_delayed_work_sync);
				2762
				2763	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2764	* cancel_delayed_work_sync - cancel a delayed work and wait for it to finish
				2765	* @dwork: the delayed work cancel
				2766	*
				2767	* This is cancel_work_sync() for delayed works.
				2768	*
				2769	* RETURNS:
				2770	* %true if @dwork was pending, %false otherwise.
				2771	*/
				2772	bool cancel_delayed_work_sync(struct delayed_work *dwork)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2773	{
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2774	return __cancel_work_timer(&dwork->work, &dwork->timer);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2775	}
Oleg Nesterov	f5a421a	2007-07-15 23:41:44 -0700	[diff] [blame]	2776	EXPORT_SYMBOL(cancel_delayed_work_sync);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2777
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2778	/**
				2779	* schedule_work - put work task in global workqueue
				2780	* @work: job to be done
				2781	*
Bart Van Assche	5b0f437d	2009-07-30 19:00:53 +0200	[diff] [blame]	2782	* Returns zero if @work was already on the kernel-global workqueue and
				2783	* non-zero otherwise.
				2784	*
				2785	* This puts a job in the kernel-global workqueue if it was not already
				2786	* queued and leaves it in the same position on the kernel-global
				2787	* workqueue otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2788	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2789	int schedule_work(struct work_struct *work)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2790	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2791	return queue_work(system_wq, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2792	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2793	EXPORT_SYMBOL(schedule_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2794
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	2795	/*
				2796	* schedule_work_on - put work task on a specific cpu
				2797	* @cpu: cpu to put the work task on
				2798	* @work: job to be done
				2799	*
				2800	* This puts a job on a specific cpu
				2801	*/
				2802	int schedule_work_on(int cpu, struct work_struct *work)
				2803	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2804	return queue_work_on(cpu, system_wq, work);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	2805	}
				2806	EXPORT_SYMBOL(schedule_work_on);
				2807
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2808	/**
				2809	* schedule_delayed_work - put work task in global workqueue after delay
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2810	* @dwork: job to be done
				2811	* @delay: number of jiffies to wait or 0 for immediate execution
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2812	*
				2813	* After waiting for a given time this puts a job in the kernel-global
				2814	* workqueue.
				2815	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2816	int schedule_delayed_work(struct delayed_work *dwork,
Ingo Molnar	82f67cd	2007-02-16 01:28:13 -0800	[diff] [blame]	2817	unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2818	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2819	return queue_delayed_work(system_wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2820	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2821	EXPORT_SYMBOL(schedule_delayed_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2822
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2823	/**
				2824	* schedule_delayed_work_on - queue work in global workqueue on CPU after delay
				2825	* @cpu: cpu to use
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2826	* @dwork: job to be done
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2827	* @delay: number of jiffies to wait
				2828	*
				2829	* After waiting for a given time this puts a job in the kernel-global
				2830	* workqueue on the specified CPU.
				2831	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2832	int schedule_delayed_work_on(int cpu,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2833	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2834	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2835	return queue_delayed_work_on(cpu, system_wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2836	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2837	EXPORT_SYMBOL(schedule_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2838
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2839	/**
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2840	* schedule_on_each_cpu - execute a function synchronously on each online CPU
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2841	* @func: the function to call
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2842	*
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2843	* schedule_on_each_cpu() executes @func on each online CPU using the
				2844	* system workqueue and blocks until all CPUs have completed.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2845	* schedule_on_each_cpu() is very slow.
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2846	*
				2847	* RETURNS:
				2848	* 0 on success, -errno on failure.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2849	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2850	int schedule_on_each_cpu(work_func_t func)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2851	{
				2852	int cpu;
Namhyung Kim	38f5156	2010-08-08 14:24:09 +0200	[diff] [blame]	2853	struct work_struct __percpu *works;
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2854
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2855	works = alloc_percpu(struct work_struct);
				2856	if (!works)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2857	return -ENOMEM;
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2858
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	2859	get_online_cpus();
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2860
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2861	for_each_online_cpu(cpu) {
Ingo Molnar	9bfb183	2006-12-18 20:05:09 +0100	[diff] [blame]	2862	struct work_struct *work = per_cpu_ptr(works, cpu);
				2863
				2864	INIT_WORK(work, func);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2865	schedule_work_on(cpu, work);
Andi Kleen	65a6446	2009-10-14 06:22:47 +0200	[diff] [blame]	2866	}
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2867
				2868	for_each_online_cpu(cpu)
				2869	flush_work(per_cpu_ptr(works, cpu));
				2870
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	2871	put_online_cpus();
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2872	free_percpu(works);
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2873	return 0;
				2874	}
				2875
Alan Stern	eef6a7d	2010-02-12 17:39:21 +0900	[diff] [blame]	2876	/**
				2877	* flush_scheduled_work - ensure that any scheduled work has run to completion.
				2878	*
				2879	* Forces execution of the kernel-global workqueue and blocks until its
				2880	* completion.
				2881	*
				2882	* Think twice before calling this function! It's very easy to get into
				2883	* trouble if you don't take great care. Either of the following situations
				2884	* will lead to deadlock:
				2885	*
				2886	* One of the work items currently on the workqueue needs to acquire
				2887	* a lock held by your code or its caller.
				2888	*
				2889	* Your code is running in the context of a work routine.
				2890	*
				2891	* They will be detected by lockdep when they occur, but the first might not
				2892	* occur very often. It depends on what work items are on the workqueue and
				2893	* what locks they need, which you have no control over.
				2894	*
				2895	* In most situations flushing the entire workqueue is overkill; you merely
				2896	* need to know that a particular work item isn't queued and isn't running.
				2897	* In such cases you should use cancel_delayed_work_sync() or
				2898	* cancel_work_sync() instead.
				2899	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2900	void flush_scheduled_work(void)
				2901	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2902	flush_workqueue(system_wq);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2903	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2904	EXPORT_SYMBOL(flush_scheduled_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2905
				2906	/**
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2907	* execute_in_process_context - reliably execute the routine with user context
				2908	* @fn: the function to execute
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2909	* @ew: guaranteed storage for the execute work structure (must
				2910	* be available when the work executes)
				2911	*
				2912	* Executes the function immediately if process context is available,
				2913	* otherwise schedules the function for delayed execution.
				2914	*
				2915	* Returns: 0 - function was executed
				2916	* 1 - function was scheduled for execution
				2917	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2918	int execute_in_process_context(work_func_t fn, struct execute_work *ew)
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2919	{
				2920	if (!in_interrupt()) {
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2921	fn(&ew->work);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2922	return 0;
				2923	}
				2924
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2925	INIT_WORK(&ew->work, fn);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2926	schedule_work(&ew->work);
				2927
				2928	return 1;
				2929	}
				2930	EXPORT_SYMBOL_GPL(execute_in_process_context);
				2931
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2932	int keventd_up(void)
				2933	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2934	return system_wq != NULL;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2935	}
				2936
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2937	static int alloc_cwqs(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2938	{
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2939	/*
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	2940	* cwqs are forced aligned according to WORK_STRUCT_FLAG_BITS.
				2941	* Make sure that the alignment isn't lower than that of
				2942	* unsigned long long.
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2943	*/
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	2944	const size_t size = sizeof(struct cpu_workqueue_struct);
				2945	const size_t align = max_t(size_t, 1 << WORK_STRUCT_FLAG_BITS,
				2946	__alignof__(unsigned long long));
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2947
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	2948	if (!(wq->flags & WQ_UNBOUND))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2949	wq->cpu_wq.pcpu = __alloc_percpu(size, align);
Tejun Heo	931ac77	2010-07-20 11:07:48 +0200	[diff] [blame]	2950	else {
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2951	void *ptr;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	2952
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2953	/*
				2954	* Allocate enough room to align cwq and put an extra
				2955	* pointer at the end pointing back to the originally
				2956	* allocated pointer which will be used for free.
				2957	*/
				2958	ptr = kzalloc(size + align + sizeof(void *), GFP_KERNEL);
				2959	if (ptr) {
				2960	wq->cpu_wq.single = PTR_ALIGN(ptr, align);
				2961	(void *)(wq->cpu_wq.single + 1) = ptr;
				2962	}
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2963	}
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2964
Tejun Heo	0415b00	2011-03-24 18:50:09 +0100	[diff] [blame]	2965	/* just in case, make sure it's actually aligned */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2966	BUG_ON(!IS_ALIGNED(wq->cpu_wq.v, align));
				2967	return wq->cpu_wq.v ? 0 : -ENOMEM;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2968	}
				2969
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2970	static void free_cwqs(struct workqueue_struct *wq)
Oleg Nesterov	06ba38a	2007-05-09 02:34:15 -0700	[diff] [blame]	2971	{
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	2972	if (!(wq->flags & WQ_UNBOUND))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2973	free_percpu(wq->cpu_wq.pcpu);
				2974	else if (wq->cpu_wq.single) {
				2975	/* the pointer to free is stored right after the cwq */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2976	kfree((void *)(wq->cpu_wq.single + 1));
Oleg Nesterov	06ba38a	2007-05-09 02:34:15 -0700	[diff] [blame]	2977	}
				2978	}
				2979
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2980	static int wq_clamp_max_active(int max_active, unsigned int flags,
				2981	const char *name)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2982	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2983	int lim = flags & WQ_UNBOUND ? WQ_UNBOUND_MAX_ACTIVE : WQ_MAX_ACTIVE;
				2984
				2985	if (max_active < 1 \|\| max_active > lim)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2986	printk(KERN_WARNING "workqueue: max_active %d requested for %s "
				2987	"is out of range, clamping between %d and %d\n",
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2988	max_active, name, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2989
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2990	return clamp_val(max_active, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2991	}
				2992
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	2993	struct workqueue_struct __alloc_workqueue_key(const char fmt,
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2994	unsigned int flags,
				2995	int max_active,
				2996	struct lock_class_key *key,
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	2997	const char *lock_name, ...)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2998	{
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	2999	va_list args, args1;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3000	struct workqueue_struct *wq;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3001	unsigned int cpu;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3002	size_t namelen;
				3003
				3004	/* determine namelen, allocate wq and format name */
				3005	va_start(args, lock_name);
				3006	va_copy(args1, args);
				3007	namelen = vsnprintf(NULL, 0, fmt, args) + 1;
				3008
				3009	wq = kzalloc(sizeof(*wq) + namelen, GFP_KERNEL);
				3010	if (!wq)
				3011	goto err;
				3012
				3013	vsnprintf(wq->name, namelen, fmt, args1);
				3014	va_end(args);
				3015	va_end(args1);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3016
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3017	/*
Tejun Heo	6370a6a	2010-10-11 15:12:27 +0200	[diff] [blame]	3018	* Workqueues which may be used during memory reclaim should
				3019	* have a rescuer to guarantee forward progress.
				3020	*/
				3021	if (flags & WQ_MEM_RECLAIM)
				3022	flags \|= WQ_RESCUER;
				3023
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3024	max_active = max_active ?: WQ_DFL_ACTIVE;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3025	max_active = wq_clamp_max_active(max_active, flags, wq->name);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3026
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3027	/* init wq */
Tejun Heo	97e37d7	2010-06-29 10:07:10 +0200	[diff] [blame]	3028	wq->flags = flags;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3029	wq->saved_max_active = max_active;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3030	mutex_init(&wq->flush_mutex);
				3031	atomic_set(&wq->nr_cwqs_to_flush, 0);
				3032	INIT_LIST_HEAD(&wq->flusher_queue);
				3033	INIT_LIST_HEAD(&wq->flusher_overflow);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3034
Johannes Berg	eb13ba8	2008-01-16 09:51:58 +0100	[diff] [blame]	3035	lockdep_init_map(&wq->lockdep_map, lock_name, key, 0);
Oleg Nesterov	cce1a16	2007-05-09 02:34:13 -0700	[diff] [blame]	3036	INIT_LIST_HEAD(&wq->list);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3037
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3038	if (alloc_cwqs(wq) < 0)
				3039	goto err;
				3040
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3041	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3042	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3043	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	3044	int pool_idx = (bool)(flags & WQ_HIGHPRI);
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3045
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	3046	BUG_ON((unsigned long)cwq & WORK_STRUCT_FLAG_MASK);
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	3047	cwq->pool = &gcwq->pools[pool_idx];
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3048	cwq->wq = wq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3049	cwq->flush_color = -1;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3050	cwq->max_active = max_active;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3051	INIT_LIST_HEAD(&cwq->delayed_works);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3052	}
				3053
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3054	if (flags & WQ_RESCUER) {
				3055	struct worker *rescuer;
				3056
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3057	if (!alloc_mayday_mask(&wq->mayday_mask, GFP_KERNEL))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3058	goto err;
				3059
				3060	wq->rescuer = rescuer = alloc_worker();
				3061	if (!rescuer)
				3062	goto err;
				3063
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3064	rescuer->task = kthread_create(rescuer_thread, wq, "%s",
				3065	wq->name);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3066	if (IS_ERR(rescuer->task))
				3067	goto err;
				3068
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3069	rescuer->task->flags \|= PF_THREAD_BOUND;
				3070	wake_up_process(rescuer->task);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3071	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3072
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3073	/*
				3074	* workqueue_lock protects global freeze state and workqueues
				3075	* list. Grab it, set max_active accordingly and add the new
				3076	* workqueue to workqueues list.
				3077	*/
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3078	spin_lock(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3079
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3080	if (workqueue_freezing && wq->flags & WQ_FREEZABLE)
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3081	for_each_cwq_cpu(cpu, wq)
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3082	get_cwq(cpu, wq)->max_active = 0;
				3083
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3084	list_add(&wq->list, &workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3085
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3086	spin_unlock(&workqueue_lock);
				3087
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3088	return wq;
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3089	err:
				3090	if (wq) {
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3091	free_cwqs(wq);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3092	free_mayday_mask(wq->mayday_mask);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3093	kfree(wq->rescuer);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3094	kfree(wq);
				3095	}
				3096	return NULL;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3097	}
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3098	EXPORT_SYMBOL_GPL(__alloc_workqueue_key);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3099
				3100	/**
				3101	* destroy_workqueue - safely terminate a workqueue
				3102	* @wq: target workqueue
				3103	*
				3104	* Safely destroy a workqueue. All work currently pending will be done first.
				3105	*/
				3106	void destroy_workqueue(struct workqueue_struct *wq)
				3107	{
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3108	unsigned int cpu;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3109
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	3110	/* drain it before proceeding with destruction */
				3111	drain_workqueue(wq);
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	3112
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3113	/*
				3114	* wq list is used to freeze wq, remove from list after
				3115	* flushing is complete in case freeze races us.
				3116	*/
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3117	spin_lock(&workqueue_lock);
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	3118	list_del(&wq->list);
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3119	spin_unlock(&workqueue_lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3120
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3121	/* sanity check */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3122	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3123	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3124	int i;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3125
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3126	for (i = 0; i < WORK_NR_COLORS; i++)
				3127	BUG_ON(cwq->nr_in_flight[i]);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3128	BUG_ON(cwq->nr_active);
				3129	BUG_ON(!list_empty(&cwq->delayed_works));
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3130	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3131
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3132	if (wq->flags & WQ_RESCUER) {
				3133	kthread_stop(wq->rescuer->task);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3134	free_mayday_mask(wq->mayday_mask);
Xiaotian Feng	8d9df9f	2010-08-16 09:54:28 +0200	[diff] [blame]	3135	kfree(wq->rescuer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3136	}
				3137
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3138	free_cwqs(wq);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3139	kfree(wq);
				3140	}
				3141	EXPORT_SYMBOL_GPL(destroy_workqueue);
				3142
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3143	/**
				3144	* workqueue_set_max_active - adjust max_active of a workqueue
				3145	* @wq: target workqueue
				3146	* @max_active: new max_active value.
				3147	*
				3148	* Set max_active of @wq to @max_active.
				3149	*
				3150	* CONTEXT:
				3151	* Don't call from IRQ context.
				3152	*/
				3153	void workqueue_set_max_active(struct workqueue_struct *wq, int max_active)
				3154	{
				3155	unsigned int cpu;
				3156
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3157	max_active = wq_clamp_max_active(max_active, wq->flags, wq->name);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3158
				3159	spin_lock(&workqueue_lock);
				3160
				3161	wq->saved_max_active = max_active;
				3162
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3163	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3164	struct global_cwq *gcwq = get_gcwq(cpu);
				3165
				3166	spin_lock_irq(&gcwq->lock);
				3167
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3168	if (!(wq->flags & WQ_FREEZABLE) \|\|
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3169	!(gcwq->flags & GCWQ_FREEZING))
				3170	get_cwq(gcwq->cpu, wq)->max_active = max_active;
				3171
				3172	spin_unlock_irq(&gcwq->lock);
				3173	}
				3174
				3175	spin_unlock(&workqueue_lock);
				3176	}
				3177	EXPORT_SYMBOL_GPL(workqueue_set_max_active);
				3178
				3179	/**
				3180	* workqueue_congested - test whether a workqueue is congested
				3181	* @cpu: CPU in question
				3182	* @wq: target workqueue
				3183	*
				3184	* Test whether @wq's cpu workqueue for @cpu is congested. There is
				3185	* no synchronization around this function and the test result is
				3186	* unreliable and only useful as advisory hints or for debugging.
				3187	*
				3188	* RETURNS:
				3189	* %true if congested, %false otherwise.
				3190	*/
				3191	bool workqueue_congested(unsigned int cpu, struct workqueue_struct *wq)
				3192	{
				3193	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3194
				3195	return !list_empty(&cwq->delayed_works);
				3196	}
				3197	EXPORT_SYMBOL_GPL(workqueue_congested);
				3198
				3199	/**
				3200	* work_cpu - return the last known associated cpu for @work
				3201	* @work: the work of interest
				3202	*
				3203	* RETURNS:
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3204	* CPU number if @work was ever queued. WORK_CPU_NONE otherwise.
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3205	*/
				3206	unsigned int work_cpu(struct work_struct *work)
				3207	{
				3208	struct global_cwq *gcwq = get_work_gcwq(work);
				3209
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3210	return gcwq ? gcwq->cpu : WORK_CPU_NONE;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3211	}
				3212	EXPORT_SYMBOL_GPL(work_cpu);
				3213
				3214	/**
				3215	* work_busy - test whether a work is currently pending or running
				3216	* @work: the work to be tested
				3217	*
				3218	* Test whether @work is currently pending or running. There is no
				3219	* synchronization around this function and the test result is
				3220	* unreliable and only useful as advisory hints or for debugging.
				3221	* Especially for reentrant wqs, the pending state might hide the
				3222	* running state.
				3223	*
				3224	* RETURNS:
				3225	* OR'd bitmask of WORK_BUSY_* bits.
				3226	*/
				3227	unsigned int work_busy(struct work_struct *work)
				3228	{
				3229	struct global_cwq *gcwq = get_work_gcwq(work);
				3230	unsigned long flags;
				3231	unsigned int ret = 0;
				3232
				3233	if (!gcwq)
				3234	return false;
				3235
				3236	spin_lock_irqsave(&gcwq->lock, flags);
				3237
				3238	if (work_pending(work))
				3239	ret \|= WORK_BUSY_PENDING;
				3240	if (find_worker_executing_work(gcwq, work))
				3241	ret \|= WORK_BUSY_RUNNING;
				3242
				3243	spin_unlock_irqrestore(&gcwq->lock, flags);
				3244
				3245	return ret;
				3246	}
				3247	EXPORT_SYMBOL_GPL(work_busy);
				3248
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3249	/*
				3250	* CPU hotplug.
				3251	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3252	* There are two challenges in supporting CPU hotplug. Firstly, there
				3253	* are a lot of assumptions on strong associations among work, cwq and
				3254	* gcwq which make migrating pending and scheduled works very
				3255	* difficult to implement without impacting hot paths. Secondly,
				3256	* gcwqs serve a mix of short, long and very long running works making
				3257	* blocked draining impractical.
				3258	*
				3259	* This is solved by allowing a gcwq to be detached from CPU, running
				3260	* it with unbound (rogue) workers and allowing it to be reattached
				3261	* later if the cpu comes back online. A separate thread is created
				3262	* to govern a gcwq in such state and is called the trustee of the
				3263	* gcwq.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3264	*
				3265	* Trustee states and their descriptions.
				3266	*
				3267	* START Command state used on startup. On CPU_DOWN_PREPARE, a
				3268	* new trustee is started with this state.
				3269	*
				3270	* IN_CHARGE Once started, trustee will enter this state after
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3271	* assuming the manager role and making all existing
				3272	* workers rogue. DOWN_PREPARE waits for trustee to
				3273	* enter this state. After reaching IN_CHARGE, trustee
				3274	* tries to execute the pending worklist until it's empty
				3275	* and the state is set to BUTCHER, or the state is set
				3276	* to RELEASE.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3277	*
				3278	* BUTCHER Command state which is set by the cpu callback after
				3279	* the cpu has gone down. Once this state is set trustee
				3280	* knows that there will be no new works on the worklist
				3281	* and once the worklist is empty it can proceed to
				3282	* killing idle workers.
				3283	*
				3284	* RELEASE Command state which is set by the cpu callback if the
				3285	* cpu down has been canceled or it has come online
				3286	* again. After recognizing this state, trustee stops
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3287	* trying to drain or butcher and clears ROGUE, rebinds
				3288	* all remaining workers back to the cpu and releases
				3289	* manager role.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3290	*
				3291	* DONE Trustee will enter this state after BUTCHER or RELEASE
				3292	* is complete.
				3293	*
				3294	*          trustee                 CPU                draining
				3295	*         took over                down               complete
				3296	* START -----------> IN_CHARGE -----------> BUTCHER -----------> DONE
				3297	*                        |                     |                  ^
				3298	*                        | CPU is back online  v   return workers |
				3299	*                         ----------------> RELEASE --------------
				3300	*/
				3301
				3302	/**
				3303	* trustee_wait_event_timeout - timed event wait for trustee
				3304	* @cond: condition to wait for
				3305	* @timeout: timeout in jiffies
				3306	*
				3307	* wait_event_timeout() for trustee to use. Handles locking and
				3308	* checks for RELEASE request.
				3309	*
				3310	* CONTEXT:
				3311	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				3312	* multiple times. To be used by trustee.
				3313	*
				3314	* RETURNS:
				3315	* Positive indicating left time if @cond is satisfied, 0 if timed
				3316	* out, -1 if canceled.
				3317	*/
				3318	#define trustee_wait_event_timeout(cond, timeout) ({ \
				3319	long __ret = (timeout); \
				3320	while (!((cond) \|\| (gcwq->trustee_state == TRUSTEE_RELEASE)) && \
				3321	__ret) { \
				3322	spin_unlock_irq(&gcwq->lock); \
				3323	__wait_event_timeout(gcwq->trustee_wait, (cond) \|\| \
				3324	(gcwq->trustee_state == TRUSTEE_RELEASE), \
				3325	__ret); \
				3326	spin_lock_irq(&gcwq->lock); \
				3327	} \
				3328	gcwq->trustee_state == TRUSTEE_RELEASE ? -1 : (__ret); \
				3329	})
				3330
				3331	/**
				3332	* trustee_wait_event - event wait for trustee
				3333	* @cond: condition to wait for
				3334	*
				3335	* wait_event() for trustee to use. Automatically handles locking and
				3336	* checks for CANCEL request.
				3337	*
				3338	* CONTEXT:
				3339	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				3340	* multiple times. To be used by trustee.
				3341	*
				3342	* RETURNS:
				3343	* 0 if @cond is satisfied, -1 if canceled.
				3344	*/
				3345	#define trustee_wait_event(cond) ({ \
				3346	long __ret1; \
				3347	__ret1 = trustee_wait_event_timeout(cond, MAX_SCHEDULE_TIMEOUT);\
				3348	__ret1 < 0 ? -1 : 0; \
				3349	})
				3350
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3351	static bool gcwq_is_managing_workers(struct global_cwq *gcwq)
				3352	{
				3353	struct worker_pool *pool;
				3354
				3355	for_each_worker_pool(pool, gcwq)
				3356	if (pool->flags & POOL_MANAGING_WORKERS)
				3357	return true;
				3358	return false;
				3359	}
				3360
				3361	static bool gcwq_has_idle_workers(struct global_cwq *gcwq)
				3362	{
				3363	struct worker_pool *pool;
				3364
				3365	for_each_worker_pool(pool, gcwq)
				3366	if (!list_empty(&pool->idle_list))
				3367	return true;
				3368	return false;
				3369	}
				3370
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3371	static int __cpuinit trustee_thread(void *__gcwq)
				3372	{
				3373	struct global_cwq *gcwq = __gcwq;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3374	struct worker_pool *pool;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3375	struct worker *worker;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3376	struct work_struct *work;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3377	struct hlist_node *pos;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3378	long rc;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3379	int i;
				3380
				3381	BUG_ON(gcwq->cpu != smp_processor_id());
				3382
				3383	spin_lock_irq(&gcwq->lock);
				3384	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3385	* Claim the manager position and make all workers rogue.
				3386	* Trustee must be bound to the target cpu and can't be
				3387	* cancelled.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3388	*/
				3389	BUG_ON(gcwq->cpu != smp_processor_id());
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3390	rc = trustee_wait_event(!gcwq_is_managing_workers(gcwq));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3391	BUG_ON(rc < 0);
				3392
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3393	for_each_worker_pool(pool, gcwq) {
				3394	pool->flags \|= POOL_MANAGING_WORKERS;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3395
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3396	list_for_each_entry(worker, &pool->idle_list, entry)
				3397	worker->flags \|= WORKER_ROGUE;
				3398	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3399
				3400	for_each_busy_worker(worker, i, pos, gcwq)
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	3401	worker->flags \|= WORKER_ROGUE;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3402
				3403	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3404	* Call schedule() so that we cross rq->lock and thus can
				3405	* guarantee sched callbacks see the rogue flag. This is
				3406	* necessary as scheduler callbacks may be invoked from other
				3407	* cpus.
				3408	*/
				3409	spin_unlock_irq(&gcwq->lock);
				3410	schedule();
				3411	spin_lock_irq(&gcwq->lock);
				3412
				3413	/*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	3414	* Sched callbacks are disabled now. Zap nr_running. After
				3415	* this, nr_running stays zero and need_more_worker() and
				3416	* keep_working() are always true as long as the worklist is
				3417	* not empty.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3418	*/
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3419	for_each_worker_pool(pool, gcwq)
				3420	atomic_set(get_pool_nr_running(pool), 0);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3421
				3422	spin_unlock_irq(&gcwq->lock);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3423	for_each_worker_pool(pool, gcwq)
				3424	del_timer_sync(&pool->idle_timer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3425	spin_lock_irq(&gcwq->lock);
				3426
				3427	/*
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3428	* We're now in charge. Notify and proceed to drain. We need
				3429	* to keep the gcwq running during the whole CPU down
				3430	* procedure as other cpu hotunplug callbacks may need to
				3431	* flush currently running tasks.
				3432	*/
				3433	gcwq->trustee_state = TRUSTEE_IN_CHARGE;
				3434	wake_up_all(&gcwq->trustee_wait);
				3435
				3436	/*
				3437	* The original cpu is in the process of dying and may go away
				3438	* anytime now. When that happens, we and all workers would
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3439	* be migrated to other cpus. Try draining any left work. We
				3440	* want to get it over with ASAP - spam rescuers, wake up as
				3441	* many idlers as necessary and create new ones till the
				3442	* worklist is empty. Note that if the gcwq is frozen, there
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3443	* may be frozen works in freezable cwqs. Don't declare
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3444	* completion while frozen.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3445	*/
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3446	while (true) {
				3447	bool busy = false;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3448
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3449	for_each_worker_pool(pool, gcwq)
				3450	busy \|= pool->nr_workers != pool->nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3451
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3452	if (!busy && !(gcwq->flags & GCWQ_FREEZING) &&
				3453	gcwq->trustee_state != TRUSTEE_IN_CHARGE)
				3454	break;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3455
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3456	for_each_worker_pool(pool, gcwq) {
				3457	int nr_works = 0;
				3458
				3459	list_for_each_entry(work, &pool->worklist, entry) {
				3460	send_mayday(work);
				3461	nr_works++;
				3462	}
				3463
				3464	list_for_each_entry(worker, &pool->idle_list, entry) {
				3465	if (!nr_works--)
				3466	break;
				3467	wake_up_process(worker->task);
				3468	}
				3469
				3470	if (need_to_create_worker(pool)) {
				3471	spin_unlock_irq(&gcwq->lock);
				3472	worker = create_worker(pool, false);
				3473	spin_lock_irq(&gcwq->lock);
				3474	if (worker) {
				3475	worker->flags \|= WORKER_ROGUE;
				3476	start_worker(worker);
				3477	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3478	}
				3479	}
				3480
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3481	/* give a breather */
				3482	if (trustee_wait_event_timeout(false, TRUSTEE_COOLDOWN) < 0)
				3483	break;
				3484	}
				3485
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3486	/*
				3487	* Either all works have been scheduled and cpu is down, or
				3488	* cpu down has already been canceled. Wait for and butcher
				3489	* all workers till we're canceled.
				3490	*/
				3491	do {
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3492	rc = trustee_wait_event(gcwq_has_idle_workers(gcwq));
				3493
				3494	i = 0;
				3495	for_each_worker_pool(pool, gcwq) {
				3496	while (!list_empty(&pool->idle_list)) {
				3497	worker = list_first_entry(&pool->idle_list,
				3498	struct worker, entry);
				3499	destroy_worker(worker);
				3500	}
				3501	i \|= pool->nr_workers;
				3502	}
				3503	} while (i && rc >= 0);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3504
				3505	/*
				3506	* At this point, either draining has completed and no worker
				3507	* is left, or cpu down has been canceled or the cpu is being
				3508	* brought back up. There shouldn't be any idle one left.
				3509	* Tell the remaining busy ones to rebind once it finishes the
				3510	* currently scheduled works by scheduling the rebind_work.
				3511	*/
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3512	for_each_worker_pool(pool, gcwq)
				3513	WARN_ON(!list_empty(&pool->idle_list));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3514
				3515	for_each_busy_worker(worker, i, pos, gcwq) {
				3516	struct work_struct *rebind_work = &worker->rebind_work;
Lai Jiangshan	6adebb0	2012-09-02 00:28:19 +0800	[diff] [blame]	3517	unsigned long worker_flags = worker->flags;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3518
				3519	/*
				3520	* Rebind_work may race with future cpu hotplug
				3521	* operations. Use a separate flag to mark that
Lai Jiangshan	6adebb0	2012-09-02 00:28:19 +0800	[diff] [blame]	3522	* rebinding is scheduled. The morphing should
				3523	* be atomic.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3524	*/
Lai Jiangshan	6adebb0	2012-09-02 00:28:19 +0800	[diff] [blame]	3525	worker_flags \|= WORKER_REBIND;
				3526	worker_flags &= ~WORKER_ROGUE;
				3527	ACCESS_ONCE(worker->flags) = worker_flags;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3528
				3529	/* queue rebind_work, wq doesn't matter, use the default one */
				3530	if (test_and_set_bit(WORK_STRUCT_PENDING_BIT,
				3531	work_data_bits(rebind_work)))
				3532	continue;
				3533
				3534	debug_work_activate(rebind_work);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3535	insert_work(get_cwq(gcwq->cpu, system_wq), rebind_work,
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3536	worker->scheduled.next,
				3537	work_color_to_flags(WORK_NO_COLOR));
				3538	}
				3539
				3540	/* relinquish manager role */
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3541	for_each_worker_pool(pool, gcwq)
				3542	pool->flags &= ~POOL_MANAGING_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3543
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3544	/* notify completion */
				3545	gcwq->trustee = NULL;
				3546	gcwq->trustee_state = TRUSTEE_DONE;
				3547	wake_up_all(&gcwq->trustee_wait);
				3548	spin_unlock_irq(&gcwq->lock);
				3549	return 0;
				3550	}
				3551
				3552	/**
				3553	* wait_trustee_state - wait for trustee to enter the specified state
				3554	* @gcwq: gcwq the trustee of interest belongs to
				3555	* @state: target state to wait for
				3556	*
				3557	* Wait for the trustee to reach @state. DONE is already matched.
				3558	*
				3559	* CONTEXT:
				3560	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				3561	* multiple times. To be used by cpu_callback.
				3562	*/
				3563	static void __cpuinit wait_trustee_state(struct global_cwq *gcwq, int state)
Namhyung Kim	06bd6eb	2010-08-22 23:19:42 +0900	[diff] [blame]	3564	__releases(&gcwq->lock)
				3565	__acquires(&gcwq->lock)
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3566	{
				3567	if (!(gcwq->trustee_state == state \|\|
				3568	gcwq->trustee_state == TRUSTEE_DONE)) {
				3569	spin_unlock_irq(&gcwq->lock);
				3570	__wait_event(gcwq->trustee_wait,
				3571	gcwq->trustee_state == state \|\|
				3572	gcwq->trustee_state == TRUSTEE_DONE);
				3573	spin_lock_irq(&gcwq->lock);
				3574	}
				3575	}
				3576
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3577	static int __devinit workqueue_cpu_callback(struct notifier_block *nfb,
				3578	unsigned long action,
				3579	void *hcpu)
				3580	{
				3581	unsigned int cpu = (unsigned long)hcpu;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3582	struct global_cwq *gcwq = get_gcwq(cpu);
				3583	struct task_struct *new_trustee = NULL;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3584	struct worker *new_workers[NR_WORKER_POOLS] = { };
				3585	struct worker_pool *pool;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3586	unsigned long flags;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3587	int i;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3588
Rafael J. Wysocki	8bb7844	2007-05-09 02:35:10 -0700	[diff] [blame]	3589	action &= ~CPU_TASKS_FROZEN;
				3590
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3591	switch (action) {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3592	case CPU_DOWN_PREPARE:
				3593	new_trustee = kthread_create(trustee_thread, gcwq,
				3594	"workqueue_trustee/%d\n", cpu);
				3595	if (IS_ERR(new_trustee))
				3596	return notifier_from_errno(PTR_ERR(new_trustee));
				3597	kthread_bind(new_trustee, cpu);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3598	/* fall through */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3599	case CPU_UP_PREPARE:
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3600	i = 0;
				3601	for_each_worker_pool(pool, gcwq) {
				3602	BUG_ON(pool->first_idle);
				3603	new_workers[i] = create_worker(pool, false);
				3604	if (!new_workers[i++])
				3605	goto err_destroy;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3606	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3607	}
				3608
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3609	/* some are called w/ irq disabled, don't disturb irq status */
				3610	spin_lock_irqsave(&gcwq->lock, flags);
				3611
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	3612	switch (action) {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3613	case CPU_DOWN_PREPARE:
				3614	/* initialize trustee and tell it to acquire the gcwq */
				3615	BUG_ON(gcwq->trustee \|\| gcwq->trustee_state != TRUSTEE_DONE);
				3616	gcwq->trustee = new_trustee;
				3617	gcwq->trustee_state = TRUSTEE_START;
				3618	wake_up_process(gcwq->trustee);
				3619	wait_trustee_state(gcwq, TRUSTEE_IN_CHARGE);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3620	/* fall through */
				3621	case CPU_UP_PREPARE:
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3622	i = 0;
				3623	for_each_worker_pool(pool, gcwq) {
				3624	BUG_ON(pool->first_idle);
				3625	pool->first_idle = new_workers[i++];
				3626	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3627	break;
				3628
				3629	case CPU_DYING:
				3630	/*
				3631	* Before this, the trustee and all workers except for
				3632	* the ones which are still executing works from
				3633	* before the last CPU down must be on the cpu. After
				3634	* this, they'll all be diasporas.
				3635	*/
				3636	gcwq->flags \|= GCWQ_DISASSOCIATED;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3637	break;
				3638
Oleg Nesterov	3da1c84	2008-07-25 01:47:50 -0700	[diff] [blame]	3639	case CPU_POST_DEAD:
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3640	gcwq->trustee_state = TRUSTEE_BUTCHER;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3641	/* fall through */
				3642	case CPU_UP_CANCELED:
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3643	for_each_worker_pool(pool, gcwq) {
				3644	destroy_worker(pool->first_idle);
				3645	pool->first_idle = NULL;
				3646	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3647	break;
				3648
				3649	case CPU_DOWN_FAILED:
				3650	case CPU_ONLINE:
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3651	gcwq->flags &= ~GCWQ_DISASSOCIATED;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3652	if (gcwq->trustee_state != TRUSTEE_DONE) {
				3653	gcwq->trustee_state = TRUSTEE_RELEASE;
				3654	wake_up_process(gcwq->trustee);
				3655	wait_trustee_state(gcwq, TRUSTEE_DONE);
				3656	}
				3657
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3658	/*
				3659	* Trustee is done and there might be no worker left.
				3660	* Put the first_idle in and request a real manager to
				3661	* take a look.
				3662	*/
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3663	for_each_worker_pool(pool, gcwq) {
				3664	spin_unlock_irq(&gcwq->lock);
				3665	kthread_bind(pool->first_idle->task, cpu);
				3666	spin_lock_irq(&gcwq->lock);
				3667	pool->flags \|= POOL_MANAGE_WORKERS;
				3668	start_worker(pool->first_idle);
				3669	pool->first_idle = NULL;
				3670	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3671	break;
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	3672	}
				3673
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3674	spin_unlock_irqrestore(&gcwq->lock, flags);
				3675
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3676	return notifier_from_errno(0);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3677
				3678	err_destroy:
				3679	if (new_trustee)
				3680	kthread_stop(new_trustee);
				3681
				3682	spin_lock_irqsave(&gcwq->lock, flags);
				3683	for (i = 0; i < NR_WORKER_POOLS; i++)
				3684	if (new_workers[i])
				3685	destroy_worker(new_workers[i]);
				3686	spin_unlock_irqrestore(&gcwq->lock, flags);
				3687
				3688	return NOTIFY_BAD;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3689	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3690
Tejun Heo	d3b4254	2012-07-17 12:39:26 -0700	[diff] [blame]	3691	/*
				3692	* Workqueues should be brought up before normal priority CPU notifiers.
				3693	* This will be registered high priority CPU notifier.
				3694	*/
				3695	static int __devinit workqueue_cpu_up_callback(struct notifier_block *nfb,
				3696	unsigned long action,
				3697	void *hcpu)
				3698	{
				3699	switch (action & ~CPU_TASKS_FROZEN) {
				3700	case CPU_UP_PREPARE:
				3701	case CPU_UP_CANCELED:
				3702	case CPU_DOWN_FAILED:
				3703	case CPU_ONLINE:
				3704	return workqueue_cpu_callback(nfb, action, hcpu);
				3705	}
				3706	return NOTIFY_OK;
				3707	}
				3708
				3709	/*
				3710	* Workqueues should be brought down after normal priority CPU notifiers.
				3711	* This will be registered as low priority CPU notifier.
				3712	*/
				3713	static int __devinit workqueue_cpu_down_callback(struct notifier_block *nfb,
				3714	unsigned long action,
				3715	void *hcpu)
				3716	{
				3717	switch (action & ~CPU_TASKS_FROZEN) {
				3718	case CPU_DOWN_PREPARE:
				3719	case CPU_DYING:
				3720	case CPU_POST_DEAD:
				3721	return workqueue_cpu_callback(nfb, action, hcpu);
				3722	}
				3723	return NOTIFY_OK;
				3724	}
				3725
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3726	#ifdef CONFIG_SMP
Rusty Russell	8ccad40	2009-01-16 15:31:15 -0800	[diff] [blame]	3727
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3728	struct work_for_cpu {
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3729	struct work_struct work;
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3730	long (fn)(void );
				3731	void *arg;
				3732	long ret;
				3733	};
				3734
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3735	static void work_for_cpu_fn(struct work_struct *work)
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3736	{
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3737	struct work_for_cpu *wfc = container_of(work, struct work_for_cpu, work);
				3738
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3739	wfc->ret = wfc->fn(wfc->arg);
				3740	}
				3741
				3742	/**
				3743	* work_on_cpu - run a function in user context on a particular cpu
				3744	* @cpu: the cpu to run on
				3745	* @fn: the function to run
				3746	* @arg: the function arg
				3747	*
Rusty Russell	31ad908	2009-01-16 15:31:15 -0800	[diff] [blame]	3748	* This will return the value @fn returns.
				3749	* It is up to the caller to ensure that the cpu doesn't go offline.
Andrew Morton	6b44003	2009-04-09 09:50:37 -0600	[diff] [blame]	3750	* The caller must not hold any locks which would prevent @fn from completing.
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3751	*/
				3752	long work_on_cpu(unsigned int cpu, long (fn)(void ), void *arg)
				3753	{
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3754	struct work_for_cpu wfc = { .fn = fn, .arg = arg };
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3755
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3756	INIT_WORK_ONSTACK(&wfc.work, work_for_cpu_fn);
				3757	schedule_work_on(cpu, &wfc.work);
				3758	flush_work(&wfc.work);
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3759	return wfc.ret;
				3760	}
				3761	EXPORT_SYMBOL_GPL(work_on_cpu);
				3762	#endif /* CONFIG_SMP */
				3763
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3764	#ifdef CONFIG_FREEZER
Rusty Russell	e7577c5	2009-01-01 10:12:25 +1030	[diff] [blame]	3765
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3766	/**
				3767	* freeze_workqueues_begin - begin freezing workqueues
				3768	*
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3769	* Start freezing workqueues. After this function returns, all freezable
				3770	* workqueues will queue new works to their frozen_works list instead of
				3771	* gcwq->worklist.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3772	*
				3773	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3774	* Grabs and releases workqueue_lock and gcwq->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3775	*/
				3776	void freeze_workqueues_begin(void)
				3777	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3778	unsigned int cpu;
				3779
				3780	spin_lock(&workqueue_lock);
				3781
				3782	BUG_ON(workqueue_freezing);
				3783	workqueue_freezing = true;
				3784
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3785	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3786	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3787	struct workqueue_struct *wq;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3788
				3789	spin_lock_irq(&gcwq->lock);
				3790
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3791	BUG_ON(gcwq->flags & GCWQ_FREEZING);
				3792	gcwq->flags \|= GCWQ_FREEZING;
				3793
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3794	list_for_each_entry(wq, &workqueues, list) {
				3795	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3796
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3797	if (cwq && wq->flags & WQ_FREEZABLE)
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3798	cwq->max_active = 0;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3799	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3800
				3801	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3802	}
				3803
				3804	spin_unlock(&workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3805	}
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3806
				3807	/**
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3808	* freeze_workqueues_busy - are freezable workqueues still busy?
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3809	*
				3810	* Check whether freezing is complete. This function must be called
				3811	* between freeze_workqueues_begin() and thaw_workqueues().
				3812	*
				3813	* CONTEXT:
				3814	* Grabs and releases workqueue_lock.
				3815	*
				3816	* RETURNS:
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3817	* %true if some freezable workqueues are still busy. %false if freezing
				3818	* is complete.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3819	*/
				3820	bool freeze_workqueues_busy(void)
				3821	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3822	unsigned int cpu;
				3823	bool busy = false;
				3824
				3825	spin_lock(&workqueue_lock);
				3826
				3827	BUG_ON(!workqueue_freezing);
				3828
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3829	for_each_gcwq_cpu(cpu) {
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3830	struct workqueue_struct *wq;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3831	/*
				3832	* nr_active is monotonically decreasing. It's safe
				3833	* to peek without lock.
				3834	*/
				3835	list_for_each_entry(wq, &workqueues, list) {
				3836	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3837
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3838	if (!cwq \|\| !(wq->flags & WQ_FREEZABLE))
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3839	continue;
				3840
				3841	BUG_ON(cwq->nr_active < 0);
				3842	if (cwq->nr_active) {
				3843	busy = true;
				3844	goto out_unlock;
				3845	}
				3846	}
				3847	}
				3848	out_unlock:
				3849	spin_unlock(&workqueue_lock);
				3850	return busy;
				3851	}
				3852
				3853	/**
				3854	* thaw_workqueues - thaw workqueues
				3855	*
				3856	* Thaw workqueues. Normal queueing is restored and all collected
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	3857	* frozen works are transferred to their respective gcwq worklists.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3858	*
				3859	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3860	* Grabs and releases workqueue_lock and gcwq->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3861	*/
				3862	void thaw_workqueues(void)
				3863	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3864	unsigned int cpu;
				3865
				3866	spin_lock(&workqueue_lock);
				3867
				3868	if (!workqueue_freezing)
				3869	goto out_unlock;
				3870
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3871	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3872	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3873	struct worker_pool *pool;
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3874	struct workqueue_struct *wq;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3875
				3876	spin_lock_irq(&gcwq->lock);
				3877
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3878	BUG_ON(!(gcwq->flags & GCWQ_FREEZING));
				3879	gcwq->flags &= ~GCWQ_FREEZING;
				3880
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3881	list_for_each_entry(wq, &workqueues, list) {
				3882	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3883
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3884	if (!cwq \|\| !(wq->flags & WQ_FREEZABLE))
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3885	continue;
				3886
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3887	/* restore max_active and repopulate worklist */
				3888	cwq->max_active = wq->saved_max_active;
				3889
				3890	while (!list_empty(&cwq->delayed_works) &&
				3891	cwq->nr_active < cwq->max_active)
				3892	cwq_activate_first_delayed(cwq);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3893	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3894
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3895	for_each_worker_pool(pool, gcwq)
				3896	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3897
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3898	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3899	}
				3900
				3901	workqueue_freezing = false;
				3902	out_unlock:
				3903	spin_unlock(&workqueue_lock);
				3904	}
				3905	#endif /* CONFIG_FREEZER */
				3906
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3907	static int __init init_workqueues(void)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3908	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3909	unsigned int cpu;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3910	int i;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3911
Tejun Heo	d3b4254	2012-07-17 12:39:26 -0700	[diff] [blame]	3912	cpu_notifier(workqueue_cpu_up_callback, CPU_PRI_WORKQUEUE_UP);
				3913	cpu_notifier(workqueue_cpu_down_callback, CPU_PRI_WORKQUEUE_DOWN);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3914
				3915	/* initialize gcwqs */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3916	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3917	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3918	struct worker_pool *pool;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3919
				3920	spin_lock_init(&gcwq->lock);
				3921	gcwq->cpu = cpu;
Tejun Heo	477a3c3	2010-08-31 10:54:35 +0200	[diff] [blame]	3922	gcwq->flags \|= GCWQ_DISASSOCIATED;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3923
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3924	for (i = 0; i < BUSY_WORKER_HASH_SIZE; i++)
				3925	INIT_HLIST_HEAD(&gcwq->busy_hash[i]);
				3926
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3927	for_each_worker_pool(pool, gcwq) {
				3928	pool->gcwq = gcwq;
				3929	INIT_LIST_HEAD(&pool->worklist);
				3930	INIT_LIST_HEAD(&pool->idle_list);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3931
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3932	init_timer_deferrable(&pool->idle_timer);
				3933	pool->idle_timer.function = idle_worker_timeout;
				3934	pool->idle_timer.data = (unsigned long)pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3935
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3936	setup_timer(&pool->mayday_timer, gcwq_mayday_timeout,
				3937	(unsigned long)pool);
				3938
				3939	ida_init(&pool->worker_ida);
				3940	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3941
				3942	gcwq->trustee_state = TRUSTEE_DONE;
				3943	init_waitqueue_head(&gcwq->trustee_wait);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3944	}
				3945
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3946	/* create the initial worker */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3947	for_each_online_gcwq_cpu(cpu) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3948	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3949	struct worker_pool *pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3950
Tejun Heo	477a3c3	2010-08-31 10:54:35 +0200	[diff] [blame]	3951	if (cpu != WORK_CPU_UNBOUND)
				3952	gcwq->flags &= ~GCWQ_DISASSOCIATED;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3953
				3954	for_each_worker_pool(pool, gcwq) {
				3955	struct worker *worker;
				3956
				3957	worker = create_worker(pool, true);
				3958	BUG_ON(!worker);
				3959	spin_lock_irq(&gcwq->lock);
				3960	start_worker(worker);
				3961	spin_unlock_irq(&gcwq->lock);
				3962	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3963	}
				3964
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3965	system_wq = alloc_workqueue("events", 0, 0);
				3966	system_long_wq = alloc_workqueue("events_long", 0, 0);
				3967	system_nrt_wq = alloc_workqueue("events_nrt", WQ_NON_REENTRANT, 0);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3968	system_unbound_wq = alloc_workqueue("events_unbound", WQ_UNBOUND,
				3969	WQ_UNBOUND_MAX_ACTIVE);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	3970	system_freezable_wq = alloc_workqueue("events_freezable",
				3971	WQ_FREEZABLE, 0);
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	3972	system_nrt_freezable_wq = alloc_workqueue("events_nrt_freezable",
				3973	WQ_NON_REENTRANT \| WQ_FREEZABLE, 0);
Hitoshi Mitake	e5cba24	2010-11-26 12:06:44 +0100	[diff] [blame]	3974	BUG_ON(!system_wq \|\| !system_long_wq \|\| !system_nrt_wq \|\|
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	3975	!system_unbound_wq \|\| !system_freezable_wq \|\|
				3976	!system_nrt_freezable_wq);
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3977	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3978	}
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3979	early_initcall(init_workqueues);