Blame - kernel/workqueue.c - android_kernel_htc_msm8960

blob: 98644ae1b020899b7e8622dc23df72cbda9db526 [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	2	* kernel/workqueue.c - generic async execution with shared worker pool
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	4	* Copyright (C) 2002 Ingo Molnar
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	5	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	6	* Derived from the taskqueue/keventd code by:
				7	* David Woodhouse <dwmw2@infradead.org>
				8	* Andrew Morton
				9	* Kai Petzke <wpp@marie.physik.tu-berlin.de>
				10	* Theodore Ts'o <tytso@mit.edu>
Christoph Lameter	89ada67	2005-10-30 15:01:59 -0800	[diff] [blame]	11	*
Christoph Lameter	cde5353	2008-07-04 09:59:22 -0700	[diff] [blame]	12	* Made to use alloc_percpu by Christoph Lameter.
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	13	*
				14	* Copyright (C) 2010 SUSE Linux Products GmbH
				15	* Copyright (C) 2010 Tejun Heo <tj@kernel.org>
				16	*
				17	* This is the generic async execution mechanism. Work items are
				18	* executed in process context. The worker pool is shared and
				19	* automatically managed. There is one worker pool for each CPU and
				20	* one extra for works which are better served by workers which are
				21	* not bound to any specific CPU.
				22	*
				23	* Please read Documentation/workqueue.txt for details.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	24	*/
				25
Paul Gortmaker	9984de1	2011-05-23 14:51:41 -0400	[diff] [blame]	26	#include <linux/export.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	27	#include <linux/kernel.h>
				28	#include <linux/sched.h>
				29	#include <linux/init.h>
				30	#include <linux/signal.h>
				31	#include <linux/completion.h>
				32	#include <linux/workqueue.h>
				33	#include <linux/slab.h>
				34	#include <linux/cpu.h>
				35	#include <linux/notifier.h>
				36	#include <linux/kthread.h>
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	37	#include <linux/hardirq.h>
Christoph Lameter	4693402	2006-10-11 01:21:26 -0700	[diff] [blame]	38	#include <linux/mempolicy.h>
Rafael J. Wysocki	341a595	2006-12-06 20:34:49 -0800	[diff] [blame]	39	#include <linux/freezer.h>
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	40	#include <linux/kallsyms.h>
				41	#include <linux/debug_locks.h>
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	42	#include <linux/lockdep.h>
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	43	#include <linux/idr.h>
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	44
				45	#include "workqueue_sched.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	46
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	47	enum {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	48	/* global_cwq flags */
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	49	GCWQ_DISASSOCIATED = 1 << 0, /* cpu can't serve workers */
				50	GCWQ_FREEZING = 1 << 1, /* freeze in progress */
				51
				52	/* pool flags */
				53	POOL_MANAGE_WORKERS = 1 << 0, /* need to manage workers */
				54	POOL_MANAGING_WORKERS = 1 << 1, /* managing workers */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	55
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	56	/* worker flags */
				57	WORKER_STARTED = 1 << 0, /* started */
				58	WORKER_DIE = 1 << 1, /* die die die */
				59	WORKER_IDLE = 1 << 2, /* is idle */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	60	WORKER_PREP = 1 << 3, /* preparing to run works */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	61	WORKER_ROGUE = 1 << 4, /* not bound to any cpu */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	62	WORKER_REBIND = 1 << 5, /* mom is home, come back */
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	63	WORKER_CPU_INTENSIVE = 1 << 6, /* cpu intensive */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	64	WORKER_UNBOUND = 1 << 7, /* worker is unbound */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	65
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	66	WORKER_NOT_RUNNING = WORKER_PREP | WORKER_ROGUE | WORKER_REBIND |
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	67	WORKER_CPU_INTENSIVE | WORKER_UNBOUND,
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	68
				69	/* gcwq->trustee_state */
				70	TRUSTEE_START = 0, /* start */
				71	TRUSTEE_IN_CHARGE = 1, /* trustee in charge of gcwq */
				72	TRUSTEE_BUTCHER = 2, /* butcher workers */
				73	TRUSTEE_RELEASE = 3, /* release workers */
				74	TRUSTEE_DONE = 4, /* trustee is done */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	75
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	76	NR_WORKER_POOLS = 2, /* # worker pools per gcwq */
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	77
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	78	BUSY_WORKER_HASH_ORDER = 6, /* 64 pointers */
				79	BUSY_WORKER_HASH_SIZE = 1 << BUSY_WORKER_HASH_ORDER,
				80	BUSY_WORKER_HASH_MASK = BUSY_WORKER_HASH_SIZE - 1,
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	81
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	82	MAX_IDLE_WORKERS_RATIO = 4, /* 1/4 of busy can be idle */
				83	IDLE_WORKER_TIMEOUT = 300 * HZ, /* keep idle ones for 5 mins */
				84
Tejun Heo	3233cdb	2011-02-16 18:10:19 +0100	[diff] [blame]	85	MAYDAY_INITIAL_TIMEOUT = HZ / 100 >= 2 ? HZ / 100 : 2,
				86	/* call for help after 10ms
				87	(min two ticks) */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	88	MAYDAY_INTERVAL = HZ / 10, /* and then every 100ms */
				89	CREATE_COOLDOWN = HZ, /* time to breathe after fail */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	90	TRUSTEE_COOLDOWN = HZ / 10, /* for trustee draining */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	91
				92	/*
				93	* Rescue workers are used only on emergencies and shared by
				94	* all cpus. Give -20.
				95	*/
				96	RESCUER_NICE_LEVEL = -20,
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	97	HIGHPRI_NICE_LEVEL = -20,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	98	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	99
				100	/*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	101	* Structure fields follow one of the following exclusion rules.
				102	*
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	103	* I: Modifiable by initialization/destruction paths and read-only for
				104	* everyone else.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	105	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	106	* P: Preemption protected. Disabling preemption is enough and should
				107	* only be modified and accessed from the local cpu.
				108	*
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	109	* L: gcwq->lock protected. Access with gcwq->lock held.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	110	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	111	* X: During normal operation, modification requires gcwq->lock and
				112	* should be done only from local cpu. Either disabling preemption
				113	* on local cpu or grabbing gcwq->lock is enough for read access.
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	114	* If GCWQ_DISASSOCIATED is set, it's identical to L.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	115	*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	116	* F: wq->flush_mutex protected.
				117	*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	118	* W: workqueue_lock protected.
				119	*/
				120
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	121	struct global_cwq;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	122	struct worker_pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	123
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	124	/*
				125	* The poor guys doing the actual heavy lifting. All on-duty workers
				126	* are either serving the manager role, on idle list or on busy hash.
				127	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	128	struct worker {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	129	/* on idle list while idle, on busy hash table while busy */
				130	union {
				131	struct list_head entry; /* L: while idle */
				132	struct hlist_node hentry; /* L: while busy */
				133	};
				134
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	135	struct work_struct *current_work; /* L: work being processed */
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	136	work_func_t current_func; /* L: current_work's fn */
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	137	struct cpu_workqueue_struct *current_cwq; /* L: current_work's cwq */
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	138	struct list_head scheduled; /* L: scheduled works */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	139	struct task_struct *task; /* I: worker task */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	140	struct worker_pool *pool; /* I: the associated pool */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	141	/* 64 bytes boundary on 64bit, 32 on 32bit */
				142	unsigned long last_active; /* L: last active timestamp */
				143	unsigned int flags; /* X: flags */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	144	int id; /* I: worker id */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	145	struct work_struct rebind_work; /* L: rebind worker to cpu */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	146	};
				147
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	148	struct worker_pool {
				149	struct global_cwq *gcwq; /* I: the owning gcwq */
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	150	unsigned int flags; /* X: flags */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	151
				152	struct list_head worklist; /* L: list of pending works */
				153	int nr_workers; /* L: total number of workers */
				154	int nr_idle; /* L: currently idle ones */
				155
				156	struct list_head idle_list; /* X: list of idle workers */
				157	struct timer_list idle_timer; /* L: worker idle timeout */
				158	struct timer_list mayday_timer; /* L: SOS timer for workers */
				159
				160	struct ida worker_ida; /* L: for worker IDs */
				161	struct worker *first_idle; /* L: first idle worker */
				162	};
				163
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	164	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	165	* Global per-cpu workqueue. There's one and only one for each cpu
				166	* and all works are queued and processed here regardless of their
				167	* target workqueues.
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	168	*/
				169	struct global_cwq {
				170	spinlock_t lock; /* the gcwq lock */
				171	unsigned int cpu; /* I: the associated cpu */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	172	unsigned int flags; /* L: GCWQ_* flags */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	173
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	174	/* workers are chained either in busy_hash or pool idle_list */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	175	struct hlist_head busy_hash[BUSY_WORKER_HASH_SIZE];
				176	/* L: hash of busy workers */
				177
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	178	struct worker_pool pools[2]; /* normal and highpri pools */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	179
				180	struct task_struct *trustee; /* L: for gcwq shutdown */
				181	unsigned int trustee_state; /* L: trustee state */
				182	wait_queue_head_t trustee_wait; /* trustee wait */
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	183	} ____cacheline_aligned_in_smp;
				184
				185	/*
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	186	* The per-CPU workqueue. The lower WORK_STRUCT_FLAG_BITS of
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	187	* work_struct->data are used for flags and thus cwqs need to be
				188	* aligned at two's power of the number of flag bits.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	189	*/
				190	struct cpu_workqueue_struct {
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	191	struct worker_pool *pool; /* I: the associated pool */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	192	struct workqueue_struct *wq; /* I: the owning workqueue */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	193	int work_color; /* L: current color */
				194	int flush_color; /* L: flushing color */
				195	int nr_in_flight[WORK_NR_COLORS];
				196	/* L: nr of in_flight works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	197	int nr_active; /* L: nr of active works */
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	198	int max_active; /* L: max active works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	199	struct list_head delayed_works; /* L: delayed works */
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	200	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	201
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	202	/*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	203	* Structure used to wait for workqueue flush.
				204	*/
				205	struct wq_flusher {
				206	struct list_head list; /* F: list of flushers */
				207	int flush_color; /* F: flush color waiting for */
				208	struct completion done; /* flush completion */
				209	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	210
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	211	/*
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	212	* All cpumasks are assumed to be always set on UP and thus can't be
				213	* used to determine whether there's something to be done.
				214	*/
				215	#ifdef CONFIG_SMP
				216	typedef cpumask_var_t mayday_mask_t;
				217	#define mayday_test_and_set_cpu(cpu, mask) \
				218	cpumask_test_and_set_cpu((cpu), (mask))
				219	#define mayday_clear_cpu(cpu, mask) cpumask_clear_cpu((cpu), (mask))
				220	#define for_each_mayday_cpu(cpu, mask) for_each_cpu((cpu), (mask))
Tejun Heo	9c37547	2010-08-31 11:18:34 +0200	[diff] [blame]	221	#define alloc_mayday_mask(maskp, gfp) zalloc_cpumask_var((maskp), (gfp))
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	222	#define free_mayday_mask(mask) free_cpumask_var((mask))
				223	#else
				224	typedef unsigned long mayday_mask_t;
				225	#define mayday_test_and_set_cpu(cpu, mask) test_and_set_bit(0, &(mask))
				226	#define mayday_clear_cpu(cpu, mask) clear_bit(0, &(mask))
				227	#define for_each_mayday_cpu(cpu, mask) if ((cpu) = 0, (mask))
				228	#define alloc_mayday_mask(maskp, gfp) true
				229	#define free_mayday_mask(mask) do { } while (0)
				230	#endif
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	231
				232	/*
				233	* The externally visible workqueue abstraction is an array of
				234	* per-CPU workqueues:
				235	*/
				236	struct workqueue_struct {
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	237	unsigned int flags; /* W: WQ_* flags */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	238	union {
				239	struct cpu_workqueue_struct __percpu *pcpu;
				240	struct cpu_workqueue_struct *single;
				241	unsigned long v;
				242	} cpu_wq; /* I: cwq's */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	243	struct list_head list; /* W: list of all workqueues */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	244
				245	struct mutex flush_mutex; /* protects wq flushing */
				246	int work_color; /* F: current work color */
				247	int flush_color; /* F: current flush color */
				248	atomic_t nr_cwqs_to_flush; /* flush in progress */
				249	struct wq_flusher *first_flusher; /* F: first flusher */
				250	struct list_head flusher_queue; /* F: flush waiters */
				251	struct list_head flusher_overflow; /* F: flush overflow list */
				252
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	253	mayday_mask_t mayday_mask; /* cpus requesting rescue */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	254	struct worker *rescuer; /* I: rescue worker */
				255
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	256	int nr_drainers; /* W: drain in progress */
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	257	int saved_max_active; /* W: saved cwq max_active */
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	258	#ifdef CONFIG_LOCKDEP
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	259	struct lockdep_map lockdep_map;
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	260	#endif
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	261	char name[]; /* I: workqueue name */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	262	};
				263
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	264	struct workqueue_struct *system_wq __read_mostly;
				265	struct workqueue_struct *system_long_wq __read_mostly;
				266	struct workqueue_struct *system_nrt_wq __read_mostly;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	267	struct workqueue_struct *system_unbound_wq __read_mostly;
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	268	struct workqueue_struct *system_freezable_wq __read_mostly;
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	269	struct workqueue_struct *system_nrt_freezable_wq __read_mostly;
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	270	EXPORT_SYMBOL_GPL(system_wq);
				271	EXPORT_SYMBOL_GPL(system_long_wq);
				272	EXPORT_SYMBOL_GPL(system_nrt_wq);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	273	EXPORT_SYMBOL_GPL(system_unbound_wq);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	274	EXPORT_SYMBOL_GPL(system_freezable_wq);
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	275	EXPORT_SYMBOL_GPL(system_nrt_freezable_wq);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	276
Tejun Heo	97bd234	2010-10-05 10:41:14 +0200	[diff] [blame]	277	#define CREATE_TRACE_POINTS
				278	#include <trace/events/workqueue.h>
				279
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	280	#define for_each_worker_pool(pool, gcwq) \
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	281	for ((pool) = &(gcwq)->pools[0]; \
				282	(pool) < &(gcwq)->pools[NR_WORKER_POOLS]; (pool)++)
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	283
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	284	#define for_each_busy_worker(worker, i, pos, gcwq) \
				285	for (i = 0; i < BUSY_WORKER_HASH_SIZE; i++) \
				286	hlist_for_each_entry(worker, pos, &gcwq->busy_hash[i], hentry)
				287
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	288	static inline int __next_gcwq_cpu(int cpu, const struct cpumask *mask,
				289	unsigned int sw)
				290	{
				291	if (cpu < nr_cpu_ids) {
				292	if (sw & 1) {
				293	cpu = cpumask_next(cpu, mask);
				294	if (cpu < nr_cpu_ids)
				295	return cpu;
				296	}
				297	if (sw & 2)
				298	return WORK_CPU_UNBOUND;
				299	}
				300	return WORK_CPU_NONE;
				301	}
				302
				303	static inline int __next_wq_cpu(int cpu, const struct cpumask *mask,
				304	struct workqueue_struct *wq)
				305	{
				306	return __next_gcwq_cpu(cpu, mask, !(wq->flags & WQ_UNBOUND) ? 1 : 2);
				307	}
				308
Tejun Heo	0988495	2010-08-01 11:50:12 +0200	[diff] [blame]	309	/*
				310	* CPU iterators
				311	*
				312	* An extra gcwq is defined for an invalid cpu number
				313	* (WORK_CPU_UNBOUND) to host workqueues which are not bound to any
				314	* specific CPU. The following iterators are similar to
				315	* for_each_*_cpu() iterators but also consider the unbound gcwq.
				316	*
				317	* for_each_gcwq_cpu() : possible CPUs + WORK_CPU_UNBOUND
				318	* for_each_online_gcwq_cpu() : online CPUs + WORK_CPU_UNBOUND
				319	* for_each_cwq_cpu() : possible CPUs for bound workqueues,
				320	* WORK_CPU_UNBOUND for unbound workqueues
				321	*/
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	322	#define for_each_gcwq_cpu(cpu) \
				323	for ((cpu) = __next_gcwq_cpu(-1, cpu_possible_mask, 3); \
				324	(cpu) < WORK_CPU_NONE; \
				325	(cpu) = __next_gcwq_cpu((cpu), cpu_possible_mask, 3))
				326
				327	#define for_each_online_gcwq_cpu(cpu) \
				328	for ((cpu) = __next_gcwq_cpu(-1, cpu_online_mask, 3); \
				329	(cpu) < WORK_CPU_NONE; \
				330	(cpu) = __next_gcwq_cpu((cpu), cpu_online_mask, 3))
				331
				332	#define for_each_cwq_cpu(cpu, wq) \
				333	for ((cpu) = __next_wq_cpu(-1, cpu_possible_mask, (wq)); \
				334	(cpu) < WORK_CPU_NONE; \
				335	(cpu) = __next_wq_cpu((cpu), cpu_possible_mask, (wq)))
				336
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	337	#ifdef CONFIG_DEBUG_OBJECTS_WORK
				338
				339	static struct debug_obj_descr work_debug_descr;
				340
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	341	static void *work_debug_hint(void *addr)
				342	{
				343	return ((struct work_struct *) addr)->func;
				344	}
				345
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	346	/*
				347	* fixup_init is called when:
				348	* - an active object is initialized
				349	*/
				350	static int work_fixup_init(void *addr, enum debug_obj_state state)
				351	{
				352	struct work_struct *work = addr;
				353
				354	switch (state) {
				355	case ODEBUG_STATE_ACTIVE:
				356	cancel_work_sync(work);
				357	debug_object_init(work, &work_debug_descr);
				358	return 1;
				359	default:
				360	return 0;
				361	}
				362	}
				363
				364	/*
				365	* fixup_activate is called when:
				366	* - an active object is activated
				367	* - an unknown object is activated (might be a statically initialized object)
				368	*/
				369	static int work_fixup_activate(void *addr, enum debug_obj_state state)
				370	{
				371	struct work_struct *work = addr;
				372
				373	switch (state) {
				374
				375	case ODEBUG_STATE_NOTAVAILABLE:
				376	/*
				377	* This is not really a fixup. The work struct was
				378	* statically initialized. We just make sure that it
				379	* is tracked in the object tracker.
				380	*/
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	381	if (test_bit(WORK_STRUCT_STATIC_BIT, work_data_bits(work))) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	382	debug_object_init(work, &work_debug_descr);
				383	debug_object_activate(work, &work_debug_descr);
				384	return 0;
				385	}
				386	WARN_ON_ONCE(1);
				387	return 0;
				388
				389	case ODEBUG_STATE_ACTIVE:
				390	WARN_ON(1);
				391
				392	default:
				393	return 0;
				394	}
				395	}
				396
				397	/*
				398	* fixup_free is called when:
				399	* - an active object is freed
				400	*/
				401	static int work_fixup_free(void *addr, enum debug_obj_state state)
				402	{
				403	struct work_struct *work = addr;
				404
				405	switch (state) {
				406	case ODEBUG_STATE_ACTIVE:
				407	cancel_work_sync(work);
				408	debug_object_free(work, &work_debug_descr);
				409	return 1;
				410	default:
				411	return 0;
				412	}
				413	}
				414
				415	static struct debug_obj_descr work_debug_descr = {
				416	.name = "work_struct",
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	417	.debug_hint = work_debug_hint,
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	418	.fixup_init = work_fixup_init,
				419	.fixup_activate = work_fixup_activate,
				420	.fixup_free = work_fixup_free,
				421	};
				422
				423	static inline void debug_work_activate(struct work_struct *work)
				424	{
				425	debug_object_activate(work, &work_debug_descr);
				426	}
				427
				428	static inline void debug_work_deactivate(struct work_struct *work)
				429	{
				430	debug_object_deactivate(work, &work_debug_descr);
				431	}
				432
				433	void __init_work(struct work_struct *work, int onstack)
				434	{
				435	if (onstack)
				436	debug_object_init_on_stack(work, &work_debug_descr);
				437	else
				438	debug_object_init(work, &work_debug_descr);
				439	}
				440	EXPORT_SYMBOL_GPL(__init_work);
				441
				442	void destroy_work_on_stack(struct work_struct *work)
				443	{
				444	debug_object_free(work, &work_debug_descr);
				445	}
				446	EXPORT_SYMBOL_GPL(destroy_work_on_stack);
				447
				448	#else
				449	static inline void debug_work_activate(struct work_struct *work) { }
				450	static inline void debug_work_deactivate(struct work_struct *work) { }
				451	#endif
				452
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	453	/* Serializes the accesses to the list of workqueues. */
				454	static DEFINE_SPINLOCK(workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	455	static LIST_HEAD(workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	456	static bool workqueue_freezing; /* W: have wqs started freezing? */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	457
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	458	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	459	* The almighty global cpu workqueues. nr_running is the only field
				460	* which is expected to be used frequently by other cpus via
				461	* try_to_wake_up(). Put it in a separate cacheline.
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	462	*/
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	463	static DEFINE_PER_CPU(struct global_cwq, global_cwq);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	464	static DEFINE_PER_CPU_SHARED_ALIGNED(atomic_t, pool_nr_running[NR_WORKER_POOLS]);
Nathan Lynch	f756d5e	2006-01-08 01:05:12 -0800	[diff] [blame]	465
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	466	/*
				467	* Global cpu workqueue and nr_running counter for unbound gcwq. The
				468	* gcwq is always online, has GCWQ_DISASSOCIATED set, and all its
				469	* workers have WORKER_UNBOUND set.
				470	*/
				471	static struct global_cwq unbound_global_cwq;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	472	static atomic_t unbound_pool_nr_running[NR_WORKER_POOLS] = {
				473	[0 ... NR_WORKER_POOLS - 1] = ATOMIC_INIT(0), /* always 0 */
				474	};
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	475
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	476	static int worker_thread(void *__worker);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	477
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	478	static int worker_pool_pri(struct worker_pool *pool)
				479	{
				480	return pool - pool->gcwq->pools;
				481	}
				482
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	483	static struct global_cwq *get_gcwq(unsigned int cpu)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	484	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	485	if (cpu != WORK_CPU_UNBOUND)
				486	return &per_cpu(global_cwq, cpu);
				487	else
				488	return &unbound_global_cwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	489	}
				490
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	491	static atomic_t *get_pool_nr_running(struct worker_pool *pool)
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	492	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	493	int cpu = pool->gcwq->cpu;
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	494	int idx = worker_pool_pri(pool);
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	495
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	496	if (cpu != WORK_CPU_UNBOUND)
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	497	return &per_cpu(pool_nr_running, cpu)[idx];
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	498	else
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	499	return &unbound_pool_nr_running[idx];
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	500	}
				501
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	502	static struct cpu_workqueue_struct *get_cwq(unsigned int cpu,
				503	struct workqueue_struct *wq)
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	504	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	505	if (!(wq->flags & WQ_UNBOUND)) {
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	506	if (likely(cpu < nr_cpu_ids))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	507	return per_cpu_ptr(wq->cpu_wq.pcpu, cpu);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	508	} else if (likely(cpu == WORK_CPU_UNBOUND))
				509	return wq->cpu_wq.single;
				510	return NULL;
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	511	}
				512
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	513	static unsigned int work_color_to_flags(int color)
				514	{
				515	return color << WORK_STRUCT_COLOR_SHIFT;
				516	}
				517
				518	static int get_work_color(struct work_struct *work)
				519	{
				520	return (*work_data_bits(work) >> WORK_STRUCT_COLOR_SHIFT) &
				521	((1 << WORK_STRUCT_COLOR_BITS) - 1);
				522	}
				523
				524	static int work_next_color(int color)
				525	{
				526	return (color + 1) % WORK_NR_COLORS;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	527	}
				528
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	529	/*
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	530	* A work's data points to the cwq with WORK_STRUCT_CWQ set while the
				531	* work is on queue. Once execution starts, WORK_STRUCT_CWQ is
				532	* cleared and the work data contains the cpu number it was last on.
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	533	*
				534	* set_work_{cwq|cpu}() and clear_work_data() can be used to set the
				535	* cwq, cpu or clear work->data. These functions should only be
				536	* called while the work is owned - ie. while the PENDING bit is set.
				537	*
				538	* get_work_[g]cwq() can be used to obtain the gcwq or cwq
				539	* corresponding to a work. gcwq is available once the work has been
				540	* queued anywhere after initialization. cwq is available only from
				541	* queueing until execution starts.
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	542	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	543	static inline void set_work_data(struct work_struct *work, unsigned long data,
				544	unsigned long flags)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	545	{
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	546	BUG_ON(!work_pending(work));
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	547	atomic_long_set(&work->data, data | flags | work_static(work));
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	548	}
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	549
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	550	static void set_work_cwq(struct work_struct *work,
				551	struct cpu_workqueue_struct *cwq,
				552	unsigned long extra_flags)
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	553	{
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	554	set_work_data(work, (unsigned long)cwq,
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	555	WORK_STRUCT_PENDING | WORK_STRUCT_CWQ | extra_flags);
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	556	}
				557
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	558	static void set_work_cpu(struct work_struct *work, unsigned int cpu)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	559	{
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	560	set_work_data(work, cpu << WORK_STRUCT_FLAG_BITS, WORK_STRUCT_PENDING);
				561	}
				562
				563	static void clear_work_data(struct work_struct *work)
				564	{
				565	set_work_data(work, WORK_STRUCT_NO_CPU, 0);
				566	}
				567
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	568	static struct cpu_workqueue_struct *get_work_cwq(struct work_struct *work)
				569	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	570	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	571
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	572	if (data & WORK_STRUCT_CWQ)
				573	return (void *)(data & WORK_STRUCT_WQ_DATA_MASK);
				574	else
Srinivasarao P	b6e586c	2013-09-18 14:33:45 +0530	[diff] [blame]	575	{
				576	WARN_ON_ONCE(1);
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	577	return NULL;
Srinivasarao P	b6e586c	2013-09-18 14:33:45 +0530	[diff] [blame]	578	}
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	579	}
				580
				581	static struct global_cwq *get_work_gcwq(struct work_struct *work)
				582	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	583	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	584	unsigned int cpu;
				585
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	586	if (data & WORK_STRUCT_CWQ)
				587	return ((struct cpu_workqueue_struct *)
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	588	(data & WORK_STRUCT_WQ_DATA_MASK))->pool->gcwq;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	589
				590	cpu = data >> WORK_STRUCT_FLAG_BITS;
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	591	if (cpu == WORK_CPU_NONE)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	592	return NULL;
				593
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	594	BUG_ON(cpu >= nr_cpu_ids && cpu != WORK_CPU_UNBOUND);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	595	return get_gcwq(cpu);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	596	}
				597
				598	/*
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	599	* Policy functions. These define the policies on how the global worker
				600	* pools are managed. Unless noted otherwise, these functions assume that
				601	* they're being called with gcwq->lock held.
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	602	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	603
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	604	static bool __need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	605	{
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	606	return !atomic_read(get_pool_nr_running(pool));
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	607	}
				608
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	609	/*
				610	* Need to wake up a worker? Called from anything but currently
				611	* running workers.
Tejun Heo	b7b5c68	2012-07-12 14:46:37 -0700	[diff] [blame]	612	*
				613	* Note that, because unbound workers never contribute to nr_running, this
				614	* function will always return %true for unbound gcwq as long as the
				615	* worklist isn't empty.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	616	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	617	static bool need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	618	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	619	return !list_empty(&pool->worklist) && __need_more_worker(pool);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	620	}
				621
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	622	/* Can I start working? Called from busy but !running workers. */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	623	static bool may_start_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	624	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	625	return pool->nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	626	}
				627
				628	/* Do I need to keep working? Called from currently running workers. */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	629	static bool keep_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	630	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	631	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	632
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	633	return !list_empty(&pool->worklist) && atomic_read(nr_running) <= 1;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	634	}
				635
				636	/* Do we need a new worker? Called from manager. */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	637	static bool need_to_create_worker(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	638	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	639	return need_more_worker(pool) && !may_start_working(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	640	}
				641
				642	/* Do I need to be the manager? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	643	static bool need_to_manage_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	644	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	645	return need_to_create_worker(pool) ||
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	646	(pool->flags & POOL_MANAGE_WORKERS);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	647	}
				648
				649	/* Do we have too many workers and should some go away? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	650	static bool too_many_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	651	{
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	652	bool managing = pool->flags & POOL_MANAGING_WORKERS;
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	653	int nr_idle = pool->nr_idle + managing; /* manager is considered idle */
				654	int nr_busy = pool->nr_workers - nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	655
				656	return nr_idle > 2 && (nr_idle - 2) * MAX_IDLE_WORKERS_RATIO >= nr_busy;
				657	}
				658
				659	/*
				660	* Wake up functions.
				661	*/
				662
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	663	/* Return the first worker. Safe with preemption disabled */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	664	static struct worker *first_worker(struct worker_pool *pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	665	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	666	if (unlikely(list_empty(&pool->idle_list)))
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	667	return NULL;
				668
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	669	return list_first_entry(&pool->idle_list, struct worker, entry);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	670	}
				671
				672	/**
				673	* wake_up_worker - wake up an idle worker
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	674	* @pool: worker pool to wake worker from
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	675	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	676	* Wake up the first idle worker of @pool.
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	677	*
				678	* CONTEXT:
				679	* spin_lock_irq(gcwq->lock).
				680	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	681	static void wake_up_worker(struct worker_pool *pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	682	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	683	struct worker *worker = first_worker(pool);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	684
				685	if (likely(worker))
				686	wake_up_process(worker->task);
				687	}
				688
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	689	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	690	* wq_worker_waking_up - a worker is waking up
				691	* @task: task waking up
				692	* @cpu: CPU @task is waking up to
				693	*
				694	* This function is called during try_to_wake_up() when a worker is
				695	* being awoken.
				696	*
				697	* CONTEXT:
				698	* spin_lock_irq(rq->lock)
				699	*/
				700	void wq_worker_waking_up(struct task_struct *task, unsigned int cpu)
				701	{
				702	struct worker *worker = kthread_data(task);
				703
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	704	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	705	atomic_inc(get_pool_nr_running(worker->pool));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	706	}
				707
				708	/**
				709	* wq_worker_sleeping - a worker is going to sleep
				710	* @task: task going to sleep
				711	* @cpu: CPU in question, must be the current CPU number
				712	*
				713	* This function is called during schedule() when a busy worker is
				714	* going to sleep. Worker on the same cpu can be woken up by
				715	* returning pointer to its task.
				716	*
				717	* CONTEXT:
				718	* spin_lock_irq(rq->lock)
				719	*
				720	* RETURNS:
				721	* Worker task on @cpu to wake up, %NULL if none.
				722	*/
				723	struct task_struct *wq_worker_sleeping(struct task_struct *task,
				724	unsigned int cpu)
				725	{
				726	struct worker *worker = kthread_data(task), *to_wakeup = NULL;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	727	struct worker_pool *pool = worker->pool;
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	728	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	729
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	730	if (worker->flags & WORKER_NOT_RUNNING)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	731	return NULL;
				732
				733	/* this can only happen on the local cpu */
				734	BUG_ON(cpu != raw_smp_processor_id());
				735
				736	/*
				737	* The counterpart of the following dec_and_test, implied mb,
				738	* worklist not empty test sequence is in insert_work().
				739	* Please read comment there.
				740	*
				741	* NOT_RUNNING is clear. This means that trustee is not in
				742	* charge and we're running on the local cpu w/ rq lock held
				743	* and preemption disabled, which in turn means that none else
				744	* could be manipulating idle_list, so dereferencing idle_list
				745	* without gcwq lock is safe.
				746	*/
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	747	if (atomic_dec_and_test(nr_running) && !list_empty(&pool->worklist))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	748	to_wakeup = first_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	749	return to_wakeup ? to_wakeup->task : NULL;
				750	}
				751
				752	/**
				753	* worker_set_flags - set worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	754	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	755	* @flags: flags to set
				756	* @wakeup: wakeup an idle worker if necessary
				757	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	758	* Set @flags in @worker->flags and adjust nr_running accordingly. If
				759	* nr_running becomes zero and @wakeup is %true, an idle worker is
				760	* woken up.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	761	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	762	* CONTEXT:
				763	* spin_lock_irq(gcwq->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	764	*/
				765	static inline void worker_set_flags(struct worker *worker, unsigned int flags,
				766	bool wakeup)
				767	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	768	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	769
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	770	WARN_ON_ONCE(worker->task != current);
				771
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	772	/*
				773	* If transitioning into NOT_RUNNING, adjust nr_running and
				774	* wake up an idle worker as necessary if requested by
				775	* @wakeup.
				776	*/
				777	if ((flags & WORKER_NOT_RUNNING) &&
				778	!(worker->flags & WORKER_NOT_RUNNING)) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	779	atomic_t *nr_running = get_pool_nr_running(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	780
				781	if (wakeup) {
				782	if (atomic_dec_and_test(nr_running) &&
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	783	!list_empty(&pool->worklist))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	784	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	785	} else
				786	atomic_dec(nr_running);
				787	}
				788
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	789	worker->flags |= flags;
				790	}
				791
				792	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	793	* worker_clr_flags - clear worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	794	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	795	* @flags: flags to clear
				796	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	797	* Clear @flags in @worker->flags and adjust nr_running accordingly.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	798	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	799	* CONTEXT:
				800	* spin_lock_irq(gcwq->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	801	*/
				802	static inline void worker_clr_flags(struct worker *worker, unsigned int flags)
				803	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	804	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	805	unsigned int oflags = worker->flags;
				806
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	807	WARN_ON_ONCE(worker->task != current);
				808
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	809	worker->flags &= ~flags;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	810
Tejun Heo	42c025f	2011-01-11 15:58:49 +0100	[diff] [blame]	811	/*
				812	* If transitioning out of NOT_RUNNING, increment nr_running. Note
				813	* that the nested NOT_RUNNING is not a noop. NOT_RUNNING is mask
				814	* of multiple flags, not a single flag.
				815	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	816	if ((flags & WORKER_NOT_RUNNING) && (oflags & WORKER_NOT_RUNNING))
				817	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	818	atomic_inc(get_pool_nr_running(pool));
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	819	}
				820
				821	/**
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	822	* busy_worker_head - return the busy hash head for a work
				823	* @gcwq: gcwq of interest
				824	* @work: work to be hashed
				825	*
				826	* Return hash head of @gcwq for @work.
				827	*
				828	* CONTEXT:
				829	* spin_lock_irq(gcwq->lock).
				830	*
				831	* RETURNS:
				832	* Pointer to the hash head.
				833	*/
				834	static struct hlist_head *busy_worker_head(struct global_cwq *gcwq,
				835	struct work_struct *work)
				836	{
				837	const int base_shift = ilog2(sizeof(struct work_struct));
				838	unsigned long v = (unsigned long)work;
				839
				840	/* simple shift and fold hash, do we need something better? */
				841	v >>= base_shift;
				842	v += v >> BUSY_WORKER_HASH_ORDER;
				843	v &= BUSY_WORKER_HASH_MASK;
				844
				845	return &gcwq->busy_hash[v];
				846	}
				847
				848	/**
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	849	* __find_worker_executing_work - find worker which is executing a work
				850	* @gcwq: gcwq of interest
				851	* @bwh: hash head as returned by busy_worker_head()
				852	* @work: work to find worker for
				853	*
				854	* Find a worker which is executing @work on @gcwq. @bwh should be
				855	* the hash head obtained by calling busy_worker_head() with the same
				856	* work.
				857	*
				858	* CONTEXT:
				859	* spin_lock_irq(gcwq->lock).
				860	*
				861	* RETURNS:
				862	* Pointer to worker which is executing @work if found, NULL
				863	* otherwise.
				864	*/
				865	static struct worker *__find_worker_executing_work(struct global_cwq *gcwq,
				866	struct hlist_head *bwh,
				867	struct work_struct *work)
				868	{
				869	struct worker *worker;
				870	struct hlist_node *tmp;
				871
				872	hlist_for_each_entry(worker, tmp, bwh, hentry)
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	873	if (worker->current_work == work &&
				874	worker->current_func == work->func)
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	875	return worker;
				876	return NULL;
				877	}
				878
				879	/**
				880	* find_worker_executing_work - find worker which is executing a work
				881	* @gcwq: gcwq of interest
				882	* @work: work to find worker for
				883	*
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	884	* Find a worker which is executing @work on @gcwq by searching
				885	* @gcwq->busy_hash which is keyed by the address of @work. For a worker
				886	* to match, its current execution should match the address of @work and
				887	* its work function. This is to avoid unwanted dependency between
				888	* unrelated work executions through a work item being recycled while still
				889	* being executed.
				890	*
				891	* This is a bit tricky. A work item may be freed once its execution
				892	* starts and nothing prevents the freed area from being recycled for
				893	* another work item. If the same work item address ends up being reused
				894	* before the original execution finishes, workqueue will identify the
				895	* recycled work item as currently executing and make it wait until the
				896	* current execution finishes, introducing an unwanted dependency.
				897	*
				898	* This function checks the work item address, work function and workqueue
				899	* to avoid false positives. Note that this isn't complete as one may
				900	* construct a work function which can introduce dependency onto itself
				901	* through a recycled work item. Well, if somebody wants to shoot oneself
				902	* in the foot that badly, there's only so much we can do, and if such
				903	* deadlock actually occurs, it should be easy to locate the culprit work
				904	* function.
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	905	*
				906	* CONTEXT:
				907	* spin_lock_irq(gcwq->lock).
				908	*
				909	* RETURNS:
				910	* Pointer to worker which is executing @work if found, NULL
				911	* otherwise.
				912	*/
				913	static struct worker *find_worker_executing_work(struct global_cwq *gcwq,
				914	struct work_struct *work)
				915	{
				916	return __find_worker_executing_work(gcwq, busy_worker_head(gcwq, work),
				917	work);
				918	}
				919
				920	/**
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	921	* insert_work - insert a work into gcwq
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	922	* @cwq: cwq @work belongs to
				923	* @work: work to insert
				924	* @head: insertion point
				925	* @extra_flags: extra WORK_STRUCT_* flags to set
				926	*
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	927	* Insert @work which belongs to @cwq into @gcwq after @head.
				928	* @extra_flags is or'd to work_struct flags.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	929	*
				930	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	931	* spin_lock_irq(gcwq->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	932	*/
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	933	static void insert_work(struct cpu_workqueue_struct *cwq,
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	934	struct work_struct *work, struct list_head *head,
				935	unsigned int extra_flags)
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	936	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	937	struct worker_pool *pool = cwq->pool;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	938
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	939	/* we own @work, set data and link */
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	940	set_work_cwq(work, cwq, extra_flags);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	941
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	942	/*
				943	* Ensure that we get the right work->data if we see the
				944	* result of list_add() below, see try_to_grab_pending().
				945	*/
				946	smp_wmb();
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	947
Oleg Nesterov	1a4d9b0	2008-07-25 01:47:47 -0700	[diff] [blame]	948	list_add_tail(&work->entry, head);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	949
				950	/*
				951	* Ensure either wq_worker_sleeping() sees the above
				952	* list_add_tail() or we see zero nr_running to avoid workers
				953	* lying around lazily while there are works to be processed.
				954	*/
				955	smp_mb();
				956
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	957	if (__need_more_worker(pool))
				958	wake_up_worker(pool);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	959	}
				960
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	961	/*
				962	* Test whether @work is being queued from another work executing on the
				963	* same workqueue. This is rather expensive and should only be used from
				964	* cold paths.
				965	*/
				966	static bool is_chained_work(struct workqueue_struct *wq)
				967	{
				968	unsigned long flags;
				969	unsigned int cpu;
				970
				971	for_each_gcwq_cpu(cpu) {
				972	struct global_cwq *gcwq = get_gcwq(cpu);
				973	struct worker *worker;
				974	struct hlist_node *pos;
				975	int i;
				976
				977	spin_lock_irqsave(&gcwq->lock, flags);
				978	for_each_busy_worker(worker, i, pos, gcwq) {
				979	if (worker->task != current)
				980	continue;
				981	spin_unlock_irqrestore(&gcwq->lock, flags);
				982	/*
				983	* I'm @worker, no locking necessary. See if @work
				984	* is headed to the same workqueue.
				985	*/
				986	return worker->current_cwq->wq == wq;
				987	}
				988	spin_unlock_irqrestore(&gcwq->lock, flags);
				989	}
				990	return false;
				991	}
				992
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	993	static void __queue_work(unsigned int cpu, struct workqueue_struct *wq,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	994	struct work_struct *work)
				995	{
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	996	struct global_cwq *gcwq;
				997	struct cpu_workqueue_struct *cwq;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	998	struct list_head *worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	999	unsigned int work_flags;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1000	unsigned long flags;
				1001
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	1002	debug_work_activate(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1003
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1004	/* if dying, only works from the same workqueue are allowed */
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	1005	if (unlikely(wq->flags & WQ_DRAINING) &&
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1006	WARN_ON_ONCE(!is_chained_work(wq)))
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	1007	return;
				1008
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1009	/* determine gcwq to use */
				1010	if (!(wq->flags & WQ_UNBOUND)) {
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1011	struct global_cwq *last_gcwq;
				1012
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1013	if (unlikely(cpu == WORK_CPU_UNBOUND))
				1014	cpu = raw_smp_processor_id();
				1015
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1016	/*
				1017	* It's multi cpu. If @wq is non-reentrant and @work
				1018	* was previously on a different cpu, it might still
				1019	* be running there, in which case the work needs to
				1020	* be queued on that cpu to guarantee non-reentrance.
				1021	*/
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1022	gcwq = get_gcwq(cpu);
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1023	if (wq->flags & WQ_NON_REENTRANT &&
				1024	(last_gcwq = get_work_gcwq(work)) && last_gcwq != gcwq) {
				1025	struct worker *worker;
				1026
				1027	spin_lock_irqsave(&last_gcwq->lock, flags);
				1028
				1029	worker = find_worker_executing_work(last_gcwq, work);
				1030
				1031	if (worker && worker->current_cwq->wq == wq)
				1032	gcwq = last_gcwq;
				1033	else {
				1034	/* meh... not running there, queue here */
				1035	spin_unlock_irqrestore(&last_gcwq->lock, flags);
				1036	spin_lock_irqsave(&gcwq->lock, flags);
				1037	}
				1038	} else
				1039	spin_lock_irqsave(&gcwq->lock, flags);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1040	} else {
				1041	gcwq = get_gcwq(WORK_CPU_UNBOUND);
				1042	spin_lock_irqsave(&gcwq->lock, flags);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1043	}
				1044
				1045	/* gcwq determined, get cwq and queue */
				1046	cwq = get_cwq(gcwq->cpu, wq);
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1047	trace_workqueue_queue_work(cpu, cwq, work);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1048
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1049	BUG_ON(!list_empty(&work->entry));
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1050
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1051	cwq->nr_in_flight[cwq->work_color]++;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1052	work_flags = work_color_to_flags(cwq->work_color);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1053
				1054	if (likely(cwq->nr_active < cwq->max_active)) {
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1055	trace_workqueue_activate_work(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1056	cwq->nr_active++;
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1057	worklist = &cwq->pool->worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1058	} else {
				1059	work_flags |= WORK_STRUCT_DELAYED;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1060	worklist = &cwq->delayed_works;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1061	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1062
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1063	insert_work(cwq, work, worklist, work_flags);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1064
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1065	spin_unlock_irqrestore(&gcwq->lock, flags);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1066	}
				1067
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1068	/**
				1069	* queue_work - queue work on a workqueue
				1070	* @wq: workqueue to use
				1071	* @work: work to queue
				1072	*
Alan Stern	057647f	2006-10-28 10:38:58 -0700	[diff] [blame]	1073	* Returns 0 if @work was already on a queue, non-zero otherwise.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1074	*
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	1075	* We queue the work to the CPU on which it was submitted, but if the CPU dies
				1076	* it can be processed by another CPU.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1077	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	1078	int queue_work(struct workqueue_struct *wq, struct work_struct *work)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1079	{
Oleg Nesterov	ef1ca23	2008-07-25 01:47:53 -0700	[diff] [blame]	1080	int ret;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1081
Oleg Nesterov	ef1ca23	2008-07-25 01:47:53 -0700	[diff] [blame]	1082	ret = queue_work_on(get_cpu(), wq, work);
				1083	put_cpu();
				1084
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1085	return ret;
				1086	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1087	EXPORT_SYMBOL_GPL(queue_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1088
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1089	/**
				1090	* queue_work_on - queue work on specific cpu
				1091	* @cpu: CPU number to execute work on
				1092	* @wq: workqueue to use
				1093	* @work: work to queue
				1094	*
				1095	* Returns 0 if @work was already on a queue, non-zero otherwise.
				1096	*
				1097	* We queue the work to a specific CPU, the caller must ensure it
				1098	* can't go away.
				1099	*/
				1100	int
				1101	queue_work_on(int cpu, struct workqueue_struct *wq, struct work_struct *work)
				1102	{
				1103	int ret = 0;
				1104
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1105	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1106	__queue_work(cpu, wq, work);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1107	ret = 1;
				1108	}
				1109	return ret;
				1110	}
				1111	EXPORT_SYMBOL_GPL(queue_work_on);
				1112
Li Zefan	6d141c3	2008-02-08 04:21:09 -0800	[diff] [blame]	1113	static void delayed_work_timer_fn(unsigned long __data)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1114	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1115	struct delayed_work *dwork = (struct delayed_work *)__data;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1116	struct cpu_workqueue_struct *cwq = get_work_cwq(&dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1117
Srinivasarao P	b6e586c	2013-09-18 14:33:45 +0530	[diff] [blame]	1118	if (cwq != NULL)
				1119	__queue_work(smp_processor_id(), cwq->wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1120	}
				1121
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1122	/**
				1123	* queue_delayed_work - queue work on a workqueue after delay
				1124	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1125	* @dwork: delayable work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1126	* @delay: number of jiffies to wait before queueing
				1127	*
Alan Stern	057647f	2006-10-28 10:38:58 -0700	[diff] [blame]	1128	* Returns 0 if @dwork was already on a queue, non-zero otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1129	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	1130	int queue_delayed_work(struct workqueue_struct *wq,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1131	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1132	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1133	if (delay == 0)
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1134	return queue_work(wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1135
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1136	return queue_delayed_work_on(-1, wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1137	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1138	EXPORT_SYMBOL_GPL(queue_delayed_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1139
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1140	/**
				1141	* queue_delayed_work_on - queue work on specific CPU after delay
				1142	* @cpu: CPU number to execute work on
				1143	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1144	* @dwork: work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1145	* @delay: number of jiffies to wait before queueing
				1146	*
Alan Stern	057647f	2006-10-28 10:38:58 -0700	[diff] [blame]	1147	* Returns 0 if @dwork was already on a queue, non-zero otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1148	*/
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1149	int queue_delayed_work_on(int cpu, struct workqueue_struct *wq,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1150	struct delayed_work *dwork, unsigned long delay)
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1151	{
				1152	int ret = 0;
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1153	struct timer_list *timer = &dwork->timer;
				1154	struct work_struct *work = &dwork->work;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1155
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1156	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1157	unsigned int lcpu;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1158
Tejun Heo	4afca92	2012-12-04 07:40:39 -0800	[diff] [blame]	1159	WARN_ON_ONCE(timer_pending(timer));
				1160	WARN_ON_ONCE(!list_empty(&work->entry));
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1161
Andrew Liu	8a3e77c	2008-05-01 04:35:14 -0700	[diff] [blame]	1162	timer_stats_timer_set_start_info(&dwork->timer);
				1163
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1164	/*
				1165	* This stores cwq for the moment, for the timer_fn.
				1166	* Note that the work's gcwq is preserved to allow
				1167	* reentrance detection for delayed works.
				1168	*/
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1169	if (!(wq->flags & WQ_UNBOUND)) {
				1170	struct global_cwq *gcwq = get_work_gcwq(work);
				1171
				1172	if (gcwq && gcwq->cpu != WORK_CPU_UNBOUND)
				1173	lcpu = gcwq->cpu;
				1174	else
				1175	lcpu = raw_smp_processor_id();
				1176	} else
				1177	lcpu = WORK_CPU_UNBOUND;
				1178
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1179	set_work_cwq(work, get_cwq(lcpu, wq), 0);
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1180
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1181	timer->expires = jiffies + delay;
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1182	timer->data = (unsigned long)dwork;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1183	timer->function = delayed_work_timer_fn;
Oleg Nesterov	63bc036	2007-05-09 02:34:16 -0700	[diff] [blame]	1184
				1185	if (unlikely(cpu >= 0))
				1186	add_timer_on(timer, cpu);
				1187	else
				1188	add_timer(timer);
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1189	ret = 1;
				1190	}
				1191	return ret;
				1192	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1193	EXPORT_SYMBOL_GPL(queue_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1194
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1195	/**
				1196	* worker_enter_idle - enter idle state
				1197	* @worker: worker which is entering idle state
				1198	*
				1199	* @worker is entering idle state. Update stats and idle timer if
				1200	* necessary.
				1201	*
				1202	* LOCKING:
				1203	* spin_lock_irq(gcwq->lock).
				1204	*/
				1205	static void worker_enter_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1206	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1207	struct worker_pool *pool = worker->pool;
				1208	struct global_cwq *gcwq = pool->gcwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1209
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1210	BUG_ON(worker->flags & WORKER_IDLE);
				1211	BUG_ON(!list_empty(&worker->entry) &&
				1212	(worker->hentry.next || worker->hentry.pprev));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1213
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1214	/* can't use worker_set_flags(), also called from start_worker() */
				1215	worker->flags |= WORKER_IDLE;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1216	pool->nr_idle++;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1217	worker->last_active = jiffies;
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	1218
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1219	/* idle_list is LIFO */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1220	list_add(&worker->entry, &pool->idle_list);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1221
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1222	if (likely(!(worker->flags & WORKER_ROGUE))) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1223	if (too_many_workers(pool) && !timer_pending(&pool->idle_timer))
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1224	mod_timer(&pool->idle_timer,
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1225	jiffies + IDLE_WORKER_TIMEOUT);
				1226	} else
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1227	wake_up_all(&gcwq->trustee_wait);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1228
Tejun Heo	24312d3	2012-05-14 15:04:50 -0700	[diff] [blame]	1229	/*
				1230	* Sanity check nr_running. Because trustee releases gcwq->lock
				1231	* between setting %WORKER_ROGUE and zapping nr_running, the
				1232	* warning may trigger spuriously. Check iff trustee is idle.
				1233	*/
				1234	WARN_ON_ONCE(gcwq->trustee_state == TRUSTEE_DONE &&
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1235	pool->nr_workers == pool->nr_idle &&
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1236	atomic_read(get_pool_nr_running(pool)));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1237	}
				1238
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1239	/**
				1240	* worker_leave_idle - leave idle state
				1241	* @worker: worker which is leaving idle state
				1242	*
				1243	* @worker is leaving idle state. Update stats.
				1244	*
				1245	* LOCKING:
				1246	* spin_lock_irq(gcwq->lock).
				1247	*/
				1248	static void worker_leave_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1249	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1250	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1251
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1252	BUG_ON(!(worker->flags & WORKER_IDLE));
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	1253	worker_clr_flags(worker, WORKER_IDLE);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1254	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1255	list_del_init(&worker->entry);
				1256	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1257
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1258	/**
				1259	* worker_maybe_bind_and_lock - bind worker to its cpu if possible and lock gcwq
				1260	* @worker: self
				1261	*
				1262	* Works which are scheduled while the cpu is online must at least be
				1263	* scheduled to a worker which is bound to the cpu so that if they are
				1264	* flushed from cpu callbacks while cpu is going down, they are
				1265	* guaranteed to execute on the cpu.
				1266	*
				1267	* This function is to be used by rogue workers and rescuers to bind
				1268	* themselves to the target cpu and may race with cpu going down or
				1269	* coming online. kthread_bind() can't be used because it may put the
				1270	* worker to already dead cpu and set_cpus_allowed_ptr() can't be used
				1271	* verbatim as it's best effort and blocking and gcwq may be
				1272	* [dis]associated in the meantime.
				1273	*
				1274	* This function tries set_cpus_allowed_ptr() and locks gcwq and verifies
				1275	* the binding against GCWQ_DISASSOCIATED which is set during
				1276	* CPU_DYING and cleared during CPU_ONLINE, so if the worker enters
				1277	* idle state or fetches works without dropping lock, it can guarantee
				1278	* the scheduling requirement described in the first paragraph.
				1279	*
				1280	* CONTEXT:
				1281	* Might sleep. Called without any lock but returns with gcwq->lock
				1282	* held.
				1283	*
				1284	* RETURNS:
				1285	* %true if the associated gcwq is online (@worker is successfully
				1286	* bound), %false if offline.
				1287	*/
				1288	static bool worker_maybe_bind_and_lock(struct worker *worker)
Namhyung Kim	972fa1c	2010-08-22 23:19:43 +0900	[diff] [blame]	1289	__acquires(&gcwq->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1290	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1291	struct global_cwq *gcwq = worker->pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1292	struct task_struct *task = worker->task;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1293
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1294	while (true) {
				1295	/*
				1296	* The following call may fail, succeed or succeed
				1297	* without actually migrating the task to the cpu if
				1298	* it races with cpu hotunplug operation. Verify
				1299	* against GCWQ_DISASSOCIATED.
				1300	*/
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1301	if (!(gcwq->flags & GCWQ_DISASSOCIATED))
				1302	set_cpus_allowed_ptr(task, get_cpu_mask(gcwq->cpu));
Oleg Nesterov	85f4186	2007-05-09 02:34:20 -0700	[diff] [blame]	1303
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1304	spin_lock_irq(&gcwq->lock);
				1305	if (gcwq->flags & GCWQ_DISASSOCIATED)
				1306	return false;
				1307	if (task_cpu(task) == gcwq->cpu &&
				1308	cpumask_equal(&current->cpus_allowed,
				1309	get_cpu_mask(gcwq->cpu)))
				1310	return true;
				1311	spin_unlock_irq(&gcwq->lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1312
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1313	/*
				1314	* We've raced with CPU hot[un]plug. Give it a breather
				1315	* and retry migration. cond_resched() is required here;
				1316	* otherwise, we might deadlock against cpu_stop trying to
				1317	* bring down the CPU on non-preemptive kernel.
				1318	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1319	cpu_relax();
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1320	cond_resched();
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1321	}
				1322	}
				1323
				1324	/*
				1325	* Function for worker->rebind_work used to rebind rogue busy workers
				1326	* to the associated cpu which is coming back online. This is
				1327	* scheduled by cpu up but can race with other cpu hotplug operations
				1328	* and may be executed twice without intervening cpu down.
				1329	*/
				1330	static void worker_rebind_fn(struct work_struct *work)
				1331	{
				1332	struct worker *worker = container_of(work, struct worker, rebind_work);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1333	struct global_cwq *gcwq = worker->pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1334
				1335	if (worker_maybe_bind_and_lock(worker))
				1336	worker_clr_flags(worker, WORKER_REBIND);
				1337
				1338	spin_unlock_irq(&gcwq->lock);
				1339	}
				1340
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1341	static struct worker *alloc_worker(void)
				1342	{
				1343	struct worker *worker;
				1344
				1345	worker = kzalloc(sizeof(*worker), GFP_KERNEL);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1346	if (worker) {
				1347	INIT_LIST_HEAD(&worker->entry);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1348	INIT_LIST_HEAD(&worker->scheduled);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1349	INIT_WORK(&worker->rebind_work, worker_rebind_fn);
				1350	/* on creation a worker is in !idle && prep state */
				1351	worker->flags = WORKER_PREP;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1352	}
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1353	return worker;
				1354	}
				1355
				1356	/**
				1357	* create_worker - create a new workqueue worker
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1358	* @pool: pool the new worker will belong to
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1359	* @bind: whether to bind the new worker to the CPU of @pool's gcwq or not
				1360	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1361	* Create a new worker which is bound to @pool. The returned worker
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1362	* can be started by calling start_worker() or destroyed using
				1363	* destroy_worker().
				1364	*
				1365	* CONTEXT:
				1366	* Might sleep. Does GFP_KERNEL allocations.
				1367	*
				1368	* RETURNS:
				1369	* Pointer to the newly created worker, or %NULL on failure.
				1370	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1371	static struct worker *create_worker(struct worker_pool *pool, bool bind)
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1372	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1373	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1374	bool on_unbound_cpu = gcwq->cpu == WORK_CPU_UNBOUND;
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1375	const char *pri = worker_pool_pri(pool) ? "H" : "";
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1376	struct worker *worker = NULL;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1377	int id = -1;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1378
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1379	spin_lock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1380	while (ida_get_new(&pool->worker_ida, &id)) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1381	spin_unlock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1382	if (!ida_pre_get(&pool->worker_ida, GFP_KERNEL))
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1383	goto fail;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1384	spin_lock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1385	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1386	spin_unlock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1387
				1388	worker = alloc_worker();
				1389	if (!worker)
				1390	goto fail;
				1391
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1392	worker->pool = pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1393	worker->id = id;
				1394
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1395	if (!on_unbound_cpu)
Eric Dumazet	94dcf29	2011-03-22 16:30:45 -0700	[diff] [blame]	1396	worker->task = kthread_create_on_node(worker_thread,
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1397	worker, cpu_to_node(gcwq->cpu),
				1398	"kworker/%u:%d%s", gcwq->cpu, id, pri);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1399	else
				1400	worker->task = kthread_create(worker_thread, worker,
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1401	"kworker/u:%d%s", id, pri);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1402	if (IS_ERR(worker->task))
				1403	goto fail;
				1404
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1405	if (worker_pool_pri(pool))
				1406	set_user_nice(worker->task, HIGHPRI_NICE_LEVEL);
				1407
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1408	/*
				1409	* A rogue worker will become a regular one if CPU comes
				1410	* online later on. Make sure every worker has
				1411	* PF_THREAD_BOUND set.
				1412	*/
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1413	if (bind && !on_unbound_cpu)
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1414	kthread_bind(worker->task, gcwq->cpu);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1415	else {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1416	worker->task->flags |= PF_THREAD_BOUND;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1417	if (on_unbound_cpu)
				1418	worker->flags |= WORKER_UNBOUND;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1419	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1420
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1421	return worker;
				1422	fail:
				1423	if (id >= 0) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1424	spin_lock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1425	ida_remove(&pool->worker_ida, id);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1426	spin_unlock_irq(&gcwq->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1427	}
				1428	kfree(worker);
				1429	return NULL;
				1430	}
				1431
				1432	/**
				1433	* start_worker - start a newly created worker
				1434	* @worker: worker to start
				1435	*
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1436	* Make the gcwq aware of @worker and start it.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1437	*
				1438	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1439	* spin_lock_irq(gcwq->lock).
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1440	*/
				1441	static void start_worker(struct worker *worker)
				1442	{
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1443	worker->flags |= WORKER_STARTED;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1444	worker->pool->nr_workers++;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1445	worker_enter_idle(worker);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1446	wake_up_process(worker->task);
				1447	}
				1448
				1449	/**
				1450	* destroy_worker - destroy a workqueue worker
				1451	* @worker: worker to be destroyed
				1452	*
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1453	* Destroy @worker and adjust @gcwq stats accordingly.
				1454	*
				1455	* CONTEXT:
				1456	* spin_lock_irq(gcwq->lock) which is released and regrabbed.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1457	*/
				1458	static void destroy_worker(struct worker *worker)
				1459	{
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1460	struct worker_pool *pool = worker->pool;
				1461	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1462	int id = worker->id;
				1463
				1464	/* sanity check frenzy */
				1465	BUG_ON(worker->current_work);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1466	BUG_ON(!list_empty(&worker->scheduled));
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1467
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1468	if (worker->flags & WORKER_STARTED)
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1469	pool->nr_workers--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1470	if (worker->flags & WORKER_IDLE)
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1471	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1472
				1473	list_del_init(&worker->entry);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1474	worker->flags |= WORKER_DIE;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1475
				1476	spin_unlock_irq(&gcwq->lock);
				1477
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1478	kthread_stop(worker->task);
				1479	kfree(worker);
				1480
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1481	spin_lock_irq(&gcwq->lock);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1482	ida_remove(&pool->worker_ida, id);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1483	}
				1484
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1485	static void idle_worker_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1486	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1487	struct worker_pool *pool = (void *)__pool;
				1488	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1489
				1490	spin_lock_irq(&gcwq->lock);
				1491
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1492	if (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1493	struct worker *worker;
				1494	unsigned long expires;
				1495
				1496	/* idle_list is kept in LIFO order, check the last one */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1497	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1498	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1499
				1500	if (time_before(jiffies, expires))
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1501	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1502	else {
				1503	/* it's been idle for too long, wake up manager */
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1504	pool->flags |= POOL_MANAGE_WORKERS;
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1505	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1506	}
				1507	}
				1508
				1509	spin_unlock_irq(&gcwq->lock);
				1510	}
				1511
				1512	static bool send_mayday(struct work_struct *work)
				1513	{
				1514	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
				1515	struct workqueue_struct *wq = cwq->wq;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1516	unsigned int cpu;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1517
				1518	if (!(wq->flags & WQ_RESCUER))
				1519	return false;
				1520
				1521	/* mayday mayday mayday */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1522	cpu = cwq->pool->gcwq->cpu;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1523	/* WORK_CPU_UNBOUND can't be set in cpumask, use cpu 0 instead */
				1524	if (cpu == WORK_CPU_UNBOUND)
				1525	cpu = 0;
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	1526	if (!mayday_test_and_set_cpu(cpu, wq->mayday_mask))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1527	wake_up_process(wq->rescuer->task);
				1528	return true;
				1529	}
				1530
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1531	static void gcwq_mayday_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1532	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1533	struct worker_pool *pool = (void *)__pool;
				1534	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1535	struct work_struct *work;
				1536
				1537	spin_lock_irq(&gcwq->lock);
				1538
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1539	if (need_to_create_worker(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1540	/*
				1541	* We've been trying to create a new worker but
				1542	* haven't been successful. We might be hitting an
				1543	* allocation deadlock. Send distress signals to
				1544	* rescuers.
				1545	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1546	list_for_each_entry(work, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1547	send_mayday(work);
				1548	}
				1549
				1550	spin_unlock_irq(&gcwq->lock);
				1551
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1552	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INTERVAL);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1553	}
				1554
				1555	/**
				1556	* maybe_create_worker - create a new worker if necessary
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1557	* @pool: pool to create a new worker for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1558	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1559	* Create a new worker for @pool if necessary. @pool is guaranteed to
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1560	* have at least one idle worker on return from this function. If
				1561	* creating a new worker takes longer than MAYDAY_INTERVAL, mayday is
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1562	* sent to all rescuers with works scheduled on @pool to resolve
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1563	* possible allocation deadlock.
				1564	*
				1565	* On return, need_to_create_worker() is guaranteed to be false and
				1566	* may_start_working() true.
				1567	*
				1568	* LOCKING:
				1569	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1570	* multiple times. Does GFP_KERNEL allocations. Called only from
				1571	* manager.
				1572	*
				1573	* RETURNS:
				1574	* false if no action was taken and gcwq->lock stayed locked, true
				1575	* otherwise.
				1576	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1577	static bool maybe_create_worker(struct worker_pool *pool)
Namhyung Kim	06bd6eb	2010-08-22 23:19:42 +0900	[diff] [blame]	1578	__releases(&gcwq->lock)
				1579	__acquires(&gcwq->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1580	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1581	struct global_cwq *gcwq = pool->gcwq;
				1582
				1583	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1584	return false;
				1585	restart:
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1586	spin_unlock_irq(&gcwq->lock);
				1587
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1588	/* if we don't make progress in MAYDAY_INITIAL_TIMEOUT, call for help */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1589	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INITIAL_TIMEOUT);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1590
				1591	while (true) {
				1592	struct worker *worker;
				1593
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1594	worker = create_worker(pool, true);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1595	if (worker) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1596	del_timer_sync(&pool->mayday_timer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1597	spin_lock_irq(&gcwq->lock);
				1598	start_worker(worker);
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1599	BUG_ON(need_to_create_worker(pool));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1600	return true;
				1601	}
				1602
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1603	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1604	break;
				1605
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1606	__set_current_state(TASK_INTERRUPTIBLE);
				1607	schedule_timeout(CREATE_COOLDOWN);
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1608
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1609	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1610	break;
				1611	}
				1612
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1613	del_timer_sync(&pool->mayday_timer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1614	spin_lock_irq(&gcwq->lock);
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1615	if (need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1616	goto restart;
				1617	return true;
				1618	}
				1619
				1620	/**
				1621	* maybe_destroy_workers - destroy workers which have been idle for a while
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1622	* @pool: pool to destroy workers for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1623	*
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1624	* Destroy @pool workers which have been idle for longer than
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1625	* IDLE_WORKER_TIMEOUT.
				1626	*
				1627	* LOCKING:
				1628	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1629	* multiple times. Called only from manager.
				1630	*
				1631	* RETURNS:
				1632	* false if no action was taken and gcwq->lock stayed locked, true
				1633	* otherwise.
				1634	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1635	static bool maybe_destroy_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1636	{
				1637	bool ret = false;
				1638
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1639	while (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1640	struct worker *worker;
				1641	unsigned long expires;
				1642
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1643	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1644	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1645
				1646	if (time_before(jiffies, expires)) {
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1647	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1648	break;
				1649	}
				1650
				1651	destroy_worker(worker);
				1652	ret = true;
				1653	}
				1654
				1655	return ret;
				1656	}
				1657
				1658	/**
				1659	* manage_workers - manage worker pool
				1660	* @worker: self
				1661	*
				1662	* Assume the manager role and manage gcwq worker pool @worker belongs
				1663	* to. At any given time, there can be only zero or one manager per
				1664	* gcwq. The exclusion is handled automatically by this function.
				1665	*
				1666	* The caller can safely start processing works on false return. On
				1667	* true return, it's guaranteed that need_to_create_worker() is false
				1668	* and may_start_working() is true.
				1669	*
				1670	* CONTEXT:
				1671	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				1672	* multiple times. Does GFP_KERNEL allocations.
				1673	*
				1674	* RETURNS:
				1675	* false if no action was taken and gcwq->lock stayed locked, true if
				1676	* some action was taken.
				1677	*/
				1678	static bool manage_workers(struct worker *worker)
				1679	{
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1680	struct worker_pool *pool = worker->pool;
				1681	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1682	bool ret = false;
				1683
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1684	if (pool->flags & POOL_MANAGING_WORKERS)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1685	return ret;
				1686
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1687	pool->flags &= ~POOL_MANAGE_WORKERS;
				1688	pool->flags |= POOL_MANAGING_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1689
				1690	/*
				1691	* Destroy and then create so that may_start_working() is true
				1692	* on return.
				1693	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1694	ret |= maybe_destroy_workers(pool);
				1695	ret |= maybe_create_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1696
Tejun Heo	22ad564	2012-07-12 14:46:37 -0700	[diff] [blame]	1697	pool->flags &= ~POOL_MANAGING_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1698
				1699	/*
				1700	* The trustee might be waiting to take over the manager
				1701	* position, tell it we're done.
				1702	*/
				1703	if (unlikely(gcwq->trustee))
				1704	wake_up_all(&gcwq->trustee_wait);
				1705
				1706	return ret;
				1707	}
				1708
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1709	/**
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1710	* move_linked_works - move linked works to a list
				1711	* @work: start of series of works to be scheduled
				1712	* @head: target list to append @work to
				1713	* @nextp: out parameter for nested worklist walking
				1714	*
				1715	* Schedule linked works starting from @work to @head. Work series to
				1716	* be scheduled starts at @work and includes any consecutive work with
				1717	* WORK_STRUCT_LINKED set in its predecessor.
				1718	*
				1719	* If @nextp is not NULL, it's updated to point to the next work of
				1720	* the last scheduled work. This allows move_linked_works() to be
				1721	* nested inside outer list_for_each_entry_safe().
				1722	*
				1723	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1724	* spin_lock_irq(gcwq->lock).
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1725	*/
				1726	static void move_linked_works(struct work_struct *work, struct list_head *head,
				1727	struct work_struct **nextp)
				1728	{
				1729	struct work_struct *n;
				1730
				1731	/*
				1732	* Linked worklist will always end before the end of the list,
				1733	* use NULL for list head.
				1734	*/
				1735	list_for_each_entry_safe_from(work, n, NULL, entry) {
				1736	list_move_tail(&work->entry, head);
				1737	if (!(*work_data_bits(work) & WORK_STRUCT_LINKED))
				1738	break;
				1739	}
				1740
				1741	/*
				1742	* If we're already inside safe list traversal and have moved
				1743	* multiple works to the scheduled queue, the next position
				1744	* needs to be updated.
				1745	*/
				1746	if (nextp)
				1747	*nextp = n;
				1748	}
				1749
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	1750	static void cwq_activate_delayed_work(struct work_struct *work)
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1751	{
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	1752	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1753
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1754	trace_workqueue_activate_work(work);
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	1755	move_linked_works(work, &cwq->pool->worklist, NULL);
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1756	__clear_bit(WORK_STRUCT_DELAYED_BIT, work_data_bits(work));
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1757	cwq->nr_active++;
				1758	}
				1759
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	1760	static void cwq_activate_first_delayed(struct cpu_workqueue_struct *cwq)
				1761	{
				1762	struct work_struct *work = list_first_entry(&cwq->delayed_works,
				1763	struct work_struct, entry);
				1764
				1765	cwq_activate_delayed_work(work);
				1766	}
				1767
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1768	/**
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1769	* cwq_dec_nr_in_flight - decrement cwq's nr_in_flight
				1770	* @cwq: cwq of interest
				1771	* @color: color of work which left the queue
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1772	* @delayed: for a delayed work
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1773	*
				1774	* A work either has completed or is removed from pending queue,
				1775	* decrement nr_in_flight of its cwq and handle workqueue flushing.
				1776	*
				1777	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1778	* spin_lock_irq(gcwq->lock).
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1779	*/
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1780	static void cwq_dec_nr_in_flight(struct cpu_workqueue_struct *cwq, int color,
				1781	bool delayed)
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1782	{
				1783	/* ignore uncolored works */
				1784	if (color == WORK_NO_COLOR)
				1785	return;
				1786
				1787	cwq->nr_in_flight[color]--;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1788
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1789	if (!delayed) {
				1790	cwq->nr_active--;
				1791	if (!list_empty(&cwq->delayed_works)) {
				1792	/* one down, submit a delayed one */
				1793	if (cwq->nr_active < cwq->max_active)
				1794	cwq_activate_first_delayed(cwq);
				1795	}
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1796	}
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1797
				1798	/* is flush in progress and are we at the flushing tip? */
				1799	if (likely(cwq->flush_color != color))
				1800	return;
				1801
				1802	/* are there still in-flight works? */
				1803	if (cwq->nr_in_flight[color])
				1804	return;
				1805
				1806	/* this cwq is done, clear flush_color */
				1807	cwq->flush_color = -1;
				1808
				1809	/*
				1810	* If this was the last cwq, wake up the first flusher. It
				1811	* will handle the rest.
				1812	*/
				1813	if (atomic_dec_and_test(&cwq->wq->nr_cwqs_to_flush))
				1814	complete(&cwq->wq->first_flusher->done);
				1815	}
				1816
				1817	/**
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1818	* process_one_work - process single work
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1819	* @worker: self
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1820	* @work: work to process
				1821	*
				1822	* Process @work. This function contains all the logic necessary to
				1823	* process a single work including synchronization against and
				1824	* interaction with other workers on the same cpu, queueing and
				1825	* flushing. As long as context requirement is met, any worker can
				1826	* call this function to process a work.
				1827	*
				1828	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1829	* spin_lock_irq(gcwq->lock) which is released and regrabbed.
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1830	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1831	static void process_one_work(struct worker *worker, struct work_struct *work)
Namhyung Kim	06bd6eb	2010-08-22 23:19:42 +0900	[diff] [blame]	1832	__releases(&gcwq->lock)
				1833	__acquires(&gcwq->lock)
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1834	{
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1835	struct cpu_workqueue_struct *cwq = get_work_cwq(work);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1836	struct worker_pool *pool = worker->pool;
				1837	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1838	struct hlist_head *bwh = busy_worker_head(gcwq, work);
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1839	bool cpu_intensive = cwq->wq->flags & WQ_CPU_INTENSIVE;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1840	int work_color;
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1841	struct worker *collision;
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1842	#ifdef CONFIG_LOCKDEP
				1843	/*
				1844	* It is permissible to free the struct work_struct from
				1845	* inside the function that is called from it, this we need to
				1846	* take into account for lockdep too. To avoid bogus "held
				1847	* lock freed" warnings as well as problems when looking into
				1848	* work->lockdep_map, make a copy and use that here.
				1849	*/
				1850	struct lockdep_map lockdep_map = work->lockdep_map;
				1851	#endif
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	1852	/*
				1853	* A single work shouldn't be executed concurrently by
				1854	* multiple workers on a single cpu. Check whether anyone is
				1855	* already processing the work. If so, defer the work to the
				1856	* currently executing one.
				1857	*/
				1858	collision = __find_worker_executing_work(gcwq, bwh, work);
				1859	if (unlikely(collision)) {
				1860	move_linked_works(work, &collision->scheduled, NULL);
				1861	return;
				1862	}
				1863
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1864	/* claim and process */
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1865	debug_work_deactivate(work);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1866	hlist_add_head(&worker->hentry, bwh);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1867	worker->current_work = work;
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1868	worker->current_func = work->func;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	1869	worker->current_cwq = cwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	1870	work_color = get_work_color(work);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1871
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	1872	/* record the current cpu number in the work data and dequeue */
				1873	set_work_cpu(work, gcwq->cpu);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1874	list_del_init(&work->entry);
				1875
Tejun Heo	649027d	2010-06-29 10:07:14 +0200	[diff] [blame]	1876	/*
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1877	* CPU intensive works don't participate in concurrency
				1878	* management. They're the scheduler's responsibility.
				1879	*/
				1880	if (unlikely(cpu_intensive))
				1881	worker_set_flags(worker, WORKER_CPU_INTENSIVE, true);
				1882
Tejun Heo	b7b5c68	2012-07-12 14:46:37 -0700	[diff] [blame]	1883	/*
				1884	* Unbound gcwq isn't concurrency managed and work items should be
				1885	* executed ASAP. Wake up another worker if necessary.
				1886	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1887	if ((worker->flags & WORKER_UNBOUND) && need_more_worker(pool))
				1888	wake_up_worker(pool);
Tejun Heo	b7b5c68	2012-07-12 14:46:37 -0700	[diff] [blame]	1889
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1890	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1891
Tejun Heo	66307ae	2012-08-03 10:30:45 -0700	[diff] [blame]	1892	smp_wmb(); /* paired with test_and_set_bit(PENDING) */
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1893	work_clear_pending(work);
Tejun Heo	66307ae	2012-08-03 10:30:45 -0700	[diff] [blame]	1894
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	1895	lock_map_acquire_read(&cwq->wq->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1896	lock_map_acquire(&lockdep_map);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	1897	trace_workqueue_execute_start(work);
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1898	worker->current_func(work);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	1899	/*
				1900	* While we must be careful to not use "work" after this, the trace
				1901	* point will only record its address.
				1902	*/
				1903	trace_workqueue_execute_end(work);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1904	lock_map_release(&lockdep_map);
				1905	lock_map_release(&cwq->wq->lockdep_map);
				1906
				1907	if (unlikely(in_atomic() || lockdep_depth(current) > 0)) {
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1908	pr_err("BUG: workqueue leaked lock or atomic: %s/0x%08x/%d\n"
				1909	" last function: %pf\n",
				1910	current->comm, preempt_count(), task_pid_nr(current),
				1911	worker->current_func);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1912	debug_show_held_locks(current);
				1913	dump_stack();
				1914	}
				1915
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1916	spin_lock_irq(&gcwq->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1917
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	1918	/* clear cpu intensive status */
				1919	if (unlikely(cpu_intensive))
				1920	worker_clr_flags(worker, WORKER_CPU_INTENSIVE);
				1921
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1922	/* we're done with it, release */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1923	hlist_del_init(&worker->hentry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1924	worker->current_work = NULL;
Tejun Heo	55e3e1f	2012-12-18 10:35:02 -0800	[diff] [blame]	1925	worker->current_func = NULL;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	1926	worker->current_cwq = NULL;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1927	cwq_dec_nr_in_flight(cwq, work_color, false);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	1928	}
				1929
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1930	/**
				1931	* process_scheduled_works - process scheduled works
				1932	* @worker: self
				1933	*
				1934	* Process all scheduled works. Please note that the scheduled list
				1935	* may change while processing a work, so this function repeatedly
				1936	* fetches a work from the top and executes it.
				1937	*
				1938	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1939	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1940	* multiple times.
				1941	*/
				1942	static void process_scheduled_works(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1943	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1944	while (!list_empty(&worker->scheduled)) {
				1945	struct work_struct *work = list_first_entry(&worker->scheduled,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1946	struct work_struct, entry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1947	process_one_work(worker, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1948	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1949	}
				1950
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1951	/**
				1952	* worker_thread - the worker thread function
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1953	* @__worker: self
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1954	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1955	* The gcwq worker thread function. There's a single dynamic pool of
				1956	* these per each cpu. These workers process all works regardless of
				1957	* their specific target workqueue. The only exception is works which
				1958	* belong to workqueues with a rescuer which will be explained in
				1959	* rescuer_thread().
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1960	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1961	static int worker_thread(void *__worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1962	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1963	struct worker *worker = __worker;
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	1964	struct worker_pool *pool = worker->pool;
				1965	struct global_cwq *gcwq = pool->gcwq;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1966
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1967	/* tell the scheduler that this is a workqueue worker */
				1968	worker->task->flags |= PF_WQ_WORKER;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1969	woke_up:
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1970	spin_lock_irq(&gcwq->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1971
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1972	/* DIE can be set only while we're idle, checking here is enough */
				1973	if (worker->flags & WORKER_DIE) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	1974	spin_unlock_irq(&gcwq->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1975	worker->task->flags &= ~PF_WQ_WORKER;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1976	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1977	}
				1978
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1979	worker_leave_idle(worker);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1980	recheck:
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1981	/* no more worker necessary? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1982	if (!need_more_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1983	goto sleep;
				1984
				1985	/* do we need to manage? */
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	1986	if (unlikely(!may_start_working(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1987	goto recheck;
				1988
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1989	/*
				1990	* ->scheduled list can only be filled while a worker is
				1991	* preparing to process a work or actually processing it.
				1992	* Make sure nobody diddled with it while I was sleeping.
				1993	*/
				1994	BUG_ON(!list_empty(&worker->scheduled));
				1995
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1996	/*
				1997	* When control reaches this point, we're guaranteed to have
				1998	* at least one idle worker or that someone else has already
				1999	* assumed the manager role.
				2000	*/
				2001	worker_clr_flags(worker, WORKER_PREP);
				2002
				2003	do {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2004	struct work_struct *work =
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2005	list_first_entry(&pool->worklist,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2006	struct work_struct, entry);
				2007
				2008	if (likely(!(*work_data_bits(work) & WORK_STRUCT_LINKED))) {
				2009	/* optimization path, not strictly necessary */
				2010	process_one_work(worker, work);
				2011	if (unlikely(!list_empty(&worker->scheduled)))
				2012	process_scheduled_works(worker);
				2013	} else {
				2014	move_linked_works(work, &worker->scheduled, NULL);
				2015	process_scheduled_works(worker);
				2016	}
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	2017	} while (keep_working(pool));
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2018
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2019	worker_set_flags(worker, WORKER_PREP, false);
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2020	sleep:
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	2021	if (unlikely(need_to_manage_workers(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2022	goto recheck;
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2023
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2024	/*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2025	* gcwq->lock is held and there's no work to process and no
				2026	* need to manage, sleep. Workers are woken up only while
				2027	* holding gcwq->lock or from local cpu, so setting the
				2028	* current state before releasing gcwq->lock is enough to
				2029	* prevent losing any event.
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2030	*/
				2031	worker_enter_idle(worker);
				2032	__set_current_state(TASK_INTERRUPTIBLE);
				2033	spin_unlock_irq(&gcwq->lock);
				2034	schedule();
				2035	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2036	}
				2037
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2038	/**
				2039	* rescuer_thread - the rescuer thread function
				2040	* @__wq: the associated workqueue
				2041	*
				2042	* Workqueue rescuer thread function. There's one rescuer for each
				2043	* workqueue which has WQ_RESCUER set.
				2044	*
				2045	* Regular work processing on a gcwq may block trying to create a new
				2046	* worker which uses GFP_KERNEL allocation which has slight chance of
				2047	* developing into deadlock if some works currently on the same queue
				2048	* need to be processed to satisfy the GFP_KERNEL allocation. This is
				2049	* the problem rescuer solves.
				2050	*
				2051	* When such condition is possible, the gcwq summons rescuers of all
				2052	* workqueues which have works queued on the gcwq and let them process
				2053	* those works so that forward progress can be guaranteed.
				2054	*
				2055	* This should happen rarely.
				2056	*/
				2057	static int rescuer_thread(void *__wq)
				2058	{
				2059	struct workqueue_struct *wq = __wq;
				2060	struct worker *rescuer = wq->rescuer;
				2061	struct list_head *scheduled = &rescuer->scheduled;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2062	bool is_unbound = wq->flags & WQ_UNBOUND;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2063	unsigned int cpu;
				2064
				2065	set_user_nice(current, RESCUER_NICE_LEVEL);
				2066	repeat:
				2067	set_current_state(TASK_INTERRUPTIBLE);
				2068
Mike Galbraith	dbdd7f0	2012-11-28 07:17:18 +0100	[diff] [blame]	2069	if (kthread_should_stop()) {
				2070	__set_current_state(TASK_RUNNING);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2071	return 0;
Mike Galbraith	dbdd7f0	2012-11-28 07:17:18 +0100	[diff] [blame]	2072	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2073
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2074	/*
				2075	* See whether any cpu is asking for help. Unbounded
				2076	* workqueues use cpu 0 in mayday_mask for CPU_UNBOUND.
				2077	*/
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	2078	for_each_mayday_cpu(cpu, wq->mayday_mask) {
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2079	unsigned int tcpu = is_unbound ? WORK_CPU_UNBOUND : cpu;
				2080	struct cpu_workqueue_struct *cwq = get_cwq(tcpu, wq);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2081	struct worker_pool *pool = cwq->pool;
				2082	struct global_cwq *gcwq = pool->gcwq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2083	struct work_struct *work, *n;
				2084
				2085	__set_current_state(TASK_RUNNING);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	2086	mayday_clear_cpu(cpu, wq->mayday_mask);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2087
				2088	/* migrate to the target cpu if possible */
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2089	rescuer->pool = pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2090	worker_maybe_bind_and_lock(rescuer);
				2091
				2092	/*
				2093	* Slurp in all works issued via this workqueue and
				2094	* process'em.
				2095	*/
				2096	BUG_ON(!list_empty(&rescuer->scheduled));
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2097	list_for_each_entry_safe(work, n, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2098	if (get_work_cwq(work) == cwq)
				2099	move_linked_works(work, scheduled, &n);
				2100
				2101	process_scheduled_works(rescuer);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2102
				2103	/*
				2104	* Leave this gcwq. If keep_working() is %true, notify a
				2105	* regular worker; otherwise, we end up with 0 concurrency
				2106	* and stalling the execution.
				2107	*/
Tejun Heo	7ef6a93	2012-07-12 14:46:37 -0700	[diff] [blame]	2108	if (keep_working(pool))
				2109	wake_up_worker(pool);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2110
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2111	spin_unlock_irq(&gcwq->lock);
				2112	}
				2113
				2114	schedule();
				2115	goto repeat;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2116	}
				2117
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2118	struct wq_barrier {
				2119	struct work_struct work;
				2120	struct completion done;
				2121	};
				2122
				2123	static void wq_barrier_func(struct work_struct *work)
				2124	{
				2125	struct wq_barrier *barr = container_of(work, struct wq_barrier, work);
				2126	complete(&barr->done);
				2127	}
				2128
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2129	/**
				2130	* insert_wq_barrier - insert a barrier work
				2131	* @cwq: cwq to insert barrier into
				2132	* @barr: wq_barrier to insert
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2133	* @target: target work to attach @barr to
				2134	* @worker: worker currently executing @target, NULL if @target is not executing
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2135	*
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2136	* @barr is linked to @target such that @barr is completed only after
				2137	* @target finishes execution. Please note that the ordering
				2138	* guarantee is observed only with respect to @target and on the local
				2139	* cpu.
				2140	*
				2141	* Currently, a queued barrier can't be canceled. This is because
				2142	* try_to_grab_pending() can't determine whether the work to be
				2143	* grabbed is at the head of the queue and thus can't clear LINKED
				2144	* flag of the previous work while there must be a valid next work
				2145	* after a work with LINKED flag set.
				2146	*
				2147	* Note that when @worker is non-NULL, @target may be modified
				2148	* underneath us, so we can't reliably determine cwq from @target.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2149	*
				2150	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2151	* spin_lock_irq(gcwq->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2152	*/
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2153	static void insert_wq_barrier(struct cpu_workqueue_struct *cwq,
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2154	struct wq_barrier *barr,
				2155	struct work_struct *target, struct worker *worker)
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2156	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2157	struct list_head *head;
				2158	unsigned int linked = 0;
				2159
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2160	/*
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2161	* debugobject calls are safe here even with gcwq->lock locked
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2162	* as we know for sure that this will not trigger any of the
				2163	* checks and call back into the fixup functions where we
				2164	* might deadlock.
				2165	*/
Andrew Morton	ca1cab3	2010-10-26 14:22:34 -0700	[diff] [blame]	2166	INIT_WORK_ONSTACK(&barr->work, wq_barrier_func);
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2167	__set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(&barr->work));
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2168	init_completion(&barr->done);
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2169
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2170	/*
				2171	* If @target is currently being executed, schedule the
				2172	* barrier to the worker; otherwise, put it after @target.
				2173	*/
				2174	if (worker)
				2175	head = worker->scheduled.next;
				2176	else {
				2177	unsigned long *bits = work_data_bits(target);
				2178
				2179	head = target->entry.next;
				2180	/* there can already be other linked works, inherit and set */
				2181	linked = *bits & WORK_STRUCT_LINKED;
				2182	__set_bit(WORK_STRUCT_LINKED_BIT, bits);
				2183	}
				2184
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2185	debug_work_activate(&barr->work);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2186	insert_work(cwq, &barr->work, head,
				2187	work_color_to_flags(WORK_NO_COLOR) | linked);
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2188	}
				2189
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2190	/**
				2191	* flush_workqueue_prep_cwqs - prepare cwqs for workqueue flushing
				2192	* @wq: workqueue being flushed
				2193	* @flush_color: new flush color, < 0 for no-op
				2194	* @work_color: new work color, < 0 for no-op
				2195	*
				2196	* Prepare cwqs for workqueue flushing.
				2197	*
				2198	* If @flush_color is non-negative, flush_color on all cwqs should be
				2199	* -1. If no cwq has in-flight commands at the specified color, all
				2200	* cwq->flush_color's stay at -1 and %false is returned. If any cwq
				2201	* has in flight commands, its cwq->flush_color is set to
				2202	* @flush_color, @wq->nr_cwqs_to_flush is updated accordingly, cwq
				2203	* wakeup logic is armed and %true is returned.
				2204	*
				2205	* The caller should have initialized @wq->first_flusher prior to
				2206	* calling this function with non-negative @flush_color. If
				2207	* @flush_color is negative, no flush color update is done and %false
				2208	* is returned.
				2209	*
				2210	* If @work_color is non-negative, all cwqs should have the same
				2211	* work_color which is previous to @work_color and all will be
				2212	* advanced to @work_color.
				2213	*
				2214	* CONTEXT:
				2215	* mutex_lock(wq->flush_mutex).
				2216	*
				2217	* RETURNS:
				2218	* %true if @flush_color >= 0 and there's something to flush. %false
				2219	* otherwise.
				2220	*/
				2221	static bool flush_workqueue_prep_cwqs(struct workqueue_struct *wq,
				2222	int flush_color, int work_color)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2223	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2224	bool wait = false;
				2225	unsigned int cpu;
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2226
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2227	if (flush_color >= 0) {
				2228	BUG_ON(atomic_read(&wq->nr_cwqs_to_flush));
				2229	atomic_set(&wq->nr_cwqs_to_flush, 1);
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2230	}
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2231
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2232	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2233	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2234	struct global_cwq *gcwq = cwq->pool->gcwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2235
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2236	spin_lock_irq(&gcwq->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2237
				2238	if (flush_color >= 0) {
				2239	BUG_ON(cwq->flush_color != -1);
				2240
				2241	if (cwq->nr_in_flight[flush_color]) {
				2242	cwq->flush_color = flush_color;
				2243	atomic_inc(&wq->nr_cwqs_to_flush);
				2244	wait = true;
				2245	}
				2246	}
				2247
				2248	if (work_color >= 0) {
				2249	BUG_ON(work_color != work_next_color(cwq->work_color));
				2250	cwq->work_color = work_color;
				2251	}
				2252
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2253	spin_unlock_irq(&gcwq->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2254	}
				2255
				2256	if (flush_color >= 0 && atomic_dec_and_test(&wq->nr_cwqs_to_flush))
				2257	complete(&wq->first_flusher->done);
				2258
				2259	return wait;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2260	}
				2261
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2262	/**
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2263	* flush_workqueue - ensure that any scheduled work has run to completion.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2264	* @wq: workqueue to flush
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2265	*
				2266	* Forces execution of the workqueue and blocks until its completion.
				2267	* This is typically used in driver shutdown handlers.
				2268	*
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2269	* We sleep until all works which were queued on entry have been handled,
				2270	* but we are not livelocked by new incoming ones.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2271	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2272	void flush_workqueue(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2273	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2274	struct wq_flusher this_flusher = {
				2275	.list = LIST_HEAD_INIT(this_flusher.list),
				2276	.flush_color = -1,
				2277	.done = COMPLETION_INITIALIZER_ONSTACK(this_flusher.done),
				2278	};
				2279	int next_color;
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	2280
Ingo Molnar	3295f0e	2008-08-11 10:30:30 +0200	[diff] [blame]	2281	lock_map_acquire(&wq->lockdep_map);
				2282	lock_map_release(&wq->lockdep_map);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2283
				2284	mutex_lock(&wq->flush_mutex);
				2285
				2286	/*
				2287	* Start-to-wait phase
				2288	*/
				2289	next_color = work_next_color(wq->work_color);
				2290
				2291	if (next_color != wq->flush_color) {
				2292	/*
				2293	* Color space is not full. The current work_color
				2294	* becomes our flush_color and work_color is advanced
				2295	* by one.
				2296	*/
				2297	BUG_ON(!list_empty(&wq->flusher_overflow));
				2298	this_flusher.flush_color = wq->work_color;
				2299	wq->work_color = next_color;
				2300
				2301	if (!wq->first_flusher) {
				2302	/* no flush in progress, become the first flusher */
				2303	BUG_ON(wq->flush_color != this_flusher.flush_color);
				2304
				2305	wq->first_flusher = &this_flusher;
				2306
				2307	if (!flush_workqueue_prep_cwqs(wq, wq->flush_color,
				2308	wq->work_color)) {
				2309	/* nothing to flush, done */
				2310	wq->flush_color = next_color;
				2311	wq->first_flusher = NULL;
				2312	goto out_unlock;
				2313	}
				2314	} else {
				2315	/* wait in queue */
				2316	BUG_ON(wq->flush_color == this_flusher.flush_color);
				2317	list_add_tail(&this_flusher.list, &wq->flusher_queue);
				2318	flush_workqueue_prep_cwqs(wq, -1, wq->work_color);
				2319	}
				2320	} else {
				2321	/*
				2322	* Oops, color space is full, wait on overflow queue.
				2323	* The next flush completion will assign us
				2324	* flush_color and transfer to flusher_queue.
				2325	*/
				2326	list_add_tail(&this_flusher.list, &wq->flusher_overflow);
				2327	}
				2328
				2329	mutex_unlock(&wq->flush_mutex);
				2330
				2331	wait_for_completion(&this_flusher.done);
				2332
				2333	/*
				2334	* Wake-up-and-cascade phase
				2335	*
				2336	* First flushers are responsible for cascading flushes and
				2337	* handling overflow. Non-first flushers can simply return.
				2338	*/
				2339	if (wq->first_flusher != &this_flusher)
				2340	return;
				2341
				2342	mutex_lock(&wq->flush_mutex);
				2343
Tejun Heo	4ce48b3	2010-07-02 10:03:51 +0200	[diff] [blame]	2344	/* we might have raced, check again with mutex held */
				2345	if (wq->first_flusher != &this_flusher)
				2346	goto out_unlock;
				2347
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2348	wq->first_flusher = NULL;
				2349
				2350	BUG_ON(!list_empty(&this_flusher.list));
				2351	BUG_ON(wq->flush_color != this_flusher.flush_color);
				2352
				2353	while (true) {
				2354	struct wq_flusher next, tmp;
				2355
				2356	/* complete all the flushers sharing the current flush color */
				2357	list_for_each_entry_safe(next, tmp, &wq->flusher_queue, list) {
				2358	if (next->flush_color != wq->flush_color)
				2359	break;
				2360	list_del_init(&next->list);
				2361	complete(&next->done);
				2362	}
				2363
				2364	BUG_ON(!list_empty(&wq->flusher_overflow) &&
				2365	wq->flush_color != work_next_color(wq->work_color));
				2366
				2367	/* this flush_color is finished, advance by one */
				2368	wq->flush_color = work_next_color(wq->flush_color);
				2369
				2370	/* one color has been freed, handle overflow queue */
				2371	if (!list_empty(&wq->flusher_overflow)) {
				2372	/*
				2373	* Assign the same color to all overflowed
				2374	* flushers, advance work_color and append to
				2375	* flusher_queue. This is the start-to-wait
				2376	* phase for these overflowed flushers.
				2377	*/
				2378	list_for_each_entry(tmp, &wq->flusher_overflow, list)
				2379	tmp->flush_color = wq->work_color;
				2380
				2381	wq->work_color = work_next_color(wq->work_color);
				2382
				2383	list_splice_tail_init(&wq->flusher_overflow,
				2384	&wq->flusher_queue);
				2385	flush_workqueue_prep_cwqs(wq, -1, wq->work_color);
				2386	}
				2387
				2388	if (list_empty(&wq->flusher_queue)) {
				2389	BUG_ON(wq->flush_color != wq->work_color);
				2390	break;
				2391	}
				2392
				2393	/*
				2394	* Need to flush more colors. Make the next flusher
				2395	* the new first flusher and arm cwqs.
				2396	*/
				2397	BUG_ON(wq->flush_color == wq->work_color);
				2398	BUG_ON(wq->flush_color != next->flush_color);
				2399
				2400	list_del_init(&next->list);
				2401	wq->first_flusher = next;
				2402
				2403	if (flush_workqueue_prep_cwqs(wq, wq->flush_color, -1))
				2404	break;
				2405
				2406	/*
				2407	* Meh... this color is already done, clear first
				2408	* flusher and repeat cascading.
				2409	*/
				2410	wq->first_flusher = NULL;
				2411	}
				2412
				2413	out_unlock:
				2414	mutex_unlock(&wq->flush_mutex);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2415	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2416	EXPORT_SYMBOL_GPL(flush_workqueue);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2417
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2418	/**
				2419	* drain_workqueue - drain a workqueue
				2420	* @wq: workqueue to drain
				2421	*
				2422	* Wait until the workqueue becomes empty. While draining is in progress,
				2423	* only chain queueing is allowed. IOW, only currently pending or running
				2424	* work items on @wq can queue further work items on it. @wq is flushed
				2425	* repeatedly until it becomes empty. The number of flushing is detemined
				2426	* by the depth of chaining and should be relatively short. Whine if it
				2427	* takes too long.
				2428	*/
				2429	void drain_workqueue(struct workqueue_struct *wq)
				2430	{
				2431	unsigned int flush_cnt = 0;
				2432	unsigned int cpu;
				2433
				2434	/*
				2435	* __queue_work() needs to test whether there are drainers, is much
				2436	* hotter than drain_workqueue() and already looks at @wq->flags.
				2437	* Use WQ_DRAINING so that queue doesn't have to check nr_drainers.
				2438	*/
				2439	spin_lock(&workqueue_lock);
				2440	if (!wq->nr_drainers++)
				2441	wq->flags \|= WQ_DRAINING;
				2442	spin_unlock(&workqueue_lock);
				2443	reflush:
				2444	flush_workqueue(wq);
				2445
				2446	for_each_cwq_cpu(cpu, wq) {
				2447	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2448	bool drained;
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2449
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2450	spin_lock_irq(&cwq->pool->gcwq->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2451	drained = !cwq->nr_active && list_empty(&cwq->delayed_works);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2452	spin_unlock_irq(&cwq->pool->gcwq->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2453
				2454	if (drained)
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2455	continue;
				2456
				2457	if (++flush_cnt == 10 \|\|
				2458	(flush_cnt % 100 == 0 && flush_cnt <= 1000))
				2459	pr_warning("workqueue %s: flush on destruction isn't complete after %u tries\n",
				2460	wq->name, flush_cnt);
				2461	goto reflush;
				2462	}
				2463
				2464	spin_lock(&workqueue_lock);
				2465	if (!--wq->nr_drainers)
				2466	wq->flags &= ~WQ_DRAINING;
				2467	spin_unlock(&workqueue_lock);
				2468	}
				2469	EXPORT_SYMBOL_GPL(drain_workqueue);
				2470
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2471	static bool start_flush_work(struct work_struct work, struct wq_barrier barr,
				2472	bool wait_executing)
				2473	{
				2474	struct worker *worker = NULL;
				2475	struct global_cwq *gcwq;
				2476	struct cpu_workqueue_struct *cwq;
				2477
				2478	might_sleep();
				2479	gcwq = get_work_gcwq(work);
				2480	if (!gcwq)
				2481	return false;
				2482
				2483	spin_lock_irq(&gcwq->lock);
				2484	if (!list_empty(&work->entry)) {
				2485	/*
				2486	* See the comment near try_to_grab_pending()->smp_rmb().
				2487	* If it was re-queued to a different gcwq under us, we
				2488	* are not going to wait.
				2489	*/
				2490	smp_rmb();
				2491	cwq = get_work_cwq(work);
Tejun Heo	5865888	2012-07-12 14:46:37 -0700	[diff] [blame]	2492	if (unlikely(!cwq \|\| gcwq != cwq->pool->gcwq))
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2493	goto already_gone;
				2494	} else if (wait_executing) {
				2495	worker = find_worker_executing_work(gcwq, work);
				2496	if (!worker)
				2497	goto already_gone;
				2498	cwq = worker->current_cwq;
				2499	} else
				2500	goto already_gone;
				2501
				2502	insert_wq_barrier(cwq, barr, work, worker);
				2503	spin_unlock_irq(&gcwq->lock);
				2504
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2505	/*
				2506	* If @max_active is 1 or rescuer is in use, flushing another work
				2507	* item on the same workqueue may lead to deadlock. Make sure the
				2508	* flusher is not running on the same workqueue by verifying write
				2509	* access.
				2510	*/
				2511	if (cwq->wq->saved_max_active == 1 \|\| cwq->wq->flags & WQ_RESCUER)
				2512	lock_map_acquire(&cwq->wq->lockdep_map);
				2513	else
				2514	lock_map_acquire_read(&cwq->wq->lockdep_map);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2515	lock_map_release(&cwq->wq->lockdep_map);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2516
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2517	return true;
				2518	already_gone:
				2519	spin_unlock_irq(&gcwq->lock);
				2520	return false;
				2521	}
				2522
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2523	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2524	* flush_work - wait for a work to finish executing the last queueing instance
				2525	* @work: the work to flush
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2526	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2527	* Wait until @work has finished execution. This function considers
				2528	* only the last queueing instance of @work. If @work has been
				2529	* enqueued across different CPUs on a non-reentrant workqueue or on
				2530	* multiple workqueues, @work might still be executing on return on
				2531	* some of the CPUs from earlier queueing.
Oleg Nesterov	a67da70	2008-07-25 01:47:52 -0700	[diff] [blame]	2532	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2533	* If @work was queued only on a non-reentrant, ordered or unbound
				2534	* workqueue, @work is guaranteed to be idle on return if it hasn't
				2535	* been requeued since flush started.
				2536	*
				2537	* RETURNS:
				2538	* %true if flush_work() waited for the work to finish execution,
				2539	* %false if it was already idle.
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2540	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2541	bool flush_work(struct work_struct *work)
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2542	{
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2543	struct wq_barrier barr;
				2544
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2545	if (start_flush_work(work, &barr, true)) {
				2546	wait_for_completion(&barr.done);
				2547	destroy_work_on_stack(&barr.work);
				2548	return true;
				2549	} else
				2550	return false;
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2551	}
				2552	EXPORT_SYMBOL_GPL(flush_work);
				2553
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2554	static bool wait_on_cpu_work(struct global_cwq gcwq, struct work_struct work)
				2555	{
				2556	struct wq_barrier barr;
				2557	struct worker *worker;
				2558
				2559	spin_lock_irq(&gcwq->lock);
				2560
				2561	worker = find_worker_executing_work(gcwq, work);
				2562	if (unlikely(worker))
				2563	insert_wq_barrier(worker->current_cwq, &barr, work, worker);
				2564
				2565	spin_unlock_irq(&gcwq->lock);
				2566
				2567	if (unlikely(worker)) {
				2568	wait_for_completion(&barr.done);
				2569	destroy_work_on_stack(&barr.work);
				2570	return true;
				2571	} else
				2572	return false;
				2573	}
				2574
				2575	static bool wait_on_work(struct work_struct *work)
				2576	{
				2577	bool ret = false;
				2578	int cpu;
				2579
				2580	might_sleep();
				2581
				2582	lock_map_acquire(&work->lockdep_map);
				2583	lock_map_release(&work->lockdep_map);
				2584
				2585	for_each_gcwq_cpu(cpu)
				2586	ret \|= wait_on_cpu_work(get_gcwq(cpu), work);
				2587	return ret;
				2588	}
				2589
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2590	/**
				2591	* flush_work_sync - wait until a work has finished execution
				2592	* @work: the work to flush
				2593	*
				2594	* Wait until @work has finished execution. On return, it's
				2595	* guaranteed that all queueing instances of @work which happened
				2596	* before this function is called are finished. In other words, if
				2597	* @work hasn't been requeued since this function was called, @work is
				2598	* guaranteed to be idle on return.
				2599	*
				2600	* RETURNS:
				2601	* %true if flush_work_sync() waited for the work to finish execution,
				2602	* %false if it was already idle.
				2603	*/
				2604	bool flush_work_sync(struct work_struct *work)
				2605	{
				2606	struct wq_barrier barr;
				2607	bool pending, waited;
				2608
				2609	/* we'll wait for executions separately, queue barr only if pending */
				2610	pending = start_flush_work(work, &barr, false);
				2611
				2612	/* wait for executions to finish */
				2613	waited = wait_on_work(work);
				2614
				2615	/* wait for the pending one */
				2616	if (pending) {
				2617	wait_for_completion(&barr.done);
				2618	destroy_work_on_stack(&barr.work);
				2619	}
				2620
				2621	return pending \|\| waited;
				2622	}
				2623	EXPORT_SYMBOL_GPL(flush_work_sync);
				2624
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2625	/*
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2626	* Upon a successful return (>= 0), the caller "owns" WORK_STRUCT_PENDING bit,
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2627	* so this work can't be re-armed in any way.
				2628	*/
				2629	static int try_to_grab_pending(struct work_struct *work)
				2630	{
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2631	struct global_cwq *gcwq;
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2632	int ret = -1;
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2633
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2634	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work)))
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2635	return 0;
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2636
				2637	/*
				2638	* The queueing is in progress, or it is already queued. Try to
				2639	* steal it from ->worklist without clearing WORK_STRUCT_PENDING.
				2640	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2641	gcwq = get_work_gcwq(work);
				2642	if (!gcwq)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2643	return ret;
				2644
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2645	spin_lock_irq(&gcwq->lock);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2646	if (!list_empty(&work->entry)) {
				2647	/*
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2648	* This work is queued, but perhaps we locked the wrong gcwq.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2649	* In that case we must see the new value after rmb(), see
				2650	* insert_work()->wmb().
				2651	*/
				2652	smp_rmb();
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2653	if (gcwq == get_work_gcwq(work)) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2654	debug_work_deactivate(work);
Lai Jiangshan	31eafff	2012-09-18 10:40:00 -0700	[diff] [blame]	2655
				2656	/*
				2657	* A delayed work item cannot be grabbed directly
				2658	* because it might have linked NO_COLOR work items
				2659	* which, if left on the delayed_list, will confuse
				2660	* cwq->nr_active management later on and cause
				2661	* stall. Make sure the work item is activated
				2662	* before grabbing.
				2663	*/
				2664	if (*work_data_bits(work) & WORK_STRUCT_DELAYED)
				2665	cwq_activate_delayed_work(work);
				2666
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2667	list_del_init(&work->entry);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2668	cwq_dec_nr_in_flight(get_work_cwq(work),
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	2669	get_work_color(work),
				2670	*work_data_bits(work) & WORK_STRUCT_DELAYED);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2671	ret = 1;
				2672	}
				2673	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	2674	spin_unlock_irq(&gcwq->lock);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2675
				2676	return ret;
				2677	}
				2678
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2679	static bool __cancel_work_timer(struct work_struct *work,
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2680	struct timer_list* timer)
				2681	{
				2682	int ret;
				2683
				2684	do {
				2685	ret = (timer && likely(del_timer(timer)));
				2686	if (!ret)
				2687	ret = try_to_grab_pending(work);
				2688	wait_on_work(work);
				2689	} while (unlikely(ret < 0));
				2690
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2691	clear_work_data(work);
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2692	return ret;
				2693	}
				2694
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2695	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2696	* cancel_work_sync - cancel a work and wait for it to finish
				2697	* @work: the work to cancel
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2698	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2699	* Cancel @work and wait for its execution to finish. This function
				2700	* can be used even if the work re-queues itself or migrates to
				2701	* another workqueue. On return from this function, @work is
				2702	* guaranteed to be not pending or executing on any CPU.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2703	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2704	* cancel_work_sync(&delayed_work->work) must not be used for
				2705	* delayed_work's. Use cancel_delayed_work_sync() instead.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2706	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2707	* The caller must ensure that the workqueue on which @work was last
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2708	* queued can't be destroyed before this function returns.
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2709	*
				2710	* RETURNS:
				2711	* %true if @work was pending, %false otherwise.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2712	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2713	bool cancel_work_sync(struct work_struct *work)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2714	{
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2715	return __cancel_work_timer(work, NULL);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2716	}
Oleg Nesterov	28e53bd	2007-05-09 02:34:22 -0700	[diff] [blame]	2717	EXPORT_SYMBOL_GPL(cancel_work_sync);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2718
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2719	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2720	* flush_delayed_work - wait for a dwork to finish executing the last queueing
				2721	* @dwork: the delayed work to flush
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2722	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2723	* Delayed timer is cancelled and the pending work is queued for
				2724	* immediate execution. Like flush_work(), this function only
				2725	* considers the last queueing instance of @dwork.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2726	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2727	* RETURNS:
				2728	* %true if flush_work() waited for the work to finish execution,
				2729	* %false if it was already idle.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2730	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2731	bool flush_delayed_work(struct delayed_work *dwork)
				2732	{
				2733	if (del_timer_sync(&dwork->timer))
				2734	__queue_work(raw_smp_processor_id(),
				2735	get_work_cwq(&dwork->work)->wq, &dwork->work);
				2736	return flush_work(&dwork->work);
				2737	}
				2738	EXPORT_SYMBOL(flush_delayed_work);
				2739
				2740	/**
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2741	* flush_delayed_work_sync - wait for a dwork to finish
				2742	* @dwork: the delayed work to flush
				2743	*
				2744	* Delayed timer is cancelled and the pending work is queued for
				2745	* execution immediately. Other than timer handling, its behavior
				2746	* is identical to flush_work_sync().
				2747	*
				2748	* RETURNS:
				2749	* %true if flush_work_sync() waited for the work to finish execution,
				2750	* %false if it was already idle.
				2751	*/
				2752	bool flush_delayed_work_sync(struct delayed_work *dwork)
				2753	{
				2754	if (del_timer_sync(&dwork->timer))
				2755	__queue_work(raw_smp_processor_id(),
				2756	get_work_cwq(&dwork->work)->wq, &dwork->work);
				2757	return flush_work_sync(&dwork->work);
				2758	}
				2759	EXPORT_SYMBOL(flush_delayed_work_sync);
				2760
				2761	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2762	* cancel_delayed_work_sync - cancel a delayed work and wait for it to finish
				2763	* @dwork: the delayed work cancel
				2764	*
				2765	* This is cancel_work_sync() for delayed works.
				2766	*
				2767	* RETURNS:
				2768	* %true if @dwork was pending, %false otherwise.
				2769	*/
				2770	bool cancel_delayed_work_sync(struct delayed_work *dwork)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2771	{
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2772	return __cancel_work_timer(&dwork->work, &dwork->timer);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2773	}
Oleg Nesterov	f5a421a	2007-07-15 23:41:44 -0700	[diff] [blame]	2774	EXPORT_SYMBOL(cancel_delayed_work_sync);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2775
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2776	/**
				2777	* schedule_work - put work task in global workqueue
				2778	* @work: job to be done
				2779	*
Bart Van Assche	5b0f437d	2009-07-30 19:00:53 +0200	[diff] [blame]	2780	* Returns zero if @work was already on the kernel-global workqueue and
				2781	* non-zero otherwise.
				2782	*
				2783	* This puts a job in the kernel-global workqueue if it was not already
				2784	* queued and leaves it in the same position on the kernel-global
				2785	* workqueue otherwise.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2786	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2787	int schedule_work(struct work_struct *work)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2788	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2789	return queue_work(system_wq, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2790	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2791	EXPORT_SYMBOL(schedule_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2792
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	2793	/*
				2794	* schedule_work_on - put work task on a specific cpu
				2795	* @cpu: cpu to put the work task on
				2796	* @work: job to be done
				2797	*
				2798	* This puts a job on a specific cpu
				2799	*/
				2800	int schedule_work_on(int cpu, struct work_struct *work)
				2801	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2802	return queue_work_on(cpu, system_wq, work);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	2803	}
				2804	EXPORT_SYMBOL(schedule_work_on);
				2805
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2806	/**
				2807	* schedule_delayed_work - put work task in global workqueue after delay
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2808	* @dwork: job to be done
				2809	* @delay: number of jiffies to wait or 0 for immediate execution
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2810	*
				2811	* After waiting for a given time this puts a job in the kernel-global
				2812	* workqueue.
				2813	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2814	int schedule_delayed_work(struct delayed_work *dwork,
Ingo Molnar	82f67cd	2007-02-16 01:28:13 -0800	[diff] [blame]	2815	unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2816	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2817	return queue_delayed_work(system_wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2818	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2819	EXPORT_SYMBOL(schedule_delayed_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2820
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2821	/**
				2822	* schedule_delayed_work_on - queue work in global workqueue on CPU after delay
				2823	* @cpu: cpu to use
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2824	* @dwork: job to be done
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2825	* @delay: number of jiffies to wait
				2826	*
				2827	* After waiting for a given time this puts a job in the kernel-global
				2828	* workqueue on the specified CPU.
				2829	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2830	int schedule_delayed_work_on(int cpu,
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	2831	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2832	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2833	return queue_delayed_work_on(cpu, system_wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2834	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2835	EXPORT_SYMBOL(schedule_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2836
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2837	/**
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2838	* schedule_on_each_cpu - execute a function synchronously on each online CPU
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2839	* @func: the function to call
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2840	*
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2841	* schedule_on_each_cpu() executes @func on each online CPU using the
				2842	* system workqueue and blocks until all CPUs have completed.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2843	* schedule_on_each_cpu() is very slow.
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2844	*
				2845	* RETURNS:
				2846	* 0 on success, -errno on failure.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2847	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2848	int schedule_on_each_cpu(work_func_t func)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2849	{
				2850	int cpu;
Namhyung Kim	38f5156	2010-08-08 14:24:09 +0200	[diff] [blame]	2851	struct work_struct __percpu *works;
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2852
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2853	works = alloc_percpu(struct work_struct);
				2854	if (!works)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2855	return -ENOMEM;
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2856
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	2857	get_online_cpus();
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2858
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2859	for_each_online_cpu(cpu) {
Ingo Molnar	9bfb183	2006-12-18 20:05:09 +0100	[diff] [blame]	2860	struct work_struct *work = per_cpu_ptr(works, cpu);
				2861
				2862	INIT_WORK(work, func);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2863	schedule_work_on(cpu, work);
Andi Kleen	65a6446	2009-10-14 06:22:47 +0200	[diff] [blame]	2864	}
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2865
				2866	for_each_online_cpu(cpu)
				2867	flush_work(per_cpu_ptr(works, cpu));
				2868
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	2869	put_online_cpus();
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2870	free_percpu(works);
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2871	return 0;
				2872	}
				2873
/**
 * flush_scheduled_work - ensure that any scheduled work has run to completion.
 *
 * Flushes the kernel-global workqueue (system_wq) by calling
 * flush_workqueue() on it, and blocks until that flush completes.
 *
 * Think twice before calling this function!  It's very easy to get into
 * trouble if you don't take great care.  Either of the following situations
 * will lead to deadlock:
 *
 *	One of the work items currently on the workqueue needs to acquire
 *	a lock held by your code or its caller.
 *
 *	Your code is running in the context of a work routine.
 *
 * They will be detected by lockdep when they occur, but the first might not
 * occur very often.  It depends on what work items are on the workqueue and
 * what locks they need, which you have no control over.
 *
 * In most situations flushing the entire workqueue is overkill; you merely
 * need to know that a particular work item isn't queued and isn't running.
 * In such cases you should use cancel_delayed_work_sync() or
 * cancel_work_sync() instead.
 */
void flush_scheduled_work(void)
{
	flush_workqueue(system_wq);
}
EXPORT_SYMBOL(flush_scheduled_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2903
				2904	/**
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2905	* execute_in_process_context - reliably execute the routine with user context
				2906	* @fn: the function to execute
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2907	* @ew: guaranteed storage for the execute work structure (must
				2908	* be available when the work executes)
				2909	*
				2910	* Executes the function immediately if process context is available,
				2911	* otherwise schedules the function for delayed execution.
				2912	*
				2913	* Returns: 0 - function was executed
				2914	* 1 - function was scheduled for execution
				2915	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2916	int execute_in_process_context(work_func_t fn, struct execute_work *ew)
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2917	{
				2918	if (!in_interrupt()) {
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2919	fn(&ew->work);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2920	return 0;
				2921	}
				2922
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2923	INIT_WORK(&ew->work, fn);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	2924	schedule_work(&ew->work);
				2925
				2926	return 1;
				2927	}
				2928	EXPORT_SYMBOL_GPL(execute_in_process_context);
				2929
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2930	int keventd_up(void)
				2931	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2932	return system_wq != NULL;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2933	}
				2934
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2935	static int alloc_cwqs(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2936	{
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2937	/*
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	2938	* cwqs are forced aligned according to WORK_STRUCT_FLAG_BITS.
				2939	* Make sure that the alignment isn't lower than that of
				2940	* unsigned long long.
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2941	*/
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	2942	const size_t size = sizeof(struct cpu_workqueue_struct);
				2943	const size_t align = max_t(size_t, 1 << WORK_STRUCT_FLAG_BITS,
				2944	__alignof__(unsigned long long));
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2945
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	2946	if (!(wq->flags & WQ_UNBOUND))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2947	wq->cpu_wq.pcpu = __alloc_percpu(size, align);
Tejun Heo	931ac77	2010-07-20 11:07:48 +0200	[diff] [blame]	2948	else {
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2949	void *ptr;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	2950
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2951	/*
				2952	* Allocate enough room to align cwq and put an extra
				2953	* pointer at the end pointing back to the originally
				2954	* allocated pointer which will be used for free.
				2955	*/
				2956	ptr = kzalloc(size + align + sizeof(void *), GFP_KERNEL);
				2957	if (ptr) {
				2958	wq->cpu_wq.single = PTR_ALIGN(ptr, align);
				2959	(void *)(wq->cpu_wq.single + 1) = ptr;
				2960	}
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2961	}
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2962
Tejun Heo	0415b00	2011-03-24 18:50:09 +0100	[diff] [blame]	2963	/* just in case, make sure it's actually aligned */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2964	BUG_ON(!IS_ALIGNED(wq->cpu_wq.v, align));
				2965	return wq->cpu_wq.v ? 0 : -ENOMEM;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2966	}
				2967
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2968	static void free_cwqs(struct workqueue_struct *wq)
Oleg Nesterov	06ba38a	2007-05-09 02:34:15 -0700	[diff] [blame]	2969	{
Lai Jiangshan	e06ffa1	2012-03-09 18:03:20 +0800	[diff] [blame]	2970	if (!(wq->flags & WQ_UNBOUND))
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2971	free_percpu(wq->cpu_wq.pcpu);
				2972	else if (wq->cpu_wq.single) {
				2973	/* the pointer to free is stored right after the cwq */
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	2974	kfree((void *)(wq->cpu_wq.single + 1));
Oleg Nesterov	06ba38a	2007-05-09 02:34:15 -0700	[diff] [blame]	2975	}
				2976	}
				2977
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2978	static int wq_clamp_max_active(int max_active, unsigned int flags,
				2979	const char *name)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2980	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2981	int lim = flags & WQ_UNBOUND ? WQ_UNBOUND_MAX_ACTIVE : WQ_MAX_ACTIVE;
				2982
				2983	if (max_active < 1 \|\| max_active > lim)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2984	printk(KERN_WARNING "workqueue: max_active %d requested for %s "
				2985	"is out of range, clamping between %d and %d\n",
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2986	max_active, name, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2987
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	2988	return clamp_val(max_active, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2989	}
				2990
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	2991	struct workqueue_struct __alloc_workqueue_key(const char fmt,
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	2992	unsigned int flags,
				2993	int max_active,
				2994	struct lock_class_key *key,
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	2995	const char *lock_name, ...)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2996	{
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	2997	va_list args, args1;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	2998	struct workqueue_struct *wq;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2999	unsigned int cpu;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3000	size_t namelen;
				3001
				3002	/* determine namelen, allocate wq and format name */
				3003	va_start(args, lock_name);
				3004	va_copy(args1, args);
				3005	namelen = vsnprintf(NULL, 0, fmt, args) + 1;
				3006
				3007	wq = kzalloc(sizeof(*wq) + namelen, GFP_KERNEL);
				3008	if (!wq)
				3009	goto err;
				3010
				3011	vsnprintf(wq->name, namelen, fmt, args1);
				3012	va_end(args);
				3013	va_end(args1);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3014
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3015	/*
Tejun Heo	6370a6a	2010-10-11 15:12:27 +0200	[diff] [blame]	3016	* Workqueues which may be used during memory reclaim should
				3017	* have a rescuer to guarantee forward progress.
				3018	*/
				3019	if (flags & WQ_MEM_RECLAIM)
				3020	flags \|= WQ_RESCUER;
				3021
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3022	max_active = max_active ?: WQ_DFL_ACTIVE;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3023	max_active = wq_clamp_max_active(max_active, flags, wq->name);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3024
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3025	/* init wq */
Tejun Heo	97e37d7	2010-06-29 10:07:10 +0200	[diff] [blame]	3026	wq->flags = flags;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3027	wq->saved_max_active = max_active;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3028	mutex_init(&wq->flush_mutex);
				3029	atomic_set(&wq->nr_cwqs_to_flush, 0);
				3030	INIT_LIST_HEAD(&wq->flusher_queue);
				3031	INIT_LIST_HEAD(&wq->flusher_overflow);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3032
Johannes Berg	eb13ba8	2008-01-16 09:51:58 +0100	[diff] [blame]	3033	lockdep_init_map(&wq->lockdep_map, lock_name, key, 0);
Oleg Nesterov	cce1a16	2007-05-09 02:34:13 -0700	[diff] [blame]	3034	INIT_LIST_HEAD(&wq->list);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3035
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3036	if (alloc_cwqs(wq) < 0)
				3037	goto err;
				3038
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3039	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3040	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3041	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	3042	int pool_idx = (bool)(flags & WQ_HIGHPRI);
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3043
Tejun Heo	0f90004	2010-06-29 10:07:11 +0200	[diff] [blame]	3044	BUG_ON((unsigned long)cwq & WORK_STRUCT_FLAG_MASK);
Tejun Heo	dcb32ee	2012-07-13 22:16:45 -0700	[diff] [blame]	3045	cwq->pool = &gcwq->pools[pool_idx];
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3046	cwq->wq = wq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3047	cwq->flush_color = -1;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3048	cwq->max_active = max_active;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3049	INIT_LIST_HEAD(&cwq->delayed_works);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3050	}
				3051
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3052	if (flags & WQ_RESCUER) {
				3053	struct worker *rescuer;
				3054
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3055	if (!alloc_mayday_mask(&wq->mayday_mask, GFP_KERNEL))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3056	goto err;
				3057
				3058	wq->rescuer = rescuer = alloc_worker();
				3059	if (!rescuer)
				3060	goto err;
				3061
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3062	rescuer->task = kthread_create(rescuer_thread, wq, "%s",
				3063	wq->name);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3064	if (IS_ERR(rescuer->task))
				3065	goto err;
				3066
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3067	rescuer->task->flags \|= PF_THREAD_BOUND;
				3068	wake_up_process(rescuer->task);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3069	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3070
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3071	/*
				3072	* workqueue_lock protects global freeze state and workqueues
				3073	* list. Grab it, set max_active accordingly and add the new
				3074	* workqueue to workqueues list.
				3075	*/
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3076	spin_lock(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3077
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3078	if (workqueue_freezing && wq->flags & WQ_FREEZABLE)
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3079	for_each_cwq_cpu(cpu, wq)
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3080	get_cwq(cpu, wq)->max_active = 0;
				3081
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3082	list_add(&wq->list, &workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3083
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3084	spin_unlock(&workqueue_lock);
				3085
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3086	return wq;
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3087	err:
				3088	if (wq) {
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3089	free_cwqs(wq);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3090	free_mayday_mask(wq->mayday_mask);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3091	kfree(wq->rescuer);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3092	kfree(wq);
				3093	}
				3094	return NULL;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3095	}
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3096	EXPORT_SYMBOL_GPL(__alloc_workqueue_key);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3097
				3098	/**
				3099	* destroy_workqueue - safely terminate a workqueue
				3100	* @wq: target workqueue
				3101	*
				3102	* Safely destroy a workqueue. All work currently pending will be done first.
				3103	*/
				3104	void destroy_workqueue(struct workqueue_struct *wq)
				3105	{
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3106	unsigned int cpu;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3107
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	3108	/* drain it before proceeding with destruction */
				3109	drain_workqueue(wq);
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	3110
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3111	/*
				3112	* wq list is used to freeze wq, remove from list after
				3113	* flushing is complete in case freeze races us.
				3114	*/
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3115	spin_lock(&workqueue_lock);
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	3116	list_del(&wq->list);
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3117	spin_unlock(&workqueue_lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3118
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3119	/* sanity check */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3120	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3121	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3122	int i;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3123
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3124	for (i = 0; i < WORK_NR_COLORS; i++)
				3125	BUG_ON(cwq->nr_in_flight[i]);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	3126	BUG_ON(cwq->nr_active);
				3127	BUG_ON(!list_empty(&cwq->delayed_works));
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3128	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3129
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3130	if (wq->flags & WQ_RESCUER) {
				3131	kthread_stop(wq->rescuer->task);
Tejun Heo	f2e005a	2010-07-20 15:59:09 +0200	[diff] [blame]	3132	free_mayday_mask(wq->mayday_mask);
Xiaotian Feng	8d9df9f	2010-08-16 09:54:28 +0200	[diff] [blame]	3133	kfree(wq->rescuer);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3134	}
				3135
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3136	free_cwqs(wq);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3137	kfree(wq);
				3138	}
				3139	EXPORT_SYMBOL_GPL(destroy_workqueue);
				3140
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3141	/**
				3142	* workqueue_set_max_active - adjust max_active of a workqueue
				3143	* @wq: target workqueue
				3144	* @max_active: new max_active value.
				3145	*
				3146	* Set max_active of @wq to @max_active.
				3147	*
				3148	* CONTEXT:
				3149	* Don't call from IRQ context.
				3150	*/
				3151	void workqueue_set_max_active(struct workqueue_struct *wq, int max_active)
				3152	{
				3153	unsigned int cpu;
				3154
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3155	max_active = wq_clamp_max_active(max_active, wq->flags, wq->name);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3156
				3157	spin_lock(&workqueue_lock);
				3158
				3159	wq->saved_max_active = max_active;
				3160
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3161	for_each_cwq_cpu(cpu, wq) {
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3162	struct global_cwq *gcwq = get_gcwq(cpu);
				3163
				3164	spin_lock_irq(&gcwq->lock);
				3165
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3166	if (!(wq->flags & WQ_FREEZABLE) \|\|
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3167	!(gcwq->flags & GCWQ_FREEZING))
				3168	get_cwq(gcwq->cpu, wq)->max_active = max_active;
				3169
				3170	spin_unlock_irq(&gcwq->lock);
				3171	}
				3172
				3173	spin_unlock(&workqueue_lock);
				3174	}
				3175	EXPORT_SYMBOL_GPL(workqueue_set_max_active);
				3176
				3177	/**
				3178	* workqueue_congested - test whether a workqueue is congested
				3179	* @cpu: CPU in question
				3180	* @wq: target workqueue
				3181	*
				3182	* Test whether @wq's cpu workqueue for @cpu is congested. There is
				3183	* no synchronization around this function and the test result is
				3184	* unreliable and only useful as advisory hints or for debugging.
				3185	*
				3186	* RETURNS:
				3187	* %true if congested, %false otherwise.
				3188	*/
				3189	bool workqueue_congested(unsigned int cpu, struct workqueue_struct *wq)
				3190	{
				3191	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3192
				3193	return !list_empty(&cwq->delayed_works);
				3194	}
				3195	EXPORT_SYMBOL_GPL(workqueue_congested);
				3196
				3197	/**
				3198	* work_cpu - return the last known associated cpu for @work
				3199	* @work: the work of interest
				3200	*
				3201	* RETURNS:
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3202	* CPU number if @work was ever queued. WORK_CPU_NONE otherwise.
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3203	*/
				3204	unsigned int work_cpu(struct work_struct *work)
				3205	{
				3206	struct global_cwq *gcwq = get_work_gcwq(work);
				3207
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3208	return gcwq ? gcwq->cpu : WORK_CPU_NONE;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3209	}
				3210	EXPORT_SYMBOL_GPL(work_cpu);
				3211
				3212	/**
				3213	* work_busy - test whether a work is currently pending or running
				3214	* @work: the work to be tested
				3215	*
				3216	* Test whether @work is currently pending or running. There is no
				3217	* synchronization around this function and the test result is
				3218	* unreliable and only useful as advisory hints or for debugging.
				3219	* Especially for reentrant wqs, the pending state might hide the
				3220	* running state.
				3221	*
				3222	* RETURNS:
				3223	* OR'd bitmask of WORK_BUSY_* bits.
				3224	*/
				3225	unsigned int work_busy(struct work_struct *work)
				3226	{
				3227	struct global_cwq *gcwq = get_work_gcwq(work);
				3228	unsigned long flags;
				3229	unsigned int ret = 0;
				3230
				3231	if (!gcwq)
				3232	return false;
				3233
				3234	spin_lock_irqsave(&gcwq->lock, flags);
				3235
				3236	if (work_pending(work))
				3237	ret \|= WORK_BUSY_PENDING;
				3238	if (find_worker_executing_work(gcwq, work))
				3239	ret \|= WORK_BUSY_RUNNING;
				3240
				3241	spin_unlock_irqrestore(&gcwq->lock, flags);
				3242
				3243	return ret;
				3244	}
				3245	EXPORT_SYMBOL_GPL(work_busy);
				3246
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3247	/*
				3248	* CPU hotplug.
				3249	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3250	* There are two challenges in supporting CPU hotplug. Firstly, there
				3251	* are a lot of assumptions on strong associations among work, cwq and
				3252	* gcwq which make migrating pending and scheduled works very
				3253	* difficult to implement without impacting hot paths. Secondly,
				3254	* gcwqs serve mix of short, long and very long running works making
				3255	* blocked draining impractical.
				3256	*
				3257	* This is solved by allowing a gcwq to be detached from CPU, running
				3258	* it with unbound (rogue) workers and allowing it to be reattached
				3259	* later if the cpu comes back online. A separate thread is created
				3260	* to govern a gcwq in such state and is called the trustee of the
				3261	* gcwq.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3262	*
				3263	* Trustee states and their descriptions.
				3264	*
				3265	* START Command state used on startup. On CPU_DOWN_PREPARE, a
				3266	* new trustee is started with this state.
				3267	*
				3268	* IN_CHARGE Once started, trustee will enter this state after
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3269	* assuming the manager role and making all existing
				3270	* workers rogue. DOWN_PREPARE waits for trustee to
				3271	* enter this state. After reaching IN_CHARGE, trustee
				3272	* tries to execute the pending worklist until it's empty
				3273	* and the state is set to BUTCHER, or the state is set
				3274	* to RELEASE.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3275	*
				3276	* BUTCHER Command state which is set by the cpu callback after
				3277	* the cpu has gone down. Once this state is set trustee
				3278	* knows that there will be no new works on the worklist
				3279	* and once the worklist is empty it can proceed to
				3280	* killing idle workers.
				3281	*
				3282	* RELEASE Command state which is set by the cpu callback if the
				3283	* cpu down has been canceled or it has come online
				3284	* again. After recognizing this state, trustee stops
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3285	* trying to drain or butcher and clears ROGUE, rebinds
				3286	* all remaining workers back to the cpu and releases
				3287	* manager role.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3288	*
				3289	* DONE Trustee will enter this state after BUTCHER or RELEASE
				3290	* is complete.
				3291	*
				3292	* trustee CPU draining
				3293	* took over down complete
				3294	* START -----------> IN_CHARGE -----------> BUTCHER -----------> DONE
				3295	* \| \| ^
				3296	* \| CPU is back online v return workers \|
				3297	* ----------------> RELEASE --------------
				3298	*/
				3299
/**
 * trustee_wait_event_timeout - timed event wait for trustee
 * @cond: condition to wait for
 * @timeout: timeout in jiffies
 *
 * wait_event_timeout() for trustee to use.  Handles locking and
 * checks for RELEASE request.
 *
 * The macro refers to a variable named gcwq that must be in scope at
 * the point of use, and @cond is evaluated more than once, so it
 * should be free of side effects.  gcwq->lock is dropped around each
 * __wait_event_timeout() call and retaken afterwards.
 *
 * CONTEXT:
 * spin_lock_irq(gcwq->lock) which may be released and regrabbed
 * multiple times.  To be used by trustee.
 *
 * RETURNS:
 * Positive indicating left time if @cond is satisfied, 0 if timed
 * out, -1 if canceled.
 */
#define trustee_wait_event_timeout(cond, timeout) ({			\
	long __ret = (timeout);						\
	while (!((cond) || (gcwq->trustee_state == TRUSTEE_RELEASE)) &&	\
	       __ret) {							\
		spin_unlock_irq(&gcwq->lock);				\
		__wait_event_timeout(gcwq->trustee_wait, (cond) ||	\
			(gcwq->trustee_state == TRUSTEE_RELEASE),	\
			__ret);						\
		spin_lock_irq(&gcwq->lock);				\
	}								\
	gcwq->trustee_state == TRUSTEE_RELEASE ? -1 : (__ret);		\
})
				3328
/**
 * trustee_wait_event - event wait for trustee
 * @cond: condition to wait for
 *
 * wait_event() for trustee to use.  Implemented as
 * trustee_wait_event_timeout() with MAX_SCHEDULE_TIMEOUT, so it
 * automatically handles locking and checks for RELEASE request.
 * Like that macro, it relies on a variable named gcwq being in scope.
 *
 * CONTEXT:
 * spin_lock_irq(gcwq->lock) which may be released and regrabbed
 * multiple times.  To be used by trustee.
 *
 * RETURNS:
 * 0 if @cond is satisfied, -1 if canceled.
 */
#define trustee_wait_event(cond) ({					\
	long __ret1;							\
	__ret1 = trustee_wait_event_timeout(cond, MAX_SCHEDULE_TIMEOUT);\
	__ret1 < 0 ? -1 : 0;						\
})
				3348
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3349	static bool gcwq_is_managing_workers(struct global_cwq *gcwq)
				3350	{
				3351	struct worker_pool *pool;
				3352
				3353	for_each_worker_pool(pool, gcwq)
				3354	if (pool->flags & POOL_MANAGING_WORKERS)
				3355	return true;
				3356	return false;
				3357	}
				3358
				3359	static bool gcwq_has_idle_workers(struct global_cwq *gcwq)
				3360	{
				3361	struct worker_pool *pool;
				3362
				3363	for_each_worker_pool(pool, gcwq)
				3364	if (!list_empty(&pool->idle_list))
				3365	return true;
				3366	return false;
				3367	}
				3368
/**
 * trustee_thread - thread function of a gcwq's trustee
 * @__gcwq: the global_cwq to take over, passed as an opaque pointer
 *
 * Takes the manager role of every pool of the gcwq, marks all idle and
 * busy workers WORKER_ROGUE, zeroes the pools' nr_running counters and
 * stops their idle timers, then announces TRUSTEE_IN_CHARGE.  After
 * that it keeps pushing the pending worklists forward until it may
 * stop, destroys idle workers, asks the remaining busy workers to
 * rebind through their rebind_work, gives the manager role back and
 * announces TRUSTEE_DONE.
 *
 * Must start on the cpu of the gcwq (checked with BUG_ON).
 *
 * RETURNS:
 * Always 0.
 */
static int __cpuinit trustee_thread(void *__gcwq)
{
	struct global_cwq *gcwq = __gcwq;
	struct worker_pool *pool;
	struct worker *worker;
	struct work_struct *work;
	struct hlist_node *pos;
	long rc;
	int i;

	BUG_ON(gcwq->cpu != smp_processor_id());

	spin_lock_irq(&gcwq->lock);
	/*
	 * Claim the manager position and make all workers rogue.
	 * Trustee must be bound to the target cpu and can't be
	 * cancelled.
	 */
	BUG_ON(gcwq->cpu != smp_processor_id());
	rc = trustee_wait_event(!gcwq_is_managing_workers(gcwq));
	BUG_ON(rc < 0);

	for_each_worker_pool(pool, gcwq) {
		pool->flags |= POOL_MANAGING_WORKERS;

		list_for_each_entry(worker, &pool->idle_list, entry)
			worker->flags |= WORKER_ROGUE;
	}

	for_each_busy_worker(worker, i, pos, gcwq)
		worker->flags |= WORKER_ROGUE;

	/*
	 * Call schedule() so that we cross rq->lock and thus can
	 * guarantee sched callbacks see the rogue flag.  This is
	 * necessary as scheduler callbacks may be invoked from other
	 * cpus.
	 */
	spin_unlock_irq(&gcwq->lock);
	schedule();
	spin_lock_irq(&gcwq->lock);

	/*
	 * Sched callbacks are disabled now.  Zap nr_running.  After
	 * this, nr_running stays zero and need_more_worker() and
	 * keep_working() are always true as long as the worklist is
	 * not empty.
	 */
	for_each_worker_pool(pool, gcwq)
		atomic_set(get_pool_nr_running(pool), 0);

	/* the idle timers are stopped with gcwq->lock released */
	spin_unlock_irq(&gcwq->lock);
	for_each_worker_pool(pool, gcwq)
		del_timer_sync(&pool->idle_timer);
	spin_lock_irq(&gcwq->lock);

	/*
	 * We're now in charge.  Notify and proceed to drain.  We need
	 * to keep the gcwq running during the whole CPU down
	 * procedure as other cpu hotunplug callbacks may need to
	 * flush currently running tasks.
	 */
	gcwq->trustee_state = TRUSTEE_IN_CHARGE;
	wake_up_all(&gcwq->trustee_wait);

	/*
	 * The original cpu is in the process of dying and may go away
	 * anytime now.  When that happens, we and all workers would
	 * be migrated to other cpus.  Try draining any left work.  We
	 * want to get it over with ASAP - spam rescuers, wake up as
	 * many idlers as necessary and create new ones till the
	 * worklist is empty.  Note that if the gcwq is frozen, there
	 * may be frozen works in freezable cwqs.  Don't declare
	 * completion while frozen.
	 */
	while (true) {
		bool busy = false;

		/* a pool is busy while some of its workers are not idle */
		for_each_worker_pool(pool, gcwq)
			busy |= pool->nr_workers != pool->nr_idle;

		/*
		 * Leave only when nothing is busy, the gcwq is not
		 * freezing and the state has moved on from IN_CHARGE.
		 */
		if (!busy && !(gcwq->flags & GCWQ_FREEZING) &&
		    gcwq->trustee_state != TRUSTEE_IN_CHARGE)
			break;

		for_each_worker_pool(pool, gcwq) {
			int nr_works = 0;

			list_for_each_entry(work, &pool->worklist, entry) {
				send_mayday(work);
				nr_works++;
			}

			/* wake at most one idle worker per pending work */
			list_for_each_entry(worker, &pool->idle_list, entry) {
				if (!nr_works--)
					break;
				wake_up_process(worker->task);
			}

			if (need_to_create_worker(pool)) {
				/* create_worker() is called without the lock */
				spin_unlock_irq(&gcwq->lock);
				worker = create_worker(pool, false);
				spin_lock_irq(&gcwq->lock);
				if (worker) {
					worker->flags |= WORKER_ROGUE;
					start_worker(worker);
				}
			}
		}

		/* give a breather */
		if (trustee_wait_event_timeout(false, TRUSTEE_COOLDOWN) < 0)
			break;
	}

	/*
	 * Either all works have been scheduled and cpu is down, or
	 * cpu down has already been canceled.  Wait for and butcher
	 * all workers till we're canceled.
	 */
	do {
		rc = trustee_wait_event(gcwq_has_idle_workers(gcwq));

		/* i ends up non-zero while any pool still has workers */
		i = 0;
		for_each_worker_pool(pool, gcwq) {
			while (!list_empty(&pool->idle_list)) {
				worker = list_first_entry(&pool->idle_list,
							  struct worker, entry);
				destroy_worker(worker);
			}
			i |= pool->nr_workers;
		}
	} while (i && rc >= 0);

	/*
	 * At this point, either draining has completed and no worker
	 * is left, or cpu down has been canceled or the cpu is being
	 * brought back up.  There shouldn't be any idle one left.
	 * Tell the remaining busy ones to rebind once it finishes the
	 * currently scheduled works by scheduling the rebind_work.
	 */
	for_each_worker_pool(pool, gcwq)
		WARN_ON(!list_empty(&pool->idle_list));

	for_each_busy_worker(worker, i, pos, gcwq) {
		struct work_struct *rebind_work = &worker->rebind_work;
		unsigned long worker_flags = worker->flags;

		/*
		 * Rebind_work may race with future cpu hotplug
		 * operations.  Use a separate flag to mark that
		 * rebinding is scheduled.  The morphing should
		 * be atomic.
		 */
		worker_flags |= WORKER_REBIND;
		worker_flags &= ~WORKER_ROGUE;
		/* both flag changes are published with a single store */
		ACCESS_ONCE(worker->flags) = worker_flags;

		/* queue rebind_work, wq doesn't matter, use the default one */
		if (test_and_set_bit(WORK_STRUCT_PENDING_BIT,
				     work_data_bits(rebind_work)))
			continue;	/* already pending, nothing to queue */

		debug_work_activate(rebind_work);
		insert_work(get_cwq(gcwq->cpu, system_wq), rebind_work,
			    worker->scheduled.next,
			    work_color_to_flags(WORK_NO_COLOR));
	}

	/* relinquish manager role */
	for_each_worker_pool(pool, gcwq)
		pool->flags &= ~POOL_MANAGING_WORKERS;

	/* notify completion */
	gcwq->trustee = NULL;
	gcwq->trustee_state = TRUSTEE_DONE;
	wake_up_all(&gcwq->trustee_wait);
	spin_unlock_irq(&gcwq->lock);
	return 0;
}
				3549
				3550	/**
				3551	* wait_trustee_state - wait for trustee to enter the specified state
				3552	* @gcwq: gcwq the trustee of interest belongs to
				3553	* @state: target state to wait for
				3554	*
				3555	* Wait for the trustee to reach @state. DONE is already matched.
				3556	*
				3557	* CONTEXT:
				3558	* spin_lock_irq(gcwq->lock) which may be released and regrabbed
				3559	* multiple times. To be used by cpu_callback.
				3560	*/
				3561	static void __cpuinit wait_trustee_state(struct global_cwq *gcwq, int state)
Namhyung Kim	06bd6eb	2010-08-22 23:19:42 +0900	[diff] [blame]	3562	__releases(&gcwq->lock)
				3563	__acquires(&gcwq->lock)
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3564	{
				3565	if (!(gcwq->trustee_state == state \|\|
				3566	gcwq->trustee_state == TRUSTEE_DONE)) {
				3567	spin_unlock_irq(&gcwq->lock);
				3568	__wait_event(gcwq->trustee_wait,
				3569	gcwq->trustee_state == state \|\|
				3570	gcwq->trustee_state == TRUSTEE_DONE);
				3571	spin_lock_irq(&gcwq->lock);
				3572	}
				3573	}
				3574
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3575	static int __devinit workqueue_cpu_callback(struct notifier_block *nfb,
				3576	unsigned long action,
				3577	void *hcpu)
				3578	{
				3579	unsigned int cpu = (unsigned long)hcpu;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3580	struct global_cwq *gcwq = get_gcwq(cpu);
				3581	struct task_struct *new_trustee = NULL;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3582	struct worker *new_workers[NR_WORKER_POOLS] = { };
				3583	struct worker_pool *pool;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3584	unsigned long flags;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3585	int i;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3586
Rafael J. Wysocki	8bb7844	2007-05-09 02:35:10 -0700	[diff] [blame]	3587	action &= ~CPU_TASKS_FROZEN;
				3588
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3589	switch (action) {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3590	case CPU_DOWN_PREPARE:
				3591	new_trustee = kthread_create(trustee_thread, gcwq,
				3592	"workqueue_trustee/%d\n", cpu);
				3593	if (IS_ERR(new_trustee))
				3594	return notifier_from_errno(PTR_ERR(new_trustee));
				3595	kthread_bind(new_trustee, cpu);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3596	/* fall through */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3597	case CPU_UP_PREPARE:
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3598	i = 0;
				3599	for_each_worker_pool(pool, gcwq) {
				3600	BUG_ON(pool->first_idle);
				3601	new_workers[i] = create_worker(pool, false);
				3602	if (!new_workers[i++])
				3603	goto err_destroy;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3604	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3605	}
				3606
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3607	/* some are called w/ irq disabled, don't disturb irq status */
				3608	spin_lock_irqsave(&gcwq->lock, flags);
				3609
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	3610	switch (action) {
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3611	case CPU_DOWN_PREPARE:
				3612	/* initialize trustee and tell it to acquire the gcwq */
				3613	BUG_ON(gcwq->trustee \|\| gcwq->trustee_state != TRUSTEE_DONE);
				3614	gcwq->trustee = new_trustee;
				3615	gcwq->trustee_state = TRUSTEE_START;
				3616	wake_up_process(gcwq->trustee);
				3617	wait_trustee_state(gcwq, TRUSTEE_IN_CHARGE);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3618	/* fall through */
				3619	case CPU_UP_PREPARE:
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3620	i = 0;
				3621	for_each_worker_pool(pool, gcwq) {
				3622	BUG_ON(pool->first_idle);
				3623	pool->first_idle = new_workers[i++];
				3624	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3625	break;
				3626
				3627	case CPU_DYING:
				3628	/*
				3629	* Before this, the trustee and all workers except for
				3630	* the ones which are still executing works from
				3631	* before the last CPU down must be on the cpu. After
				3632	* this, they'll all be diasporas.
				3633	*/
				3634	gcwq->flags \|= GCWQ_DISASSOCIATED;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3635	break;
				3636
Oleg Nesterov	3da1c84	2008-07-25 01:47:50 -0700	[diff] [blame]	3637	case CPU_POST_DEAD:
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3638	gcwq->trustee_state = TRUSTEE_BUTCHER;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3639	/* fall through */
				3640	case CPU_UP_CANCELED:
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3641	for_each_worker_pool(pool, gcwq) {
				3642	destroy_worker(pool->first_idle);
				3643	pool->first_idle = NULL;
				3644	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3645	break;
				3646
				3647	case CPU_DOWN_FAILED:
				3648	case CPU_ONLINE:
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3649	gcwq->flags &= ~GCWQ_DISASSOCIATED;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3650	if (gcwq->trustee_state != TRUSTEE_DONE) {
				3651	gcwq->trustee_state = TRUSTEE_RELEASE;
				3652	wake_up_process(gcwq->trustee);
				3653	wait_trustee_state(gcwq, TRUSTEE_DONE);
				3654	}
				3655
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3656	/*
				3657	* Trustee is done and there might be no worker left.
				3658	* Put the first_idle in and request a real manager to
				3659	* take a look.
				3660	*/
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3661	for_each_worker_pool(pool, gcwq) {
				3662	spin_unlock_irq(&gcwq->lock);
				3663	kthread_bind(pool->first_idle->task, cpu);
				3664	spin_lock_irq(&gcwq->lock);
				3665	pool->flags \|= POOL_MANAGE_WORKERS;
				3666	start_worker(pool->first_idle);
				3667	pool->first_idle = NULL;
				3668	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3669	break;
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	3670	}
				3671
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3672	spin_unlock_irqrestore(&gcwq->lock, flags);
				3673
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3674	return notifier_from_errno(0);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3675
				3676	err_destroy:
				3677	if (new_trustee)
				3678	kthread_stop(new_trustee);
				3679
				3680	spin_lock_irqsave(&gcwq->lock, flags);
				3681	for (i = 0; i < NR_WORKER_POOLS; i++)
				3682	if (new_workers[i])
				3683	destroy_worker(new_workers[i]);
				3684	spin_unlock_irqrestore(&gcwq->lock, flags);
				3685
				3686	return NOTIFY_BAD;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3687	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3688
Tejun Heo	d3b4254	2012-07-17 12:39:26 -0700	[diff] [blame]	3689	/*
				3690	* Workqueues should be brought up before normal priority CPU notifiers.
				3691	* This will be registered high priority CPU notifier.
				3692	*/
				3693	static int __devinit workqueue_cpu_up_callback(struct notifier_block *nfb,
				3694	unsigned long action,
				3695	void *hcpu)
				3696	{
				3697	switch (action & ~CPU_TASKS_FROZEN) {
				3698	case CPU_UP_PREPARE:
				3699	case CPU_UP_CANCELED:
				3700	case CPU_DOWN_FAILED:
				3701	case CPU_ONLINE:
				3702	return workqueue_cpu_callback(nfb, action, hcpu);
				3703	}
				3704	return NOTIFY_OK;
				3705	}
				3706
				3707	/*
				3708	* Workqueues should be brought down after normal priority CPU notifiers.
				3709	* This will be registered as low priority CPU notifier.
				3710	*/
				3711	static int __devinit workqueue_cpu_down_callback(struct notifier_block *nfb,
				3712	unsigned long action,
				3713	void *hcpu)
				3714	{
				3715	switch (action & ~CPU_TASKS_FROZEN) {
				3716	case CPU_DOWN_PREPARE:
				3717	case CPU_DYING:
				3718	case CPU_POST_DEAD:
				3719	return workqueue_cpu_callback(nfb, action, hcpu);
				3720	}
				3721	return NOTIFY_OK;
				3722	}
				3723
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3724	#ifdef CONFIG_SMP
Rusty Russell	8ccad40	2009-01-16 15:31:15 -0800	[diff] [blame]	3725
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3726	struct work_for_cpu {
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3727	struct work_struct work;
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3728	long (fn)(void );
				3729	void *arg;
				3730	long ret;
				3731	};
				3732
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3733	static void work_for_cpu_fn(struct work_struct *work)
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3734	{
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3735	struct work_for_cpu *wfc = container_of(work, struct work_for_cpu, work);
				3736
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3737	wfc->ret = wfc->fn(wfc->arg);
				3738	}
				3739
				3740	/**
				3741	* work_on_cpu - run a function in user context on a particular cpu
				3742	* @cpu: the cpu to run on
				3743	* @fn: the function to run
				3744	* @arg: the function arg
				3745	*
Rusty Russell	31ad908	2009-01-16 15:31:15 -0800	[diff] [blame]	3746	* This will return the value @fn returns.
				3747	* It is up to the caller to ensure that the cpu doesn't go offline.
Andrew Morton	6b44003	2009-04-09 09:50:37 -0600	[diff] [blame]	3748	* The caller must not hold any locks which would prevent @fn from completing.
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3749	*/
				3750	long work_on_cpu(unsigned int cpu, long (fn)(void ), void *arg)
				3751	{
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3752	struct work_for_cpu wfc = { .fn = fn, .arg = arg };
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3753
Tejun Heo	fc7da7e	2012-09-18 12:48:43 -0700	[diff] [blame]	3754	INIT_WORK_ONSTACK(&wfc.work, work_for_cpu_fn);
				3755	schedule_work_on(cpu, &wfc.work);
				3756	flush_work(&wfc.work);
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	3757	return wfc.ret;
				3758	}
				3759	EXPORT_SYMBOL_GPL(work_on_cpu);
				3760	#endif /* CONFIG_SMP */
				3761
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3762	#ifdef CONFIG_FREEZER
Rusty Russell	e7577c5	2009-01-01 10:12:25 +1030	[diff] [blame]	3763
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3764	/**
				3765	* freeze_workqueues_begin - begin freezing workqueues
				3766	*
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3767	* Start freezing workqueues. After this function returns, all freezable
				3768	* workqueues will queue new works to their frozen_works list instead of
				3769	* gcwq->worklist.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3770	*
				3771	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3772	* Grabs and releases workqueue_lock and gcwq->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3773	*/
				3774	void freeze_workqueues_begin(void)
				3775	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3776	unsigned int cpu;
				3777
				3778	spin_lock(&workqueue_lock);
				3779
				3780	BUG_ON(workqueue_freezing);
				3781	workqueue_freezing = true;
				3782
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3783	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3784	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3785	struct workqueue_struct *wq;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3786
				3787	spin_lock_irq(&gcwq->lock);
				3788
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3789	BUG_ON(gcwq->flags & GCWQ_FREEZING);
				3790	gcwq->flags \|= GCWQ_FREEZING;
				3791
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3792	list_for_each_entry(wq, &workqueues, list) {
				3793	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3794
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3795	if (cwq && wq->flags & WQ_FREEZABLE)
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3796	cwq->max_active = 0;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3797	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3798
				3799	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3800	}
				3801
				3802	spin_unlock(&workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3803	}
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3804
				3805	/**
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3806	* freeze_workqueues_busy - are freezable workqueues still busy?
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3807	*
				3808	* Check whether freezing is complete. This function must be called
				3809	* between freeze_workqueues_begin() and thaw_workqueues().
				3810	*
				3811	* CONTEXT:
				3812	* Grabs and releases workqueue_lock.
				3813	*
				3814	* RETURNS:
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3815	* %true if some freezable workqueues are still busy. %false if freezing
				3816	* is complete.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3817	*/
				3818	bool freeze_workqueues_busy(void)
				3819	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3820	unsigned int cpu;
				3821	bool busy = false;
				3822
				3823	spin_lock(&workqueue_lock);
				3824
				3825	BUG_ON(!workqueue_freezing);
				3826
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3827	for_each_gcwq_cpu(cpu) {
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3828	struct workqueue_struct *wq;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3829	/*
				3830	* nr_active is monotonically decreasing. It's safe
				3831	* to peek without lock.
				3832	*/
				3833	list_for_each_entry(wq, &workqueues, list) {
				3834	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3835
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3836	if (!cwq \|\| !(wq->flags & WQ_FREEZABLE))
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3837	continue;
				3838
				3839	BUG_ON(cwq->nr_active < 0);
				3840	if (cwq->nr_active) {
				3841	busy = true;
				3842	goto out_unlock;
				3843	}
				3844	}
				3845	}
				3846	out_unlock:
				3847	spin_unlock(&workqueue_lock);
				3848	return busy;
				3849	}
				3850
				3851	/**
				3852	* thaw_workqueues - thaw workqueues
				3853	*
				3854	* Thaw workqueues. Normal queueing is restored and all collected
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	3855	* frozen works are transferred to their respective gcwq worklists.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3856	*
				3857	* CONTEXT:
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3858	* Grabs and releases workqueue_lock and gcwq->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3859	*/
				3860	void thaw_workqueues(void)
				3861	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3862	unsigned int cpu;
				3863
				3864	spin_lock(&workqueue_lock);
				3865
				3866	if (!workqueue_freezing)
				3867	goto out_unlock;
				3868
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3869	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3870	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3871	struct worker_pool *pool;
Tejun Heo	bdbc5dd	2010-07-02 10:03:51 +0200	[diff] [blame]	3872	struct workqueue_struct *wq;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3873
				3874	spin_lock_irq(&gcwq->lock);
				3875
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3876	BUG_ON(!(gcwq->flags & GCWQ_FREEZING));
				3877	gcwq->flags &= ~GCWQ_FREEZING;
				3878
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3879	list_for_each_entry(wq, &workqueues, list) {
				3880	struct cpu_workqueue_struct *cwq = get_cwq(cpu, wq);
				3881
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	3882	if (!cwq \|\| !(wq->flags & WQ_FREEZABLE))
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3883	continue;
				3884
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3885	/* restore max_active and repopulate worklist */
				3886	cwq->max_active = wq->saved_max_active;
				3887
				3888	while (!list_empty(&cwq->delayed_works) &&
				3889	cwq->nr_active < cwq->max_active)
				3890	cwq_activate_first_delayed(cwq);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3891	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3892
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3893	for_each_worker_pool(pool, gcwq)
				3894	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3895
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3896	spin_unlock_irq(&gcwq->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3897	}
				3898
				3899	workqueue_freezing = false;
				3900	out_unlock:
				3901	spin_unlock(&workqueue_lock);
				3902	}
				3903	#endif /* CONFIG_FREEZER */
				3904
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3905	static int __init init_workqueues(void)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3906	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3907	unsigned int cpu;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3908	int i;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	3909
Tejun Heo	d3b4254	2012-07-17 12:39:26 -0700	[diff] [blame]	3910	cpu_notifier(workqueue_cpu_up_callback, CPU_PRI_WORKQUEUE_UP);
				3911	cpu_notifier(workqueue_cpu_down_callback, CPU_PRI_WORKQUEUE_DOWN);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3912
				3913	/* initialize gcwqs */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3914	for_each_gcwq_cpu(cpu) {
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3915	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3916	struct worker_pool *pool;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3917
				3918	spin_lock_init(&gcwq->lock);
				3919	gcwq->cpu = cpu;
Tejun Heo	477a3c3	2010-08-31 10:54:35 +0200	[diff] [blame]	3920	gcwq->flags \|= GCWQ_DISASSOCIATED;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3921
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	3922	for (i = 0; i < BUSY_WORKER_HASH_SIZE; i++)
				3923	INIT_HLIST_HEAD(&gcwq->busy_hash[i]);
				3924
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3925	for_each_worker_pool(pool, gcwq) {
				3926	pool->gcwq = gcwq;
				3927	INIT_LIST_HEAD(&pool->worklist);
				3928	INIT_LIST_HEAD(&pool->idle_list);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3929
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3930	init_timer_deferrable(&pool->idle_timer);
				3931	pool->idle_timer.function = idle_worker_timeout;
				3932	pool->idle_timer.data = (unsigned long)pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3933
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3934	setup_timer(&pool->mayday_timer, gcwq_mayday_timeout,
				3935	(unsigned long)pool);
				3936
				3937	ida_init(&pool->worker_ida);
				3938	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	3939
				3940	gcwq->trustee_state = TRUSTEE_DONE;
				3941	init_waitqueue_head(&gcwq->trustee_wait);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	3942	}
				3943
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3944	/* create the initial worker */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3945	for_each_online_gcwq_cpu(cpu) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3946	struct global_cwq *gcwq = get_gcwq(cpu);
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3947	struct worker_pool *pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3948
Tejun Heo	477a3c3	2010-08-31 10:54:35 +0200	[diff] [blame]	3949	if (cpu != WORK_CPU_UNBOUND)
				3950	gcwq->flags &= ~GCWQ_DISASSOCIATED;
Tejun Heo	9c6bae0	2012-07-13 22:16:44 -0700	[diff] [blame]	3951
				3952	for_each_worker_pool(pool, gcwq) {
				3953	struct worker *worker;
				3954
				3955	worker = create_worker(pool, true);
				3956	BUG_ON(!worker);
				3957	spin_lock_irq(&gcwq->lock);
				3958	start_worker(worker);
				3959	spin_unlock_irq(&gcwq->lock);
				3960	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3961	}
				3962
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3963	system_wq = alloc_workqueue("events", 0, 0);
				3964	system_long_wq = alloc_workqueue("events_long", 0, 0);
				3965	system_nrt_wq = alloc_workqueue("events_nrt", WQ_NON_REENTRANT, 0);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3966	system_unbound_wq = alloc_workqueue("events_unbound", WQ_UNBOUND,
				3967	WQ_UNBOUND_MAX_ACTIVE);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	3968	system_freezable_wq = alloc_workqueue("events_freezable",
				3969	WQ_FREEZABLE, 0);
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	3970	system_nrt_freezable_wq = alloc_workqueue("events_nrt_freezable",
				3971	WQ_NON_REENTRANT \| WQ_FREEZABLE, 0);
Hitoshi Mitake	e5cba24	2010-11-26 12:06:44 +0100	[diff] [blame]	3972	BUG_ON(!system_wq \|\| !system_long_wq \|\| !system_nrt_wq \|\|
Alan Stern	62d3c54	2012-03-02 10:51:00 +0100	[diff] [blame]	3973	!system_unbound_wq \|\| !system_freezable_wq \|\|
				3974	!system_nrt_freezable_wq);
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3975	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3976	}
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	3977	early_initcall(init_workqueues);