Blame - kernel/workqueue.c - android_kernel_oneplus_msm8996

blob: 147fc5a784f0eb4f806b7c708e8379b105052fd3 [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	2	* kernel/workqueue.c - generic async execution with shared worker pool
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	4	* Copyright (C) 2002 Ingo Molnar
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	5	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	6	* Derived from the taskqueue/keventd code by:
				7	* David Woodhouse <dwmw2@infradead.org>
				8	* Andrew Morton
				9	* Kai Petzke <wpp@marie.physik.tu-berlin.de>
				10	* Theodore Ts'o <tytso@mit.edu>
Christoph Lameter	89ada67	2005-10-30 15:01:59 -0800	[diff] [blame]	11	*
Christoph Lameter	cde5353	2008-07-04 09:59:22 -0700	[diff] [blame]	12	* Made to use alloc_percpu by Christoph Lameter.
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	13	*
				14	* Copyright (C) 2010 SUSE Linux Products GmbH
				15	* Copyright (C) 2010 Tejun Heo <tj@kernel.org>
				16	*
				17	* This is the generic async execution mechanism. Work items are
				18	* executed in process context. The worker pool is shared and
				19	* automatically managed. There is one worker pool for each CPU and
				20	* one extra for works which are better served by workers which are
				21	* not bound to any specific CPU.
				22	*
				23	* Please read Documentation/workqueue.txt for details.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	24	*/
				25
Paul Gortmaker	9984de1	2011-05-23 14:51:41 -0400	[diff] [blame]	26	#include <linux/export.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	27	#include <linux/kernel.h>
				28	#include <linux/sched.h>
				29	#include <linux/init.h>
				30	#include <linux/signal.h>
				31	#include <linux/completion.h>
				32	#include <linux/workqueue.h>
				33	#include <linux/slab.h>
				34	#include <linux/cpu.h>
				35	#include <linux/notifier.h>
				36	#include <linux/kthread.h>
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	37	#include <linux/hardirq.h>
Christoph Lameter	4693402	2006-10-11 01:21:26 -0700	[diff] [blame]	38	#include <linux/mempolicy.h>
Rafael J. Wysocki	341a595	2006-12-06 20:34:49 -0800	[diff] [blame]	39	#include <linux/freezer.h>
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	40	#include <linux/kallsyms.h>
				41	#include <linux/debug_locks.h>
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	42	#include <linux/lockdep.h>
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	43	#include <linux/idr.h>
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	44	#include <linux/jhash.h>
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	45	#include <linux/hashtable.h>
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	46	#include <linux/rculist.h>
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	47
Tejun Heo	ea13844	2013-01-18 14:05:55 -0800	[diff] [blame]	48	#include "workqueue_internal.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	49
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	50	enum {
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	51	/*
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	52	* worker_pool flags
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	53	*
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	54	* A bound pool is either associated or disassociated with its CPU.
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	55	* While associated (!DISASSOCIATED), all workers are bound to the
				56	* CPU and none has %WORKER_UNBOUND set and concurrency management
				57	* is in effect.
				58	*
				59	* While DISASSOCIATED, the cpu may be offline and all workers have
				60	* %WORKER_UNBOUND set and concurrency management disabled, and may
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	61	* be executing on any CPU. The pool behaves as an unbound one.
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	62	*
				63	* Note that DISASSOCIATED can be flipped only while holding
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	64	* assoc_mutex to avoid changing binding state while
				65	* create_worker() is in progress.
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	66	*/
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	67	POOL_MANAGE_WORKERS = 1 << 0, /* need to manage workers */
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	68	POOL_DISASSOCIATED = 1 << 2, /* cpu can't serve workers */
Tejun Heo	35b6bb6	2013-01-24 11:01:33 -0800	[diff] [blame]	69	POOL_FREEZING = 1 << 3, /* freeze in progress */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	70
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	71	/* worker flags */
				72	WORKER_STARTED = 1 << 0, /* started */
				73	WORKER_DIE = 1 << 1, /* die die die */
				74	WORKER_IDLE = 1 << 2, /* is idle */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	75	WORKER_PREP = 1 << 3, /* preparing to run works */
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	76	WORKER_CPU_INTENSIVE = 1 << 6, /* cpu intensive */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	77	WORKER_UNBOUND = 1 << 7, /* worker is unbound */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	78
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	79	WORKER_NOT_RUNNING = WORKER_PREP | WORKER_UNBOUND |
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	80	WORKER_CPU_INTENSIVE, /* mask of the three worker flags OR-ed together here */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	81
Tejun Heo	e34cdddb	2013-01-24 11:01:33 -0800	[diff] [blame]	82	NR_STD_WORKER_POOLS = 2, /* # standard pools per cpu */
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	83
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	84	UNBOUND_POOL_HASH_ORDER = 6, /* hashed by pool->attrs */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	85	BUSY_WORKER_HASH_ORDER = 6, /* 64 pointers */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	86
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	87	MAX_IDLE_WORKERS_RATIO = 4, /* 1/4 of busy can be idle */
				88	IDLE_WORKER_TIMEOUT = 300 * HZ, /* keep idle ones for 5 mins */
				89
Tejun Heo	3233cdb	2011-02-16 18:10:19 +0100	[diff] [blame]	90	MAYDAY_INITIAL_TIMEOUT = HZ / 100 >= 2 ? HZ / 100 : 2,
				91	/* call for help after 10ms
				92	(min two ticks) */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	93	MAYDAY_INTERVAL = HZ / 10, /* and then every 100ms */
				94	CREATE_COOLDOWN = HZ, /* time to breathe after fail */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	95
				96	/*
				97	* Rescue workers are used only on emergencies and shared by
				98	* all cpus. Give -20.
				99	*/
				100	RESCUER_NICE_LEVEL = -20,
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	101	HIGHPRI_NICE_LEVEL = -20, /* same nice value as the rescuers */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	102	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	103
				104	/*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	105	* Structure fields follow one of the following exclusion rules.
				106	*
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	107	* I: Modifiable by initialization/destruction paths and read-only for
				108	* everyone else.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	109	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	110	* P: Preemption protected. Disabling preemption is enough and should
				111	* only be modified and accessed from the local cpu.
				112	*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	113	* L: pool->lock protected. Access with pool->lock held.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	114	*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	115	* X: During normal operation, modification requires pool->lock and should
				116	* be done only from local cpu. Either disabling preemption on local
				117	* cpu or grabbing pool->lock is enough for read access. If
				118	* POOL_DISASSOCIATED is set, it's identical to L.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	119	*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	120	* F: wq->flush_mutex protected.
				121	*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	122	* W: workqueue_lock protected.
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	123	*
				124	* R: workqueue_lock protected for writes. Sched-RCU protected for reads.
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	125	*
				126	* FR: wq->flush_mutex and workqueue_lock protected for writes. Sched-RCU
				127	* protected for reads.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	128	*/
				129
Tejun Heo	2eaebdb	2013-01-18 14:05:55 -0800	[diff] [blame]	130	/* struct worker is defined in workqueue_internal.h */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	131
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	132	struct worker_pool {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	133	spinlock_t lock; /* the pool lock */
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	134	int cpu; /* I: the associated cpu */
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	135	int id; /* I: pool ID */
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	136	unsigned int flags; /* X: flags */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	137
				138	struct list_head worklist; /* L: list of pending works */
				139	int nr_workers; /* L: total number of workers */
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	140
				141	/* nr_idle includes the ones off idle_list for rebinding */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	142	int nr_idle; /* L: currently idle ones */
				143
				144	struct list_head idle_list; /* X: list of idle workers */
				145	struct timer_list idle_timer; /* L: worker idle timeout */
				146	struct timer_list mayday_timer; /* L: SOS timer for workers */
				147
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	148	/* a worker is either on busy_hash or idle_list, or the manager */
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	149	DECLARE_HASHTABLE(busy_hash, BUSY_WORKER_HASH_ORDER);
				150	/* L: hash of busy workers */
				151
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	152	struct mutex manager_arb; /* manager arbitration */
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	153	struct mutex assoc_mutex; /* protect POOL_DISASSOCIATED */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	154	struct ida worker_ida; /* L: for worker IDs */
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	155
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	156	struct workqueue_attrs *attrs; /* I: worker attributes */
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	157	struct hlist_node hash_node; /* W: unbound_pool_hash node */
				158	int refcnt; /* W: refcnt for unbound pools */
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	159
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	160	/*
				161	* The current concurrency level. As it's likely to be accessed
				162	* from other CPUs during try_to_wake_up(), put it in a separate
				163	* cacheline.
				164	*/
				165	atomic_t nr_running ____cacheline_aligned_in_smp;
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	166
				167	/*
				168	* Destruction of pool is sched-RCU protected to allow dereferences
				169	* from get_work_pool().
				170	*/
				171	struct rcu_head rcu;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	172	} ____cacheline_aligned_in_smp;
				173
				174	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	175	* The per-pool workqueue. While queued, the lower WORK_STRUCT_FLAG_BITS
				176	* of work_struct->data are used for flags and the remaining high bits
				177	* point to the pwq; thus, pwqs need to be aligned at two's power of the
				178	* number of flag bits.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	179	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	180	struct pool_workqueue {
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	181	struct worker_pool *pool; /* I: the associated pool */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	182	struct workqueue_struct *wq; /* I: the owning workqueue */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	183	int work_color; /* L: current color */
				184	int flush_color; /* L: flushing color */
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	185	int refcnt; /* L: reference count */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	186	int nr_in_flight[WORK_NR_COLORS];
				187	/* L: nr of in_flight works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	188	int nr_active; /* L: nr of active works */
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	189	int max_active; /* L: max active works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	190	struct list_head delayed_works; /* L: delayed works */
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	191	struct list_head pwqs_node; /* FR: node on wq->pwqs */
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	192	struct list_head mayday_node; /* W: node on wq->maydays */
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	193
				194	/*
				195	* Release of unbound pwq is punted to system_wq. See put_pwq()
				196	* and pwq_unbound_release_workfn() for details. pool_workqueue
				197	* itself is also sched-RCU protected so that the first pwq can be
				198	* determined without grabbing workqueue_lock.
				199	*/
				200	struct work_struct unbound_release_work;
				201	struct rcu_head rcu;
Tejun Heo	e904e6c	2013-03-12 11:29:57 -0700	[diff] [blame]	202	} __aligned(1 << WORK_STRUCT_FLAG_BITS); /* alignment keeps the low flag bits of a pwq pointer zero */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	203
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	204	/*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	205	* Structure used to wait for workqueue flush. Fields marked F: are protected by wq->flush_mutex.
				206	*/
				207	struct wq_flusher {
				208	struct list_head list; /* F: list of flushers */
				209	int flush_color; /* F: flush color waiting for */
				210	struct completion done; /* flush completion */
				211	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	212
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	213	struct wq_device; /* forward declaration only; no definition appears in this part of the file */
				214
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	215	/*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	216	* The externally visible workqueue. It relays the issued work items to
				217	* the appropriate worker_pool through its pool_workqueues.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	218	*/
				219	struct workqueue_struct {
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	220	unsigned int flags; /* W: WQ_* flags */
Tejun Heo	420c0dd	2013-03-12 11:29:59 -0700	[diff] [blame]	221	struct pool_workqueue __percpu *cpu_pwqs; /* I: per-cpu pwq's */
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	222	struct list_head pwqs; /* FR: all pwqs of this wq */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	223	struct list_head list; /* W: list of all workqueues */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	224
				225	struct mutex flush_mutex; /* protects wq flushing */
				226	int work_color; /* F: current work color */
				227	int flush_color; /* F: current flush color */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	228	atomic_t nr_pwqs_to_flush; /* flush in progress */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	229	struct wq_flusher *first_flusher; /* F: first flusher */
				230	struct list_head flusher_queue; /* F: flush waiters */
				231	struct list_head flusher_overflow; /* F: flush overflow list */
				232
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	233	struct list_head maydays; /* W: pwqs requesting rescue */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	234	struct worker *rescuer; /* I: rescue worker */
				235
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	236	int nr_drainers; /* W: drain in progress */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	237	int saved_max_active; /* W: saved pwq max_active */
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	238
				239	#ifdef CONFIG_SYSFS
				240	struct wq_device *wq_dev; /* I: for sysfs interface */
				241	#endif
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	242	#ifdef CONFIG_LOCKDEP
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	243	struct lockdep_map lockdep_map;
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	244	#endif
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	245	char name[]; /* I: workqueue name (flexible array, must stay the last member) */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	246	};
				247
Tejun Heo	e904e6c	2013-03-12 11:29:57 -0700	[diff] [blame]	248	static struct kmem_cache *pwq_cache; /* NOTE(review): presumably the slab cache for pool_workqueues - confirm where it is created */
				249
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	250	/* W: hash of all unbound pools keyed by pool->attrs */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	251	static DEFINE_HASHTABLE(unbound_pool_hash, UNBOUND_POOL_HASH_ORDER);
				252
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	253	/* I: attributes used when instantiating standard unbound pools on demand */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	254	static struct workqueue_attrs *unbound_std_wq_attrs[NR_STD_WORKER_POOLS];
				255
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	256	struct workqueue_struct *system_wq __read_mostly; /* this and the system_* pointers below are exported to GPL modules */
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	257	EXPORT_SYMBOL_GPL(system_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	258	struct workqueue_struct *system_highpri_wq __read_mostly;
Joonsoo Kim	1aabe90	2012-08-15 23:25:39 +0900	[diff] [blame]	259	EXPORT_SYMBOL_GPL(system_highpri_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	260	struct workqueue_struct *system_long_wq __read_mostly;
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	261	EXPORT_SYMBOL_GPL(system_long_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	262	struct workqueue_struct *system_unbound_wq __read_mostly;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	263	EXPORT_SYMBOL_GPL(system_unbound_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	264	struct workqueue_struct *system_freezable_wq __read_mostly;
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	265	EXPORT_SYMBOL_GPL(system_freezable_wq);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	266
Tejun Heo	97bd234	2010-10-05 10:41:14 +0200	[diff] [blame]	267	#define CREATE_TRACE_POINTS
				268	#include <trace/events/workqueue.h>
				269
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	270	#define assert_rcu_or_wq_lock() \
				271	rcu_lockdep_assert(rcu_read_lock_sched_held() || \
				272	lockdep_is_held(&workqueue_lock), \
				273	"sched RCU or workqueue lock should be held") /* lockdep check: sched-RCU read side or workqueue_lock must be held */
				274
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	275	#define for_each_cpu_worker_pool(pool, cpu) \
				276	for ((pool) = &per_cpu(cpu_worker_pools, cpu)[0]; \
				277	(pool) < &per_cpu(cpu_worker_pools, cpu)[NR_STD_WORKER_POOLS]; \
Tejun Heo	7a62c2c	2013-03-12 11:30:03 -0700	[diff] [blame]	278	(pool)++) /* walks the NR_STD_WORKER_POOLS entries of @cpu's cpu_worker_pools array in index order */
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	279
Sasha Levin	b67bfe0	2013-02-27 17:06:00 -0800	[diff] [blame]	280	#define for_each_busy_worker(worker, i, pool) \
				281	hash_for_each((pool)->busy_hash, i, worker, hentry) /* visits every worker in @pool's busy_hash, linked through ->hentry; @i is the bucket cursor */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	282
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	283	/**
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	284	* for_each_pool - iterate through all worker_pools registered in worker_pool_idr
				285	* @pool: iteration cursor
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame^]	286	* @pi: integer used for iteration (passed as the id argument of idr_for_each_entry())
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	287	*
				288	* This must be called either with workqueue_lock held or sched RCU read
				289	* locked. If the pool needs to be used beyond the locking in effect, the
				290	* caller is responsible for guaranteeing that the pool stays online.
				291	*
				292	* The if/else clause exists only for the lockdep assertion and can be
				293	* ignored; the loop body supplied by the caller becomes the else branch.
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	294	*/
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame^]	295	#define for_each_pool(pool, pi) \
				296	idr_for_each_entry(&worker_pool_idr, pool, pi) \
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	297	if (({ assert_rcu_or_wq_lock(); false; })) { } \
				298	else
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	299
				300	/**
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	301	* for_each_pwq - iterate through all pool_workqueues of the specified workqueue
				302	* @pwq: iteration cursor
				303	* @wq: the target workqueue; its ->pwqs list is walked through the pwqs_node member
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	304	*
				305	* This must be called either with workqueue_lock held or sched RCU read
				306	* locked. If the pwq needs to be used beyond the locking in effect, the
				307	* caller is responsible for guaranteeing that the pwq stays online.
				308	*
				309	* The if/else clause exists only for the lockdep assertion and can be
				310	* ignored; the loop body supplied by the caller becomes the else branch.
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	311	*/
				312	#define for_each_pwq(pwq, wq) \
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	313	list_for_each_entry_rcu((pwq), &(wq)->pwqs, pwqs_node) \
				314	if (({ assert_rcu_or_wq_lock(); false; })) { } \
				315	else
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	316
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	317	#ifdef CONFIG_DEBUG_OBJECTS_WORK
				318
				319	static struct debug_obj_descr work_debug_descr; /* tentative declaration; initialized after the fixup callbacks that reference it */
				320
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	321	static void *work_debug_hint(void *addr)
				322	{
				323	return ((struct work_struct *) addr)->func; /* the hint for a work item at @addr is its callback pointer */
				324	}
				325
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	326	/*
				327	* fixup_init is called when:
				328	* - an active object is initialized
				329	*/
				330	static int work_fixup_init(void *addr, enum debug_obj_state state)
				331	{
				332	struct work_struct *work = addr;
				333
				334	switch (state) {
				335	case ODEBUG_STATE_ACTIVE:
				336	cancel_work_sync(work); /* cancel the still-active work before re-initializing its debug object */
				337	debug_object_init(work, &work_debug_descr);
				338	return 1; /* a fixup was performed */
				339	default:
				340	return 0; /* nothing to fix for any other state */
				341	}
				342	}
				343
				344	/*
				345	* fixup_activate is called when:
				346	* - an active object is activated
				347	* - an unknown object is activated (might be a statically initialized object)
				348	*/
				349	static int work_fixup_activate(void *addr, enum debug_obj_state state)
				350	{
				351	struct work_struct *work = addr;
				352
				353	switch (state) {
				354
				355	case ODEBUG_STATE_NOTAVAILABLE:
				356	/*
				357	* This is not really a fixup. The work struct was
				358	* statically initialized. We just make sure that it
				359	* is tracked in the object tracker.
				360	*/
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	361	if (test_bit(WORK_STRUCT_STATIC_BIT, work_data_bits(work))) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	362	debug_object_init(work, &work_debug_descr);
				363	debug_object_activate(work, &work_debug_descr);
				364	return 0;
				365	}
				366	WARN_ON_ONCE(1); /* untracked and the STATIC bit is not set: warn once */
				367	return 0;
				368
				369	case ODEBUG_STATE_ACTIVE:
				370	WARN_ON(1); /* activating an already-active work: warn, then fall through */
				371
				372	default:
				373	return 0; /* every path of this callback returns 0 */
				374	}
				375	}
				376
				377	/*
				378	* fixup_free is called when:
				379	* - an active object is freed
				380	*/
				381	static int work_fixup_free(void *addr, enum debug_obj_state state)
				382	{
				383	struct work_struct *work = addr;
				384
				385	switch (state) {
				386	case ODEBUG_STATE_ACTIVE:
				387	cancel_work_sync(work); /* cancel the still-active work before dropping its debug object */
				388	debug_object_free(work, &work_debug_descr);
				389	return 1; /* a fixup was performed */
				390	default:
				391	return 0; /* nothing to fix for any other state */
				392	}
				393	}
				394
				395	static struct debug_obj_descr work_debug_descr = { /* debugobjects descriptor wiring up the work_struct callbacks defined above */
				396	.name = "work_struct",
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	397	.debug_hint = work_debug_hint,
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	398	.fixup_init = work_fixup_init,
				399	.fixup_activate = work_fixup_activate,
				400	.fixup_free = work_fixup_free,
				401	};
				402
				403	static inline void debug_work_activate(struct work_struct *work)
				404	{
				405	debug_object_activate(work, &work_debug_descr); /* report @work to debugobjects as activated */
				406	}
				407
				408	static inline void debug_work_deactivate(struct work_struct *work)
				409	{
				410	debug_object_deactivate(work, &work_debug_descr); /* report @work to debugobjects as deactivated */
				411	}
				412
				413	void __init_work(struct work_struct *work, int onstack)
				414	{
				415	if (onstack) /* non-zero @onstack selects the on-stack variant of debug object init */
				416	debug_object_init_on_stack(work, &work_debug_descr);
				417	else
				418	debug_object_init(work, &work_debug_descr);
				419	}
				420	EXPORT_SYMBOL_GPL(__init_work);
				421
				422	void destroy_work_on_stack(struct work_struct *work)
				423	{
				424	debug_object_free(work, &work_debug_descr); /* drop the debug object tracking @work */
				425	}
				426	EXPORT_SYMBOL_GPL(destroy_work_on_stack);
				427
				428	#else
				429	static inline void debug_work_activate(struct work_struct *work) { } /* no-op when CONFIG_DEBUG_OBJECTS_WORK is not set */
				430	static inline void debug_work_deactivate(struct work_struct *work) { } /* no-op when CONFIG_DEBUG_OBJECTS_WORK is not set */
				431	#endif
				432
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	433	/* Serializes the accesses to the list of workqueues. */
				434	static DEFINE_SPINLOCK(workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	435	static LIST_HEAD(workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	436	static bool workqueue_freezing; /* W: have wqs started freezing? */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	437
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	438	/* the per-cpu worker pools: an array of NR_STD_WORKER_POOLS pools for each CPU */
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	439	static DEFINE_PER_CPU_SHARED_ALIGNED(struct worker_pool [NR_STD_WORKER_POOLS],
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	440	cpu_worker_pools);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	441
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	442	/*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	443	* R: idr of all pools. Modifications are protected by workqueue_lock.
				444	* Read accesses are protected by sched-RCU.
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	445	*/
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	446	static DEFINE_IDR(worker_pool_idr);
				447
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	448	static int worker_thread(void *__worker); /* forward declaration */
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	449	static void copy_workqueue_attrs(struct workqueue_attrs *to,
				450	const struct workqueue_attrs *from); /* forward declaration */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	451
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	452	/* allocate ID and assign it to @pool; returns -ENOMEM if idr preallocation fails, otherwise the final idr_get_new() result */
				453	static int worker_pool_assign_id(struct worker_pool *pool)
				454	{
				455	int ret;
				456
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	457	do {
				458	if (!idr_pre_get(&worker_pool_idr, GFP_KERNEL)) /* preallocate before taking the spinlock */
				459	return -ENOMEM;
				460
				461	spin_lock_irq(&workqueue_lock);
				462	ret = idr_get_new(&worker_pool_idr, pool, &pool->id); /* the new ID is written straight into pool->id */
				463	spin_unlock_irq(&workqueue_lock);
				464	} while (ret == -EAGAIN); /* redo the preallocate + allocate sequence on -EAGAIN */
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	465
				466	return ret;
				467	}
				468
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	469	/**
				470	* first_pwq - return the first pool_workqueue of the specified workqueue
				471	* @wq: the target workqueue
				472	*
				473	* This must be called either with workqueue_lock held or sched RCU read
				474	* locked. If the pwq needs to be used beyond the locking in effect, the
				475	* caller is responsible for guaranteeing that the pwq stays online.
				476	*/
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	477	static struct pool_workqueue *first_pwq(struct workqueue_struct *wq)
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	478	{
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	479	assert_rcu_or_wq_lock();
				480	return list_first_or_null_rcu(&wq->pwqs, struct pool_workqueue,
				481	pwqs_node); /* first entry of wq->pwqs, or NULL when the list is empty */
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	482	}
				483
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	484	static unsigned int work_color_to_flags(int color)
				485	{
				486	return color << WORK_STRUCT_COLOR_SHIFT; /* position @color at the bit offset get_work_color() reads it back from */
				487	}
				488
				489	static int get_work_color(struct work_struct *work)
				490	{
				491	return (*work_data_bits(work) >> WORK_STRUCT_COLOR_SHIFT) &
				492	((1 << WORK_STRUCT_COLOR_BITS) - 1); /* shift down and mask to the WORK_STRUCT_COLOR_BITS-wide color field */
				493	}
				494
				495	static int work_next_color(int color)
				496	{
				497	return (color + 1) % WORK_NR_COLORS; /* colors wrap around to 0 after WORK_NR_COLORS - 1 */
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	498	}
				499
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	500	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	501	* While queued, %WORK_STRUCT_PWQ is set and non flag bits of a work's data
				502	* contain the pointer to the queued pwq. Once execution starts, the flag
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	503	* is cleared and the high bits contain OFFQ flags and pool ID.
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	504	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	505	* set_work_pwq(), set_work_pool_and_clear_pending(), mark_work_canceling()
				506	* and clear_work_data() can be used to set the pwq, pool or clear
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	507	* work->data. These functions should only be called while the work is
				508	* owned - ie. while the PENDING bit is set.
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	509	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	510	* get_work_pool() and get_work_pwq() can be used to obtain the pool or pwq
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	511	* corresponding to a work. Pool is available once the work has been
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	512	* queued anywhere after initialization until it is sync canceled. pwq is
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	513	* available only while the work item is queued.
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	514	*
				515	* %WORK_OFFQ_CANCELING is used to mark a work item which is being
				516	* canceled. While being canceled, a work item may have its PENDING set
				517	* but stay off timer and worklist for arbitrarily long and nobody should
				518	* try to steal the PENDING bit.
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	519	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	520	static inline void set_work_data(struct work_struct *work, unsigned long data,
				521	unsigned long flags)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	522	{
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	523	WARN_ON_ONCE(!work_pending(work)); /* callers are expected to own @work, i.e. PENDING is set */
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	524	atomic_long_set(&work->data, data | flags | work_static(work)); /* overwrite work->data with @data and @flags, OR-ing in work_static(work) */
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	525	}
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	526
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	527	static void set_work_pwq(struct work_struct work, struct pool_workqueue pwq,
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	528	unsigned long extra_flags)
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	529	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	530	set_work_data(work, (unsigned long)pwq,
				531	WORK_STRUCT_PENDING \| WORK_STRUCT_PWQ \| extra_flags);
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	532	}
				533
Lai Jiangshan	4468a00	2013-02-06 18:04:53 -0800	[diff] [blame]	534	static void set_work_pool_and_keep_pending(struct work_struct *work,
				535	int pool_id)
				536	{
				537	set_work_data(work, (unsigned long)pool_id << WORK_OFFQ_POOL_SHIFT,
				538	WORK_STRUCT_PENDING);
				539	}
				540
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	541	static void set_work_pool_and_clear_pending(struct work_struct *work,
				542	int pool_id)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	543	{
Tejun Heo	23657bb	2012-08-13 17:08:19 -0700	[diff] [blame]	544	/*
				545	* The following wmb is paired with the implied mb in
				546	* test_and_set_bit(PENDING) and ensures all updates to @work made
				547	* here are visible to and precede any updates by the next PENDING
				548	* owner.
				549	*/
				550	smp_wmb();
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	551	set_work_data(work, (unsigned long)pool_id << WORK_OFFQ_POOL_SHIFT, 0);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	552	}
				553
				554	static void clear_work_data(struct work_struct *work)
				555	{
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	556	smp_wmb(); /* see set_work_pool_and_clear_pending() */
				557	set_work_data(work, WORK_STRUCT_NO_POOL, 0);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	558	}
				559
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	560	static struct pool_workqueue get_work_pwq(struct work_struct work)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	561	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	562	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	563
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	564	if (data & WORK_STRUCT_PWQ)
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	565	return (void *)(data & WORK_STRUCT_WQ_DATA_MASK);
				566	else
				567	return NULL;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	568	}
				569
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	570	/**
				571	* get_work_pool - return the worker_pool a given work was associated with
				572	* @work: the work item of interest
				573	*
				574	* Return the worker_pool @work was last associated with. %NULL if none.
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	575	*
				576	* Pools are created and destroyed under workqueue_lock, and allows read
				577	* access under sched-RCU read lock. As such, this function should be
				578	* called under workqueue_lock or with preemption disabled.
				579	*
				580	* All fields of the returned pool are accessible as long as the above
				581	* mentioned locking is in effect. If the returned pool needs to be used
				582	* beyond the critical section, the caller is responsible for ensuring the
				583	* returned pool is and stays online.
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	584	*/
				585	static struct worker_pool get_work_pool(struct work_struct work)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	586	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	587	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	588	int pool_id;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	589
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	590	assert_rcu_or_wq_lock();
				591
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	592	if (data & WORK_STRUCT_PWQ)
				593	return ((struct pool_workqueue *)
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	594	(data & WORK_STRUCT_WQ_DATA_MASK))->pool;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	595
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	596	pool_id = data >> WORK_OFFQ_POOL_SHIFT;
				597	if (pool_id == WORK_OFFQ_POOL_NONE)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	598	return NULL;
				599
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	600	return idr_find(&worker_pool_idr, pool_id);
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	601	}
				602
				603	/**
				604	* get_work_pool_id - return the worker pool ID a given work is associated with
				605	* @work: the work item of interest
				606	*
				607	* Return the worker_pool ID @work was last associated with.
				608	* %WORK_OFFQ_POOL_NONE if none.
				609	*/
				610	static int get_work_pool_id(struct work_struct *work)
				611	{
Lai Jiangshan	54d5b7d	2013-02-07 13:14:20 -0800	[diff] [blame]	612	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	613
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	614	if (data & WORK_STRUCT_PWQ)
				615	return ((struct pool_workqueue *)
Lai Jiangshan	54d5b7d	2013-02-07 13:14:20 -0800	[diff] [blame]	616	(data & WORK_STRUCT_WQ_DATA_MASK))->pool->id;
				617
				618	return data >> WORK_OFFQ_POOL_SHIFT;
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	619	}
				620
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	621	static void mark_work_canceling(struct work_struct *work)
				622	{
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	623	unsigned long pool_id = get_work_pool_id(work);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	624
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	625	pool_id <<= WORK_OFFQ_POOL_SHIFT;
				626	set_work_data(work, pool_id \| WORK_OFFQ_CANCELING, WORK_STRUCT_PENDING);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	627	}
				628
				629	static bool work_is_canceling(struct work_struct *work)
				630	{
				631	unsigned long data = atomic_long_read(&work->data);
				632
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	633	return !(data & WORK_STRUCT_PWQ) && (data & WORK_OFFQ_CANCELING);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	634	}
				635
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	636	/*
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	637	* Policy functions. These define the policies on how the global worker
				638	* pools are managed. Unless noted otherwise, these functions assume that
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	639	* they're being called with pool->lock held.
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	640	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	641
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	642	static bool __need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	643	{
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	644	return !atomic_read(&pool->nr_running);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	645	}
				646
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	647	/*
				648	* Need to wake up a worker? Called from anything but currently
				649	* running workers.
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	650	*
				651	* Note that, because unbound workers never contribute to nr_running, this
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	652	* function will always return %true for unbound pools as long as the
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	653	* worklist isn't empty.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	654	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	655	static bool need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	656	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	657	return !list_empty(&pool->worklist) && __need_more_worker(pool);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	658	}
				659
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	660	/* Can I start working? Called from busy but !running workers. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	661	static bool may_start_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	662	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	663	return pool->nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	664	}
				665
				666	/* Do I need to keep working? Called from currently running workers. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	667	static bool keep_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	668	{
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	669	return !list_empty(&pool->worklist) &&
				670	atomic_read(&pool->nr_running) <= 1;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	671	}
				672
				673	/* Do we need a new worker? Called from manager. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	674	static bool need_to_create_worker(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	675	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	676	return need_more_worker(pool) && !may_start_working(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	677	}
				678
				679	/* Do I need to be the manager? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	680	static bool need_to_manage_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	681	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	682	return need_to_create_worker(pool) \|\|
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	683	(pool->flags & POOL_MANAGE_WORKERS);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	684	}
				685
				686	/* Do we have too many workers and should some go away? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	687	static bool too_many_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	688	{
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	689	bool managing = mutex_is_locked(&pool->manager_arb);
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	690	int nr_idle = pool->nr_idle + managing; /* manager is considered idle */
				691	int nr_busy = pool->nr_workers - nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	692
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	693	/*
				694	* nr_idle and idle_list may disagree if idle rebinding is in
				695	* progress. Never return %true if idle_list is empty.
				696	*/
				697	if (list_empty(&pool->idle_list))
				698	return false;
				699
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	700	return nr_idle > 2 && (nr_idle - 2) * MAX_IDLE_WORKERS_RATIO >= nr_busy;
				701	}
				702
				703	/*
				704	* Wake up functions.
				705	*/
				706
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	707	/* Return the first worker. Safe with preemption disabled */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	708	static struct worker first_worker(struct worker_pool pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	709	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	710	if (unlikely(list_empty(&pool->idle_list)))
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	711	return NULL;
				712
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	713	return list_first_entry(&pool->idle_list, struct worker, entry);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	714	}
				715
				716	/**
				717	* wake_up_worker - wake up an idle worker
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	718	* @pool: worker pool to wake worker from
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	719	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	720	* Wake up the first idle worker of @pool.
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	721	*
				722	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	723	* spin_lock_irq(pool->lock).
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	724	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	725	static void wake_up_worker(struct worker_pool *pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	726	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	727	struct worker *worker = first_worker(pool);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	728
				729	if (likely(worker))
				730	wake_up_process(worker->task);
				731	}
				732
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	733	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	734	* wq_worker_waking_up - a worker is waking up
				735	* @task: task waking up
				736	* @cpu: CPU @task is waking up to
				737	*
				738	* This function is called during try_to_wake_up() when a worker is
				739	* being awoken.
				740	*
				741	* CONTEXT:
				742	* spin_lock_irq(rq->lock)
				743	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	744	void wq_worker_waking_up(struct task_struct *task, int cpu)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	745	{
				746	struct worker *worker = kthread_data(task);
				747
Joonsoo Kim	3657600	2012-10-26 23:03:49 +0900	[diff] [blame]	748	if (!(worker->flags & WORKER_NOT_RUNNING)) {
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	749	WARN_ON_ONCE(worker->pool->cpu != cpu);
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	750	atomic_inc(&worker->pool->nr_running);
Joonsoo Kim	3657600	2012-10-26 23:03:49 +0900	[diff] [blame]	751	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	752	}
				753
				754	/**
				755	* wq_worker_sleeping - a worker is going to sleep
				756	* @task: task going to sleep
				757	* @cpu: CPU in question, must be the current CPU number
				758	*
				759	* This function is called during schedule() when a busy worker is
				760	* going to sleep. Worker on the same cpu can be woken up by
				761	* returning pointer to its task.
				762	*
				763	* CONTEXT:
				764	* spin_lock_irq(rq->lock)
				765	*
				766	* RETURNS:
				767	* Worker task on @cpu to wake up, %NULL if none.
				768	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	769	struct task_struct wq_worker_sleeping(struct task_struct task, int cpu)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	770	{
				771	struct worker worker = kthread_data(task), to_wakeup = NULL;
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	772	struct worker_pool *pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	773
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	774	/*
				775	* Rescuers, which may not have all the fields set up like normal
				776	* workers, also reach here, let's not access anything before
				777	* checking NOT_RUNNING.
				778	*/
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	779	if (worker->flags & WORKER_NOT_RUNNING)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	780	return NULL;
				781
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	782	pool = worker->pool;
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	783
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	784	/* this can only happen on the local cpu */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	785	if (WARN_ON_ONCE(cpu != raw_smp_processor_id()))
				786	return NULL;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	787
				788	/*
				789	* The counterpart of the following dec_and_test, implied mb,
				790	* worklist not empty test sequence is in insert_work().
				791	* Please read comment there.
				792	*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	793	* NOT_RUNNING is clear. This means that we're bound to and
				794	* running on the local cpu w/ rq lock held and preemption
				795	* disabled, which in turn means that none else could be
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	796	* manipulating idle_list, so dereferencing idle_list without pool
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	797	* lock is safe.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	798	*/
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	799	if (atomic_dec_and_test(&pool->nr_running) &&
				800	!list_empty(&pool->worklist))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	801	to_wakeup = first_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	802	return to_wakeup ? to_wakeup->task : NULL;
				803	}
				804
				805	/**
				806	* worker_set_flags - set worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	807	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	808	* @flags: flags to set
				809	* @wakeup: wakeup an idle worker if necessary
				810	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	811	* Set @flags in @worker->flags and adjust nr_running accordingly. If
				812	* nr_running becomes zero and @wakeup is %true, an idle worker is
				813	* woken up.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	814	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	815	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	816	* spin_lock_irq(pool->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	817	*/
				818	static inline void worker_set_flags(struct worker *worker, unsigned int flags,
				819	bool wakeup)
				820	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	821	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	822
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	823	WARN_ON_ONCE(worker->task != current);
				824
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	825	/*
				826	* If transitioning into NOT_RUNNING, adjust nr_running and
				827	* wake up an idle worker as necessary if requested by
				828	* @wakeup.
				829	*/
				830	if ((flags & WORKER_NOT_RUNNING) &&
				831	!(worker->flags & WORKER_NOT_RUNNING)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	832	if (wakeup) {
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	833	if (atomic_dec_and_test(&pool->nr_running) &&
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	834	!list_empty(&pool->worklist))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	835	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	836	} else
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	837	atomic_dec(&pool->nr_running);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	838	}
				839
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	840	worker->flags \|= flags;
				841	}
				842
				843	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	844	* worker_clr_flags - clear worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	845	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	846	* @flags: flags to clear
				847	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	848	* Clear @flags in @worker->flags and adjust nr_running accordingly.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	849	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	850	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	851	* spin_lock_irq(pool->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	852	*/
				853	static inline void worker_clr_flags(struct worker *worker, unsigned int flags)
				854	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	855	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	856	unsigned int oflags = worker->flags;
				857
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	858	WARN_ON_ONCE(worker->task != current);
				859
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	860	worker->flags &= ~flags;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	861
Tejun Heo	42c025f	2011-01-11 15:58:49 +0100	[diff] [blame]	862	/*
				863	* If transitioning out of NOT_RUNNING, increment nr_running. Note
				864	* that the nested NOT_RUNNING is not a noop. NOT_RUNNING is mask
				865	* of multiple flags, not a single flag.
				866	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	867	if ((flags & WORKER_NOT_RUNNING) && (oflags & WORKER_NOT_RUNNING))
				868	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	869	atomic_inc(&pool->nr_running);
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	870	}
				871
				872	/**
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	873	* find_worker_executing_work - find worker which is executing a work
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	874	* @pool: pool of interest
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	875	* @work: work to find worker for
				876	*
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	877	* Find a worker which is executing @work on @pool by searching
				878	* @pool->busy_hash which is keyed by the address of @work. For a worker
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	879	* to match, its current execution should match the address of @work and
				880	* its work function. This is to avoid unwanted dependency between
				881	* unrelated work executions through a work item being recycled while still
				882	* being executed.
				883	*
				884	* This is a bit tricky. A work item may be freed once its execution
				885	* starts and nothing prevents the freed area from being recycled for
				886	* another work item. If the same work item address ends up being reused
				887	* before the original execution finishes, workqueue will identify the
				888	* recycled work item as currently executing and make it wait until the
				889	* current execution finishes, introducing an unwanted dependency.
				890	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	891	* This function checks the work item address and work function to avoid
				892	* false positives. Note that this isn't complete as one may construct a
				893	* work function which can introduce dependency onto itself through a
				894	* recycled work item. Well, if somebody wants to shoot oneself in the
				895	* foot that badly, there's only so much we can do, and if such deadlock
				896	* actually occurs, it should be easy to locate the culprit work function.
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	897	*
				898	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	899	* spin_lock_irq(pool->lock).
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	900	*
				901	* RETURNS:
				902	* Pointer to worker which is executing @work if found, NULL
				903	* otherwise.
				904	*/
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	905	static struct worker find_worker_executing_work(struct worker_pool pool,
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	906	struct work_struct *work)
				907	{
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	908	struct worker *worker;
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	909
Sasha Levin	b67bfe0	2013-02-27 17:06:00 -0800	[diff] [blame]	910	hash_for_each_possible(pool->busy_hash, worker, hentry,
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	911	(unsigned long)work)
				912	if (worker->current_work == work &&
				913	worker->current_func == work->func)
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	914	return worker;
				915
				916	return NULL;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	917	}
				918
				919	/**
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	920	* move_linked_works - move linked works to a list
				921	* @work: start of series of works to be scheduled
				922	* @head: target list to append @work to
				923	* @nextp: out paramter for nested worklist walking
				924	*
				925	* Schedule linked works starting from @work to @head. Work series to
				926	* be scheduled starts at @work and includes any consecutive work with
				927	* WORK_STRUCT_LINKED set in its predecessor.
				928	*
				929	* If @nextp is not NULL, it's updated to point to the next work of
				930	* the last scheduled work. This allows move_linked_works() to be
				931	* nested inside outer list_for_each_entry_safe().
				932	*
				933	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	934	* spin_lock_irq(pool->lock).
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	935	*/
				936	static void move_linked_works(struct work_struct work, struct list_head head,
				937	struct work_struct **nextp)
				938	{
				939	struct work_struct *n;
				940
				941	/*
				942	* Linked worklist will always end before the end of the list,
				943	* use NULL for list head.
				944	*/
				945	list_for_each_entry_safe_from(work, n, NULL, entry) {
				946	list_move_tail(&work->entry, head);
				947	if (!(*work_data_bits(work) & WORK_STRUCT_LINKED))
				948	break;
				949	}
				950
				951	/*
				952	* If we're already inside safe list traversal and have moved
				953	* multiple works to the scheduled queue, the next position
				954	* needs to be updated.
				955	*/
				956	if (nextp)
				957	*nextp = n;
				958	}
				959
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	960	/**
				961	* get_pwq - get an extra reference on the specified pool_workqueue
				962	* @pwq: pool_workqueue to get
				963	*
				964	* Obtain an extra reference on @pwq. The caller should guarantee that
				965	* @pwq has positive refcnt and be holding the matching pool->lock.
				966	*/
				967	static void get_pwq(struct pool_workqueue *pwq)
				968	{
				969	lockdep_assert_held(&pwq->pool->lock);
				970	WARN_ON_ONCE(pwq->refcnt <= 0);
				971	pwq->refcnt++;
				972	}
				973
				974	/**
				975	* put_pwq - put a pool_workqueue reference
				976	* @pwq: pool_workqueue to put
				977	*
				978	* Drop a reference of @pwq. If its refcnt reaches zero, schedule its
				979	* destruction. The caller should be holding the matching pool->lock.
				980	*/
				981	static void put_pwq(struct pool_workqueue *pwq)
				982	{
				983	lockdep_assert_held(&pwq->pool->lock);
				984	if (likely(--pwq->refcnt))
				985	return;
				986	if (WARN_ON_ONCE(!(pwq->wq->flags & WQ_UNBOUND)))
				987	return;
				988	/*
				989	* @pwq can't be released under pool->lock, bounce to
				990	* pwq_unbound_release_workfn(). This never recurses on the same
				991	* pool->lock as this path is taken only for unbound workqueues and
				992	* the release work item is scheduled on a per-cpu workqueue. To
				993	* avoid lockdep warning, unbound pool->locks are given lockdep
				994	* subclass of 1 in get_unbound_pool().
				995	*/
				996	schedule_work(&pwq->unbound_release_work);
				997	}
				998
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	999	static void pwq_activate_delayed_work(struct work_struct *work)
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1000	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1001	struct pool_workqueue *pwq = get_work_pwq(work);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1002
				1003	trace_workqueue_activate_work(work);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1004	move_linked_works(work, &pwq->pool->worklist, NULL);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1005	__clear_bit(WORK_STRUCT_DELAYED_BIT, work_data_bits(work));
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1006	pwq->nr_active++;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1007	}
				1008
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1009	static void pwq_activate_first_delayed(struct pool_workqueue *pwq)
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1010	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1011	struct work_struct *work = list_first_entry(&pwq->delayed_works,
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1012	struct work_struct, entry);
				1013
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1014	pwq_activate_delayed_work(work);
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1015	}
				1016
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1017	/**
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1018	* pwq_dec_nr_in_flight - decrement pwq's nr_in_flight
				1019	* @pwq: pwq of interest
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1020	* @color: color of work which left the queue
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1021	*
				1022	* A work either has completed or is removed from pending queue,
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1023	* decrement nr_in_flight of its pwq and handle workqueue flushing.
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1024	*
				1025	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1026	* spin_lock_irq(pool->lock).
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1027	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1028	static void pwq_dec_nr_in_flight(struct pool_workqueue *pwq, int color)
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1029	{
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1030	/* uncolored work items don't participate in flushing or nr_active */
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1031	if (color == WORK_NO_COLOR)
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1032	goto out_put;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1033
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1034	pwq->nr_in_flight[color]--;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1035
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1036	pwq->nr_active--;
				1037	if (!list_empty(&pwq->delayed_works)) {
Lai Jiangshan	b3f9f40	2012-09-18 10:40:00 -0700	[diff] [blame]	1038	/* one down, submit a delayed one */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1039	if (pwq->nr_active < pwq->max_active)
				1040	pwq_activate_first_delayed(pwq);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1041	}
				1042
				1043	/* is flush in progress and are we at the flushing tip? */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1044	if (likely(pwq->flush_color != color))
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1045	goto out_put;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1046
				1047	/* are there still in-flight works? */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1048	if (pwq->nr_in_flight[color])
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1049	goto out_put;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1050
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1051	/* this pwq is done, clear flush_color */
				1052	pwq->flush_color = -1;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1053
				1054	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1055	* If this was the last pwq, wake up the first flusher. It
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1056	* will handle the rest.
				1057	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1058	if (atomic_dec_and_test(&pwq->wq->nr_pwqs_to_flush))
				1059	complete(&pwq->wq->first_flusher->done);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1060	out_put:
				1061	put_pwq(pwq);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1062	}
				1063
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1064	/**
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1065	* try_to_grab_pending - steal work item from worklist and disable irq
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1066	* @work: work item to steal
				1067	* @is_dwork: @work is a delayed_work
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1068	* @flags: place to store irq state
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1069	*
				1070	* Try to grab PENDING bit of @work. This function can handle @work in any
				1071	* stable state - idle, on timer or on worklist. Return values are
				1072	*
				1073	* 1 if @work was pending and we successfully stole PENDING
				1074	* 0 if @work was idle and we claimed PENDING
				1075	* -EAGAIN if PENDING couldn't be grabbed at the moment, safe to busy-retry
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1076	* -ENOENT if someone else is canceling @work, this state may persist
				1077	* for arbitrarily long
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1078	*
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1079	* On >= 0 return, the caller owns @work's PENDING bit. To avoid getting
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1080	* interrupted while holding PENDING and @work off queue, irq must be
				1081	* disabled on entry. This, combined with delayed_work->timer being
				1082	* irqsafe, ensures that we return -EAGAIN for finite short period of time.
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1083	*
				1084	* On successful return, >= 0, irq is disabled and the caller is
				1085	* responsible for releasing it using local_irq_restore(*@flags).
				1086	*
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1087	* This function is safe to call from any context including IRQ handler.
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1088	*/
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1089	static int try_to_grab_pending(struct work_struct *work, bool is_dwork,
				1090	unsigned long *flags)
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1091	{
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1092	struct worker_pool *pool;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1093	struct pool_workqueue *pwq;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1094
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1095	local_irq_save(*flags);
				1096
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1097	/* try to steal the timer if it exists */
				1098	if (is_dwork) {
				1099	struct delayed_work *dwork = to_delayed_work(work);
				1100
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1101	/*
				1102	* dwork->timer is irqsafe. If del_timer() fails, it's
				1103	* guaranteed that the timer is not queued anywhere and not
				1104	* running on the local CPU.
				1105	*/
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1106	if (likely(del_timer(&dwork->timer)))
				1107	return 1;
				1108	}
				1109
				1110	/* try to claim PENDING the normal way */
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1111	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work)))
				1112	return 0;
				1113
				1114	/*
				1115	* The queueing is in progress, or it is already queued. Try to
				1116	* steal it from ->worklist without clearing WORK_STRUCT_PENDING.
				1117	*/
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1118	pool = get_work_pool(work);
				1119	if (!pool)
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1120	goto fail;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1121
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1122	spin_lock(&pool->lock);
Lai Jiangshan	0b3dae6	2013-02-06 18:04:53 -0800	[diff] [blame]	1123	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1124	* work->data is guaranteed to point to pwq only while the work
				1125	* item is queued on pwq->wq, and both updating work->data to point
				1126	* to pwq on queueing and to pool on dequeueing are done under
				1127	* pwq->pool->lock. This in turn guarantees that, if work->data
				1128	* points to pwq which is associated with a locked pool, the work
Lai Jiangshan	0b3dae6	2013-02-06 18:04:53 -0800	[diff] [blame]	1129	* item is currently queued on that pool.
				1130	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1131	pwq = get_work_pwq(work);
				1132	if (pwq && pwq->pool == pool) {
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1133	debug_work_deactivate(work);
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1134
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1135	/*
				1136	* A delayed work item cannot be grabbed directly because
				1137	* it might have linked NO_COLOR work items which, if left
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1138	* on the delayed_works list, will confuse pwq->nr_active
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1139	* management later on and cause stall. Make sure the work
				1140	* item is activated before grabbing.
				1141	*/
				1142	if (*work_data_bits(work) & WORK_STRUCT_DELAYED)
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1143	pwq_activate_delayed_work(work);
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1144
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1145	list_del_init(&work->entry);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1146	pwq_dec_nr_in_flight(get_work_pwq(work), get_work_color(work));
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1147
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1148	/* work->data points to pwq iff queued, point to pool */
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1149	set_work_pool_and_keep_pending(work, pool->id);
Lai Jiangshan	4468a00	2013-02-06 18:04:53 -0800	[diff] [blame]	1150
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1151	spin_unlock(&pool->lock);
				1152	return 1;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1153	}
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1154	spin_unlock(&pool->lock);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1155	fail:
				1156	local_irq_restore(*flags);
				1157	if (work_is_canceling(work))
				1158	return -ENOENT;
				1159	cpu_relax();
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1160	return -EAGAIN;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1161	}
				1162
				1163	/**
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1164	* insert_work - insert a work into a pool
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1165	* @pwq: pwq @work belongs to
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1166	* @work: work to insert
				1167	* @head: insertion point
				1168	* @extra_flags: extra WORK_STRUCT_* flags to set
				1169	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1170	* Insert @work which belongs to @pwq after @head. @extra_flags is or'd to
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1171	* work_struct flags.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1172	*
				1173	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1174	* spin_lock_irq(pool->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1175	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1176	static void insert_work(struct pool_workqueue *pwq, struct work_struct *work,
				1177	struct list_head *head, unsigned int extra_flags)
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	1178	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1179	struct worker_pool *pool = pwq->pool;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	1180
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1181	/* we own @work, set data and link */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1182	set_work_pwq(work, pwq, extra_flags);
Oleg Nesterov	1a4d9b0	2008-07-25 01:47:47 -0700	[diff] [blame]	1183	list_add_tail(&work->entry, head);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1184	get_pwq(pwq);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1185
				1186	/*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1187	* Ensure either wq_worker_sleeping() sees the above
				1188	* list_add_tail() or we see zero nr_running to avoid workers lying
				1189	* around lazily while there are works to be processed.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1190	*/
				1191	smp_mb();
				1192
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1193	if (__need_more_worker(pool))
				1194	wake_up_worker(pool);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	1195	}
				1196
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1197	/*
				1198	* Test whether @work is being queued from another work executing on the
Tejun Heo	8d03ecf	2013-02-13 19:29:10 -0800	[diff] [blame]	1199	* same workqueue.
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1200	*/
				1201	static bool is_chained_work(struct workqueue_struct *wq)
				1202	{
Tejun Heo	8d03ecf	2013-02-13 19:29:10 -0800	[diff] [blame]	1203	struct worker *worker;
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1204
Tejun Heo	8d03ecf	2013-02-13 19:29:10 -0800	[diff] [blame]	1205	worker = current_wq_worker();
				1206	/*
				1207	* Return %true iff I'm a worker executing a work item on @wq. If
				1208	* I'm @worker, it's safe to dereference it without locking.
				1209	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1210	return worker && worker->current_pwq->wq == wq;
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1211	}
				1212
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	1213	static void __queue_work(int cpu, struct workqueue_struct *wq,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1214	struct work_struct *work)
				1215	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1216	struct pool_workqueue *pwq;
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1217	struct worker_pool *last_pool;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1218	struct list_head *worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1219	unsigned int work_flags;
Joonsoo Kim	b75cac9	2012-08-15 23:25:37 +0900	[diff] [blame]	1220	unsigned int req_cpu = cpu;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1221
				1222	/*
				1223	* While a work item is PENDING && off queue, a task trying to
				1224	* steal the PENDING will busy-loop waiting for it to either get
				1225	* queued or lose PENDING. Grabbing PENDING and queueing should
				1226	* happen with IRQ disabled.
				1227	*/
				1228	WARN_ON_ONCE(!irqs_disabled());
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1229
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	1230	debug_work_activate(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1231
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1232	/* if dying, only works from the same workqueue are allowed */
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	1233	if (unlikely(wq->flags & __WQ_DRAINING) &&
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1234	WARN_ON_ONCE(!is_chained_work(wq)))
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	1235	return;
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	1236	retry:
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1237	/* pwq which will be used unless @work is executing elsewhere */
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1238	if (!(wq->flags & WQ_UNBOUND)) {
Tejun Heo	5746982	2012-08-03 10:30:45 -0700	[diff] [blame]	1239	if (cpu == WORK_CPU_UNBOUND)
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1240	cpu = raw_smp_processor_id();
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	1241	pwq = per_cpu_ptr(wq->cpu_pwqs, cpu);
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1242	} else {
				1243	pwq = first_pwq(wq);
				1244	}
Tejun Heo	dbf2576	2012-08-20 14:51:23 -0700	[diff] [blame]	1245
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1246	/*
				1247	* If @work was previously on a different pool, it might still be
				1248	* running there, in which case the work needs to be queued on that
				1249	* pool to guarantee non-reentrancy.
				1250	*/
				1251	last_pool = get_work_pool(work);
				1252	if (last_pool && last_pool != pwq->pool) {
				1253	struct worker *worker;
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1254
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1255	spin_lock(&last_pool->lock);
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1256
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1257	worker = find_worker_executing_work(last_pool, work);
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1258
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1259	if (worker && worker->current_pwq->wq == wq) {
				1260	pwq = worker->current_pwq;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1261	} else {
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1262	/* meh... not running there, queue here */
				1263	spin_unlock(&last_pool->lock);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1264	spin_lock(&pwq->pool->lock);
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1265	}
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1266	} else {
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1267	spin_lock(&pwq->pool->lock);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1268	}
				1269
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	1270	/*
				1271	* pwq is determined and locked. For unbound pools, we could have
				1272	* raced with pwq release and it could already be dead. If its
				1273	* refcnt is zero, repeat pwq selection. Note that pwqs never die
				1274	* without another pwq replacing it as the first pwq or while a
				1275	* work item is executing on it, so the retrying is guaranteed to
				1276	* make forward-progress.
				1277	*/
				1278	if (unlikely(!pwq->refcnt)) {
				1279	if (wq->flags & WQ_UNBOUND) {
				1280	spin_unlock(&pwq->pool->lock);
				1281	cpu_relax();
				1282	goto retry;
				1283	}
				1284	/* oops */
				1285	WARN_ONCE(true, "workqueue: per-cpu pwq for %s on cpu%d has 0 refcnt",
				1286	wq->name, cpu);
				1287	}
				1288
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1289	/* pwq determined, queue */
				1290	trace_workqueue_queue_work(req_cpu, pwq, work);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1291
Dan Carpenter	f5b2552	2012-04-13 22:06:58 +0300	[diff] [blame]	1292	if (WARN_ON(!list_empty(&work->entry))) {
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1293	spin_unlock(&pwq->pool->lock);
Dan Carpenter	f5b2552	2012-04-13 22:06:58 +0300	[diff] [blame]	1294	return;
				1295	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1296
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1297	pwq->nr_in_flight[pwq->work_color]++;
				1298	work_flags = work_color_to_flags(pwq->work_color);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1299
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1300	if (likely(pwq->nr_active < pwq->max_active)) {
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1301	trace_workqueue_activate_work(work);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1302	pwq->nr_active++;
				1303	worklist = &pwq->pool->worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1304	} else {
				1305	work_flags |= WORK_STRUCT_DELAYED;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1306	worklist = &pwq->delayed_works;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1307	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1308
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1309	insert_work(pwq, work, worklist, work_flags);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1310
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1311	spin_unlock(&pwq->pool->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1312	}
				1313
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1314	/**
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1315	* queue_work_on - queue work on specific cpu
				1316	* @cpu: CPU number to execute work on
				1317	* @wq: workqueue to use
				1318	* @work: work to queue
				1319	*
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1320	* Returns %false if @work was already on a queue, %true otherwise.
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1321	*
				1322	* We queue the work to a specific CPU, the caller must ensure it
				1323	* can't go away.
				1324	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1325	bool queue_work_on(int cpu, struct workqueue_struct *wq,
				1326	struct work_struct *work)
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1327	{
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1328	bool ret = false;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1329	unsigned long flags;
				1330
				1331	local_irq_save(flags);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1332
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1333	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1334	__queue_work(cpu, wq, work);
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1335	ret = true;
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1336	}
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1337
				1338	local_irq_restore(flags);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1339	return ret;
				1340	}
				1341	EXPORT_SYMBOL_GPL(queue_work_on);
				1342
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1343	/**
				1344	* queue_work - queue work on a workqueue
				1345	* @wq: workqueue to use
				1346	* @work: work to queue
				1347	*
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1348	* Returns %false if @work was already on a queue, %true otherwise.
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1349	*
				1350	* We queue the work to the CPU on which it was submitted, but if the CPU dies
				1351	* it can be processed by another CPU.
				1352	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1353	bool queue_work(struct workqueue_struct *wq, struct work_struct *work)
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1354	{
Tejun Heo	5746982	2012-08-03 10:30:45 -0700	[diff] [blame]	1355	return queue_work_on(WORK_CPU_UNBOUND, wq, work);
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1356	}
				1357	EXPORT_SYMBOL_GPL(queue_work);
				1358
Tejun Heo	d8e794d	2012-08-03 10:30:45 -0700	[diff] [blame]	1359	void delayed_work_timer_fn(unsigned long __data)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1360	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1361	struct delayed_work *dwork = (struct delayed_work *)__data;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1362
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1363	/* should have been called from irqsafe timer with irq already off */
Lai Jiangshan	60c057b	2013-02-06 18:04:53 -0800	[diff] [blame]	1364	__queue_work(dwork->cpu, dwork->wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1365	}
Konstantin Khlebnikov	1438ade5	2013-01-24 16:36:31 +0400	[diff] [blame]	1366	EXPORT_SYMBOL(delayed_work_timer_fn);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1367
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1368	static void __queue_delayed_work(int cpu, struct workqueue_struct *wq,
				1369	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1370	{
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1371	struct timer_list *timer = &dwork->timer;
				1372	struct work_struct *work = &dwork->work;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1373
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1374	WARN_ON_ONCE(timer->function != delayed_work_timer_fn ||
				1375	timer->data != (unsigned long)dwork);
Tejun Heo	fc4b514	2012-12-04 07:40:39 -0800	[diff] [blame]	1376	WARN_ON_ONCE(timer_pending(timer));
				1377	WARN_ON_ONCE(!list_empty(&work->entry));
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1378
Tejun Heo	8852aac	2012-12-01 16:23:42 -0800	[diff] [blame]	1379	/*
				1380	* If @delay is 0, queue @dwork->work immediately. This is for
				1381	* both optimization and correctness. The earliest @timer can
				1382	* expire is on the closest next tick and delayed_work users depend
				1383	* on that there's no such delay when @delay is 0.
				1384	*/
				1385	if (!delay) {
				1386	__queue_work(cpu, wq, &dwork->work);
				1387	return;
				1388	}
				1389
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1390	timer_stats_timer_set_start_info(&dwork->timer);
				1391
Lai Jiangshan	60c057b	2013-02-06 18:04:53 -0800	[diff] [blame]	1392	dwork->wq = wq;
Tejun Heo	1265057	2012-08-08 09:38:42 -0700	[diff] [blame]	1393	dwork->cpu = cpu;
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1394	timer->expires = jiffies + delay;
				1395
				1396	if (unlikely(cpu != WORK_CPU_UNBOUND))
				1397	add_timer_on(timer, cpu);
				1398	else
				1399	add_timer(timer);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1400	}
				1401
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1402	/**
				1403	* queue_delayed_work_on - queue work on specific CPU after delay
				1404	* @cpu: CPU number to execute work on
				1405	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1406	* @dwork: work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1407	* @delay: number of jiffies to wait before queueing
				1408	*
Tejun Heo	715f130	2012-08-03 10:30:46 -0700	[diff] [blame]	1409	* Returns %false if @work was already on a queue, %true otherwise. If
				1410	* @delay is zero and @dwork is idle, it will be scheduled for immediate
				1411	* execution.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1412	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1413	bool queue_delayed_work_on(int cpu, struct workqueue_struct *wq,
				1414	struct delayed_work *dwork, unsigned long delay)
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1415	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1416	struct work_struct *work = &dwork->work;
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1417	bool ret = false;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1418	unsigned long flags;
				1419
				1420	/* read the comment in __queue_work() */
				1421	local_irq_save(flags);
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1422
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1423	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1424	__queue_delayed_work(cpu, wq, dwork, delay);
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1425	ret = true;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1426	}
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1427
				1428	local_irq_restore(flags);
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1429	return ret;
				1430	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1431	EXPORT_SYMBOL_GPL(queue_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1432
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1433	/**
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1434	* queue_delayed_work - queue work on a workqueue after delay
				1435	* @wq: workqueue to use
				1436	* @dwork: delayable work to queue
				1437	* @delay: number of jiffies to wait before queueing
				1438	*
Tejun Heo	715f130	2012-08-03 10:30:46 -0700	[diff] [blame]	1439	* Equivalent to queue_delayed_work_on() but tries to use the local CPU.
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1440	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1441	bool queue_delayed_work(struct workqueue_struct *wq,
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1442	struct delayed_work *dwork, unsigned long delay)
				1443	{
Tejun Heo	5746982	2012-08-03 10:30:45 -0700	[diff] [blame]	1444	return queue_delayed_work_on(WORK_CPU_UNBOUND, wq, dwork, delay);
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	1445	}
				1446	EXPORT_SYMBOL_GPL(queue_delayed_work);
				1447
				1448	/**
Tejun Heo	8376fe2	2012-08-03 10:30:47 -0700	[diff] [blame]	1449	* mod_delayed_work_on - modify delay of or queue a delayed work on specific CPU
				1450	* @cpu: CPU number to execute work on
				1451	* @wq: workqueue to use
				1452	* @dwork: work to queue
				1453	* @delay: number of jiffies to wait before queueing
				1454	*
				1455	* If @dwork is idle, equivalent to queue_delayed_work_on(); otherwise,
				1456	* modify @dwork's timer so that it expires after @delay. If @delay is
				1457	* zero, @work is guaranteed to be scheduled immediately regardless of its
				1458	* current state.
				1459	*
				1460	* Returns %false if @dwork was idle and queued, %true if @dwork was
				1461	* pending and its timer was modified.
				1462	*
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1463	* This function is safe to call from any context including IRQ handler.
Tejun Heo	8376fe2	2012-08-03 10:30:47 -0700	[diff] [blame]	1464	* See try_to_grab_pending() for details.
				1465	*/
				1466	bool mod_delayed_work_on(int cpu, struct workqueue_struct *wq,
				1467	struct delayed_work *dwork, unsigned long delay)
				1468	{
				1469	unsigned long flags;
				1470	int ret;
				1471
				1472	do {
				1473	ret = try_to_grab_pending(&dwork->work, true, &flags);
				1474	} while (unlikely(ret == -EAGAIN));
				1475
				1476	if (likely(ret >= 0)) {
				1477	__queue_delayed_work(cpu, wq, dwork, delay);
				1478	local_irq_restore(flags);
				1479	}
				1480
				1481	/* -ENOENT from try_to_grab_pending() becomes %true */
				1482	return ret;
				1483	}
				1484	EXPORT_SYMBOL_GPL(mod_delayed_work_on);
				1485
				1486	/**
				1487	* mod_delayed_work - modify delay of or queue a delayed work
				1488	* @wq: workqueue to use
				1489	* @dwork: work to queue
				1490	* @delay: number of jiffies to wait before queueing
				1491	*
				1492	* mod_delayed_work_on() on local CPU.
				1493	*/
				1494	bool mod_delayed_work(struct workqueue_struct *wq, struct delayed_work *dwork,
				1495	unsigned long delay)
				1496	{
				1497	return mod_delayed_work_on(WORK_CPU_UNBOUND, wq, dwork, delay);
				1498	}
				1499	EXPORT_SYMBOL_GPL(mod_delayed_work);
				1500
				1501	/**
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1502	* worker_enter_idle - enter idle state
				1503	* @worker: worker which is entering idle state
				1504	*
				1505	* @worker is entering idle state. Update stats and idle timer if
				1506	* necessary.
				1507	*
				1508	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1509	* spin_lock_irq(pool->lock).
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1510	*/
				1511	static void worker_enter_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1512	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1513	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1514
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1515	if (WARN_ON_ONCE(worker->flags & WORKER_IDLE) ||
				1516	WARN_ON_ONCE(!list_empty(&worker->entry) &&
				1517	(worker->hentry.next || worker->hentry.pprev)))
				1518	return;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1519
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1520	/* can't use worker_set_flags(), also called from start_worker() */
				1521	worker->flags |= WORKER_IDLE;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1522	pool->nr_idle++;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1523	worker->last_active = jiffies;
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	1524
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1525	/* idle_list is LIFO */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1526	list_add(&worker->entry, &pool->idle_list);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1527
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	1528	if (too_many_workers(pool) && !timer_pending(&pool->idle_timer))
				1529	mod_timer(&pool->idle_timer, jiffies + IDLE_WORKER_TIMEOUT);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1530
Tejun Heo	544ecf3	2012-05-14 15:04:50 -0700	[diff] [blame]	1531	/*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1532	* Sanity check nr_running. Because wq_unbind_fn() releases
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1533	* pool->lock between setting %WORKER_UNBOUND and zapping
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	1534	* nr_running, the warning may trigger spuriously. Check iff
				1535	* unbind is not in progress.
Tejun Heo	544ecf3	2012-05-14 15:04:50 -0700	[diff] [blame]	1536	*/
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1537	WARN_ON_ONCE(!(pool->flags & POOL_DISASSOCIATED) &&
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1538	pool->nr_workers == pool->nr_idle &&
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	1539	atomic_read(&pool->nr_running));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1540	}
				1541
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1542	/**
				1543	* worker_leave_idle - leave idle state
				1544	* @worker: worker which is leaving idle state
				1545	*
				1546	* @worker is leaving idle state. Update stats.
				1547	*
				1548	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1549	* spin_lock_irq(pool->lock).
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1550	*/
				1551	static void worker_leave_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1552	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1553	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1554
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1555	if (WARN_ON_ONCE(!(worker->flags & WORKER_IDLE)))
				1556	return;
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	1557	worker_clr_flags(worker, WORKER_IDLE);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1558	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1559	list_del_init(&worker->entry);
				1560	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1561
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1562	/**
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1563	* worker_maybe_bind_and_lock - try to bind %current to worker_pool and lock it
				1564	* @pool: target worker_pool
				1565	*
				1566	* Bind %current to the cpu of @pool if it is associated and lock @pool.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1567	*
				1568	* Works which are scheduled while the cpu is online must at least be
				1569	* scheduled to a worker which is bound to the cpu so that if they are
				1570	* flushed from cpu callbacks while cpu is going down, they are
				1571	* guaranteed to execute on the cpu.
				1572	*
Lai Jiangshan	f5faa07	2013-02-19 12:17:02 -0800	[diff] [blame]	1573	* This function is to be used by unbound workers and rescuers to bind
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1574	* themselves to the target cpu and may race with cpu going down or
				1575	* coming online. kthread_bind() can't be used because it may put the
				1576	* worker to already dead cpu and set_cpus_allowed_ptr() can't be used
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1577	* verbatim as it's best effort and blocking and pool may be
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1578	* [dis]associated in the meantime.
				1579	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1580	* This function tries set_cpus_allowed() and locks pool and verifies the
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1581	* binding against %POOL_DISASSOCIATED which is set during
Tejun Heo	f2d5a0e	2012-07-17 12:39:26 -0700	[diff] [blame]	1582	* %CPU_DOWN_PREPARE and cleared during %CPU_ONLINE, so if the worker
				1583	* enters idle state or fetches works without dropping lock, it can
				1584	* guarantee the scheduling requirement described in the first paragraph.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1585	*
				1586	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1587	* Might sleep. Called without any lock but returns with pool->lock
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1588	* held.
				1589	*
				1590	* RETURNS:
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1591	* %true if the associated pool is online (@worker is successfully
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1592	* bound), %false if offline.
				1593	*/
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1594	static bool worker_maybe_bind_and_lock(struct worker_pool *pool)
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1595	__acquires(&pool->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1596	{
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1597	while (true) {
				1598	/*
				1599	* The following call may fail, succeed or succeed
				1600	* without actually migrating the task to the cpu if
				1601	* it races with cpu hotunplug operation. Verify
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1602	* against POOL_DISASSOCIATED.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1603	*/
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1604	if (!(pool->flags & POOL_DISASSOCIATED))
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1605	set_cpus_allowed_ptr(current, pool->attrs->cpumask);
Oleg Nesterov	85f4186	2007-05-09 02:34:20 -0700	[diff] [blame]	1606
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1607	spin_lock_irq(&pool->lock);
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1608	if (pool->flags & POOL_DISASSOCIATED)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1609	return false;
Lai Jiangshan	f5faa07	2013-02-19 12:17:02 -0800	[diff] [blame]	1610	if (task_cpu(current) == pool->cpu &&
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1611	cpumask_equal(&current->cpus_allowed, pool->attrs->cpumask))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1612	return true;
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1613	spin_unlock_irq(&pool->lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1614
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1615	/*
				1616	* We've raced with CPU hot[un]plug. Give it a breather
				1617	* and retry migration. cond_resched() is required here;
				1618	* otherwise, we might deadlock against cpu_stop trying to
				1619	* bring down the CPU on non-preemptive kernel.
				1620	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1621	cpu_relax();
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1622	cond_resched();
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1623	}
				1624	}
				1625
				1626	/*
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1627	* Rebind an idle @worker to its CPU. worker_thread() will test
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	1628	* list_empty(@worker->entry) before leaving idle and call this function.
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1629	*/
				1630	static void idle_worker_rebind(struct worker *worker)
				1631	{
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	1632	/* CPU may go down again inbetween, clear UNBOUND only on success */
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1633	if (worker_maybe_bind_and_lock(worker->pool))
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	1634	worker_clr_flags(worker, WORKER_UNBOUND);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1635
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1636	/* rebind complete, become available again */
				1637	list_add(&worker->entry, &worker->pool->idle_list);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1638	spin_unlock_irq(&worker->pool->lock);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1639	}
				1640
				1641	/*
				1642	* Function for @worker->rebind.work used to rebind unbound busy workers to
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	1643	* the associated cpu which is coming back online. This is scheduled by
				1644	* cpu up but can race with other cpu hotplug operations and may be
				1645	* executed twice without intervening cpu down.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1646	*/
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1647	static void busy_worker_rebind_fn(struct work_struct *work)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1648	{
				1649	struct worker *worker = container_of(work, struct worker, rebind_work);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1650
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1651	if (worker_maybe_bind_and_lock(worker->pool))
Lai Jiangshan	eab6d82	2012-09-18 09:59:22 -0700	[diff] [blame]	1652	worker_clr_flags(worker, WORKER_UNBOUND);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1653
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1654	spin_unlock_irq(&worker->pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1655	}
				1656
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1657	/**
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1658	* rebind_workers - rebind all workers of a pool to the associated CPU
				1659	* @pool: pool of interest
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1660	*
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1661	* @pool->cpu is coming online. Rebind all workers to the CPU. Rebinding
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1662	* is different for idle and busy ones.
				1663	*
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1664	* Idle ones will be removed from the idle_list and woken up. They will
				1665	* add themselves back after completing rebind. This ensures that the
				1666	* idle_list doesn't contain any unbound workers when re-bound busy workers
				1667	* try to perform local wake-ups for concurrency management.
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1668	*
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1669	* Busy workers can rebind after they finish their current work items.
				1670	* Queueing the rebind work item at the head of the scheduled list is
				1671	* enough. Note that nr_running will be properly bumped as busy workers
				1672	* rebind.
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1673	*
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1674	* On return, all non-manager workers are scheduled for rebind - see
				1675	* manage_workers() for the manager special case. Any idle worker
				1676	* including the manager will not appear on @idle_list until rebind is
				1677	* complete, making local wake-ups safe.
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1678	*/
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1679	static void rebind_workers(struct worker_pool *pool)
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1680	{
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1681	struct worker worker, n;
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1682	int i;
				1683
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1684	lockdep_assert_held(&pool->assoc_mutex);
				1685	lockdep_assert_held(&pool->lock);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1686
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	1687	/* dequeue and kick idle ones */
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1688	list_for_each_entry_safe(worker, n, &pool->idle_list, entry) {
				1689	/*
				1690	* idle workers should be off @pool->idle_list until rebind
				1691	* is complete to avoid receiving premature local wake-ups.
				1692	*/
				1693	list_del_init(&worker->entry);
Lai Jiangshan	96e6530	2012-09-02 00:28:19 +0800	[diff] [blame]	1694
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1695	/*
				1696	* worker_thread() will see the above dequeuing and call
				1697	* idle_worker_rebind().
				1698	*/
				1699	wake_up_process(worker->task);
				1700	}
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1701
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1702	/* rebind busy workers */
Sasha Levin	b67bfe0	2013-02-27 17:06:00 -0800	[diff] [blame]	1703	for_each_busy_worker(worker, i, pool) {
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1704	struct work_struct *rebind_work = &worker->rebind_work;
				1705	struct workqueue_struct *wq;
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1706
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1707	if (test_and_set_bit(WORK_STRUCT_PENDING_BIT,
				1708	work_data_bits(rebind_work)))
				1709	continue;
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1710
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1711	debug_work_activate(rebind_work);
Tejun Heo	90beca5	2012-09-04 23:12:33 -0700	[diff] [blame]	1712
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1713	/*
				1714	* wq doesn't really matter but let's keep @worker->pool
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1715	* and @pwq->pool consistent for sanity.
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1716	*/
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1717	if (worker->pool->attrs->nice < 0)
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1718	wq = system_highpri_wq;
				1719	else
				1720	wq = system_wq;
Tejun Heo	ec58815	2012-09-04 23:16:32 -0700	[diff] [blame]	1721
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	1722	insert_work(per_cpu_ptr(wq->cpu_pwqs, pool->cpu), rebind_work,
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	1723	worker->scheduled.next,
				1724	work_color_to_flags(WORK_NO_COLOR));
Tejun Heo	ec58815	2012-09-04 23:16:32 -0700	[diff] [blame]	1725	}
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1726	}
				1727
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1728	static struct worker *alloc_worker(void)
				1729	{
				1730	struct worker *worker;
				1731
				1732	worker = kzalloc(sizeof(*worker), GFP_KERNEL);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1733	if (worker) {
				1734	INIT_LIST_HEAD(&worker->entry);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1735	INIT_LIST_HEAD(&worker->scheduled);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1736	INIT_WORK(&worker->rebind_work, busy_worker_rebind_fn);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1737	/* on creation a worker is in !idle && prep state */
				1738	worker->flags = WORKER_PREP;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1739	}
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1740	return worker;
				1741	}
				1742
				1743	/**
				1744	* create_worker - create a new workqueue worker
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1745	* @pool: pool the new worker will belong to
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1746	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1747	* Create a new worker which is bound to @pool. The returned worker
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1748	* can be started by calling start_worker() or destroyed using
				1749	* destroy_worker().
				1750	*
				1751	* CONTEXT:
				1752	* Might sleep. Does GFP_KERNEL allocations.
				1753	*
				1754	* RETURNS:
				1755	* Pointer to the newly created worker.
				1756	*/
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1757	static struct worker create_worker(struct worker_pool pool)
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1758	{
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1759	const char *pri = pool->attrs->nice < 0 ? "H" : "";
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1760	struct worker *worker = NULL;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1761	int id = -1;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1762
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1763	spin_lock_irq(&pool->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1764	while (ida_get_new(&pool->worker_ida, &id)) {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1765	spin_unlock_irq(&pool->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1766	if (!ida_pre_get(&pool->worker_ida, GFP_KERNEL))
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1767	goto fail;
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1768	spin_lock_irq(&pool->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1769	}
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1770	spin_unlock_irq(&pool->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1771
				1772	worker = alloc_worker();
				1773	if (!worker)
				1774	goto fail;
				1775
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1776	worker->pool = pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1777	worker->id = id;
				1778
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	1779	if (pool->cpu >= 0)
Eric Dumazet	94dcf29	2011-03-22 16:30:45 -0700	[diff] [blame]	1780	worker->task = kthread_create_on_node(worker_thread,
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	1781	worker, cpu_to_node(pool->cpu),
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	1782	"kworker/%d:%d%s", pool->cpu, id, pri);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1783	else
				1784	worker->task = kthread_create(worker_thread, worker,
Tejun Heo	ac6104c	2013-03-12 11:30:03 -0700	[diff] [blame]	1785	"kworker/u%d:%d%s",
				1786	pool->id, id, pri);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1787	if (IS_ERR(worker->task))
				1788	goto fail;
				1789
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1790	/*
				1791	* set_cpus_allowed_ptr() will fail if the cpumask doesn't have any
				1792	* online CPUs. It'll be re-applied when any of the CPUs come up.
				1793	*/
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1794	set_user_nice(worker->task, pool->attrs->nice);
				1795	set_cpus_allowed_ptr(worker->task, pool->attrs->cpumask);
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1796
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1797	/*
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1798	* %PF_THREAD_BOUND is used to prevent userland from meddling with
				1799	* cpumask of workqueue workers. This is an abuse. We need
				1800	* %PF_NO_SETAFFINITY.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1801	*/
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1802	worker->task->flags \|= PF_THREAD_BOUND;
				1803
				1804	/*
				1805	* The caller is responsible for ensuring %POOL_DISASSOCIATED
				1806	* remains stable across this function. See the comments above the
				1807	* flag definition for details.
				1808	*/
				1809	if (pool->flags & POOL_DISASSOCIATED)
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1810	worker->flags \|= WORKER_UNBOUND;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1811
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1812	return worker;
				1813	fail:
				1814	if (id >= 0) {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1815	spin_lock_irq(&pool->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1816	ida_remove(&pool->worker_ida, id);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1817	spin_unlock_irq(&pool->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1818	}
				1819	kfree(worker);
				1820	return NULL;
				1821	}
				1822
				1823	/**
				1824	* start_worker - start a newly created worker
				1825	* @worker: worker to start
				1826	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1827	* Make the pool aware of @worker and start it.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1828	*
				1829	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1830	* spin_lock_irq(pool->lock).
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1831	*/
				1832	static void start_worker(struct worker *worker)
				1833	{
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1834	worker->flags \|= WORKER_STARTED;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1835	worker->pool->nr_workers++;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1836	worker_enter_idle(worker);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1837	wake_up_process(worker->task);
				1838	}
				1839
				1840	/**
				1841	* destroy_worker - destroy a workqueue worker
				1842	* @worker: worker to be destroyed
				1843	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1844	* Destroy @worker and adjust @pool stats accordingly.
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1845	*
				1846	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1847	* spin_lock_irq(pool->lock) which is released and regrabbed.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1848	*/
				1849	static void destroy_worker(struct worker *worker)
				1850	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1851	struct worker_pool *pool = worker->pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1852	int id = worker->id;
				1853
				1854	/* sanity check frenzy */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1855	if (WARN_ON(worker->current_work) \|\|
				1856	WARN_ON(!list_empty(&worker->scheduled)))
				1857	return;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1858
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1859	if (worker->flags & WORKER_STARTED)
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1860	pool->nr_workers--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1861	if (worker->flags & WORKER_IDLE)
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1862	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1863
				1864	list_del_init(&worker->entry);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1865	worker->flags \|= WORKER_DIE;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1866
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1867	spin_unlock_irq(&pool->lock);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1868
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1869	kthread_stop(worker->task);
				1870	kfree(worker);
				1871
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1872	spin_lock_irq(&pool->lock);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1873	ida_remove(&pool->worker_ida, id);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1874	}
				1875
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1876	static void idle_worker_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1877	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1878	struct worker_pool pool = (void )__pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1879
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1880	spin_lock_irq(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1881
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1882	if (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1883	struct worker *worker;
				1884	unsigned long expires;
				1885
				1886	/* idle_list is kept in LIFO order, check the last one */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1887	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1888	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1889
				1890	if (time_before(jiffies, expires))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1891	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1892	else {
				1893	/* it's been idle for too long, wake up manager */
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	1894	pool->flags \|= POOL_MANAGE_WORKERS;
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1895	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1896	}
				1897	}
				1898
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1899	spin_unlock_irq(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1900	}
				1901
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1902	static void send_mayday(struct work_struct *work)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1903	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1904	struct pool_workqueue *pwq = get_work_pwq(work);
				1905	struct workqueue_struct *wq = pwq->wq;
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1906
				1907	lockdep_assert_held(&workqueue_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1908
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	1909	if (!wq->rescuer)
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1910	return;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1911
				1912	/* mayday mayday mayday */
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1913	if (list_empty(&pwq->mayday_node)) {
				1914	list_add_tail(&pwq->mayday_node, &wq->maydays);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1915	wake_up_process(wq->rescuer->task);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1916	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1917	}
				1918
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1919	static void pool_mayday_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1920	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1921	struct worker_pool pool = (void )__pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1922	struct work_struct *work;
				1923
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1924	spin_lock_irq(&workqueue_lock); /* for wq->maydays */
				1925	spin_lock(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1926
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1927	if (need_to_create_worker(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1928	/*
				1929	* We've been trying to create a new worker but
				1930	* haven't been successful. We might be hitting an
				1931	* allocation deadlock. Send distress signals to
				1932	* rescuers.
				1933	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1934	list_for_each_entry(work, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1935	send_mayday(work);
				1936	}
				1937
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1938	spin_unlock(&pool->lock);
				1939	spin_unlock_irq(&workqueue_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1940
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1941	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INTERVAL);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1942	}
				1943
				1944	/**
				1945	* maybe_create_worker - create a new worker if necessary
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1946	* @pool: pool to create a new worker for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1947	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1948	* Create a new worker for @pool if necessary. @pool is guaranteed to
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1949	* have at least one idle worker on return from this function. If
				1950	* creating a new worker takes longer than MAYDAY_INTERVAL, mayday is
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1951	* sent to all rescuers with works scheduled on @pool to resolve
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1952	* possible allocation deadlock.
				1953	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1954	* On return, need_to_create_worker() is guaranteed to be %false and
				1955	* may_start_working() %true.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1956	*
				1957	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1958	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1959	* multiple times. Does GFP_KERNEL allocations. Called only from
				1960	* manager.
				1961	*
				1962	* RETURNS:
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1963	* %false if no action was taken and pool->lock stayed locked, %true
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1964	* otherwise.
				1965	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1966	static bool maybe_create_worker(struct worker_pool *pool)
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1967	__releases(&pool->lock)
				1968	__acquires(&pool->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1969	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1970	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1971	return false;
				1972	restart:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1973	spin_unlock_irq(&pool->lock);
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1974
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1975	/* if we don't make progress in MAYDAY_INITIAL_TIMEOUT, call for help */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1976	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INITIAL_TIMEOUT);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1977
				1978	while (true) {
				1979	struct worker *worker;
				1980
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1981	worker = create_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1982	if (worker) {
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1983	del_timer_sync(&pool->mayday_timer);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1984	spin_lock_irq(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1985	start_worker(worker);
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1986	if (WARN_ON_ONCE(need_to_create_worker(pool)))
				1987	goto restart;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1988	return true;
				1989	}
				1990
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1991	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1992	break;
				1993
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1994	__set_current_state(TASK_INTERRUPTIBLE);
				1995	schedule_timeout(CREATE_COOLDOWN);
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1996
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1997	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1998	break;
				1999	}
				2000
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2001	del_timer_sync(&pool->mayday_timer);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2002	spin_lock_irq(&pool->lock);
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2003	if (need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2004	goto restart;
				2005	return true;
				2006	}
				2007
				2008	/**
				2009	* maybe_destroy_worker - destroy workers which have been idle for a while
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2010	* @pool: pool to destroy workers for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2011	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2012	* Destroy @pool workers which have been idle for longer than
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2013	* IDLE_WORKER_TIMEOUT.
				2014	*
				2015	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2016	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2017	* multiple times. Called only from manager.
				2018	*
				2019	* RETURNS:
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	2020	* %false if no action was taken and pool->lock stayed locked, %true
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2021	* otherwise.
				2022	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2023	static bool maybe_destroy_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2024	{
				2025	bool ret = false;
				2026
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2027	while (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2028	struct worker *worker;
				2029	unsigned long expires;
				2030
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2031	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2032	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				2033
				2034	if (time_before(jiffies, expires)) {
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2035	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2036	break;
				2037	}
				2038
				2039	destroy_worker(worker);
				2040	ret = true;
				2041	}
				2042
				2043	return ret;
				2044	}
				2045
				2046	/**
				2047	* manage_workers - manage worker pool
				2048	* @worker: self
				2049	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2050	* Assume the manager role and manage the worker pool @worker belongs
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2051	* to. At any given time, there can be only zero or one manager per
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2052	* pool. The exclusion is handled automatically by this function.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2053	*
				2054	* The caller can safely start processing works on false return. On
				2055	* true return, it's guaranteed that need_to_create_worker() is false
				2056	* and may_start_working() is true.
				2057	*
				2058	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2059	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2060	* multiple times. Does GFP_KERNEL allocations.
				2061	*
				2062	* RETURNS:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2063	* %false if no management was performed and pool->lock stayed locked,
				2064	* %true if some action was taken and pool->lock may have been released.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2065	*/
				2066	static bool manage_workers(struct worker *worker)
				2067	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2068	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2069	bool ret = false;
				2070
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	2071	if (!mutex_trylock(&pool->manager_arb))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2072	return ret;
				2073
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2074	/*
				2075	* To simplify both worker management and CPU hotplug, hold off
				2076	* management while hotplug is in progress. CPU hotplug path can't
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	2077	* grab @pool->manager_arb to achieve this because that can lead to
				2078	* idle worker depletion (all become busy thinking someone else is
				2079	* managing) which in turn can result in deadlock under extreme
				2080	* circumstances. Use @pool->assoc_mutex to synchronize manager
				2081	* against CPU hotplug.
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2082	*
Lai Jiangshan	b2eb83d	2012-09-18 09:59:23 -0700	[diff] [blame]	2083	* assoc_mutex would always be free unless CPU hotplug is in
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2084	* progress. trylock first without dropping @pool->lock.
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2085	*/
Lai Jiangshan	b2eb83d	2012-09-18 09:59:23 -0700	[diff] [blame]	2086	if (unlikely(!mutex_trylock(&pool->assoc_mutex))) {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2087	spin_unlock_irq(&pool->lock);
Lai Jiangshan	b2eb83d	2012-09-18 09:59:23 -0700	[diff] [blame]	2088	mutex_lock(&pool->assoc_mutex);
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2089	/*
				2090	* CPU hotplug could have happened while we were waiting
Lai Jiangshan	b2eb83d	2012-09-18 09:59:23 -0700	[diff] [blame]	2091	* for assoc_mutex. Hotplug itself can't handle us
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2092	* because manager isn't either on idle or busy list, and
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2093	* @pool's state and ours could have deviated.
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2094	*
Lai Jiangshan	b2eb83d	2012-09-18 09:59:23 -0700	[diff] [blame]	2095	* As hotplug is now excluded via assoc_mutex, we can
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2096	* simply try to bind. It will succeed or fail depending
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2097	* on @pool's current state. Try it and adjust
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2098	* %WORKER_UNBOUND accordingly.
				2099	*/
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	2100	if (worker_maybe_bind_and_lock(pool))
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2101	worker->flags &= ~WORKER_UNBOUND;
				2102	else
				2103	worker->flags |= WORKER_UNBOUND;
				2104
				2105	ret = true;
				2106	}
				2107
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	2108	pool->flags &= ~POOL_MANAGE_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2109
				2110	/*
				2111	* Destroy and then create so that may_start_working() is true
				2112	* on return.
				2113	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2114	ret |= maybe_destroy_workers(pool);
				2115	ret |= maybe_create_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2116
Lai Jiangshan	b2eb83d	2012-09-18 09:59:23 -0700	[diff] [blame]	2117	mutex_unlock(&pool->assoc_mutex);
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	2118	mutex_unlock(&pool->manager_arb);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2119	return ret;
				2120	}
				2121
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2122	/**
				2123	* process_one_work - process single work
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2124	* @worker: self
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2125	* @work: work to process
				2126	*
				2127	* Process @work. This function contains all the logics necessary to
				2128	* process a single work including synchronization against and
				2129	* interaction with other workers on the same cpu, queueing and
				2130	* flushing. As long as context requirement is met, any worker can
				2131	* call this function to process a work.
				2132	*
				2133	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2134	* spin_lock_irq(pool->lock) which is released and regrabbed.
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2135	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2136	static void process_one_work(struct worker *worker, struct work_struct *work)
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2137	__releases(&pool->lock)
				2138	__acquires(&pool->lock)
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2139	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2140	struct pool_workqueue *pwq = get_work_pwq(work);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2141	struct worker_pool *pool = worker->pool;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2142	bool cpu_intensive = pwq->wq->flags & WQ_CPU_INTENSIVE;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2143	int work_color;
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	2144	struct worker *collision;
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2145	#ifdef CONFIG_LOCKDEP
				2146	/*
				2147	* It is permissible to free the struct work_struct from
				2148	* inside the function that is called from it, this we need to
				2149	* take into account for lockdep too. To avoid bogus "held
				2150	* lock freed" warnings as well as problems when looking into
				2151	* work->lockdep_map, make a copy and use that here.
				2152	*/
Peter Zijlstra	4d82a1d	2012-05-15 08:06:19 -0700	[diff] [blame]	2153	struct lockdep_map lockdep_map;
				2154
				2155	lockdep_copy_map(&lockdep_map, &work->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2156	#endif
Tejun Heo	6fec10a	2012-07-22 10:16:34 -0700	[diff] [blame]	2157	/*
				2158	* Ensure we're on the correct CPU. DISASSOCIATED test is
				2159	* necessary to avoid spurious warnings from rescuers servicing the
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	2160	* unbound or a disassociated pool.
Tejun Heo	6fec10a	2012-07-22 10:16:34 -0700	[diff] [blame]	2161	*/
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2162	WARN_ON_ONCE(!(worker->flags & WORKER_UNBOUND) &&
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	2163	!(pool->flags & POOL_DISASSOCIATED) &&
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	2164	raw_smp_processor_id() != pool->cpu);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2165
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	2166	/*
				2167	* A single work shouldn't be executed concurrently by
				2168	* multiple workers on a single cpu. Check whether anyone is
				2169	* already processing the work. If so, defer the work to the
				2170	* currently executing one.
				2171	*/
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2172	collision = find_worker_executing_work(pool, work);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	2173	if (unlikely(collision)) {
				2174	move_linked_works(work, &collision->scheduled, NULL);
				2175	return;
				2176	}
				2177
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2178	/* claim and dequeue */
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2179	debug_work_deactivate(work);
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2180	hash_add(pool->busy_hash, &worker->hentry, (unsigned long)work);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2181	worker->current_work = work;
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2182	worker->current_func = work->func;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2183	worker->current_pwq = pwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2184	work_color = get_work_color(work);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2185
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2186	list_del_init(&work->entry);
				2187
Tejun Heo	649027d	2010-06-29 10:07:14 +0200	[diff] [blame]	2188	/*
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	2189	* CPU intensive works don't participate in concurrency
				2190	* management. They're the scheduler's responsibility.
				2191	*/
				2192	if (unlikely(cpu_intensive))
				2193	worker_set_flags(worker, WORKER_CPU_INTENSIVE, true);
				2194
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	2195	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2196	* Unbound pool isn't concurrency managed and work items should be
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	2197	* executed ASAP. Wake up another worker if necessary.
				2198	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2199	if ((worker->flags & WORKER_UNBOUND) && need_more_worker(pool))
				2200	wake_up_worker(pool);
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	2201
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2202	/*
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	2203	* Record the last pool and clear PENDING which should be the last
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2204	* update to @work. Also, do this inside @pool->lock so that
Tejun Heo	23657bb	2012-08-13 17:08:19 -0700	[diff] [blame]	2205	* PENDING and queued state changes happen together while IRQ is
				2206	* disabled.
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2207	*/
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	2208	set_work_pool_and_clear_pending(work, pool->id);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2209
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2210	spin_unlock_irq(&pool->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2211
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2212	lock_map_acquire_read(&pwq->wq->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2213	lock_map_acquire(&lockdep_map);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	2214	trace_workqueue_execute_start(work);
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2215	worker->current_func(work);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	2216	/*
				2217	* While we must be careful to not use "work" after this, the trace
				2218	* point will only record its address.
				2219	*/
				2220	trace_workqueue_execute_end(work);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2221	lock_map_release(&lockdep_map);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2222	lock_map_release(&pwq->wq->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2223
				2224	if (unlikely(in_atomic() || lockdep_depth(current) > 0)) {
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	2225	pr_err("BUG: workqueue leaked lock or atomic: %s/0x%08x/%d\n"
				2226	" last function: %pf\n",
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2227	current->comm, preempt_count(), task_pid_nr(current),
				2228	worker->current_func);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2229	debug_show_held_locks(current);
				2230	dump_stack();
				2231	}
				2232
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2233	spin_lock_irq(&pool->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2234
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	2235	/* clear cpu intensive status */
				2236	if (unlikely(cpu_intensive))
				2237	worker_clr_flags(worker, WORKER_CPU_INTENSIVE);
				2238
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2239	/* we're done with it, release */
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	2240	hash_del(&worker->hentry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2241	worker->current_work = NULL;
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2242	worker->current_func = NULL;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2243	worker->current_pwq = NULL;
				2244	pwq_dec_nr_in_flight(pwq, work_color);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2245	}
				2246
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2247	/**
				2248	* process_scheduled_works - process scheduled works
				2249	* @worker: self
				2250	*
				2251	* Process all scheduled works. Please note that the scheduled list
				2252	* may change while processing a work, so this function repeatedly
				2253	* fetches a work from the top and executes it.
				2254	*
				2255	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2256	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2257	* multiple times.
				2258	*/
				2259	static void process_scheduled_works(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2260	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2261	while (!list_empty(&worker->scheduled)) {
				2262	struct work_struct *work = list_first_entry(&worker->scheduled,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2263	struct work_struct, entry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2264	process_one_work(worker, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2265	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2266	}
				2267
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2268	/**
				2269	* worker_thread - the worker thread function
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2270	* @__worker: self
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2271	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	2272	* The worker thread function. All workers belong to a worker_pool -
				2273	* either a per-cpu one or dynamic unbound one. These workers process all
				2274	* work items regardless of their specific target workqueue. The only
				2275	* exception is work items which belong to workqueues with a rescuer which
				2276	* will be explained in rescuer_thread().
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2277	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2278	static int worker_thread(void *__worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2279	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2280	struct worker *worker = __worker;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2281	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2282
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2283	/* tell the scheduler that this is a workqueue worker */
				2284	worker->task->flags |= PF_WQ_WORKER;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2285	woke_up:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2286	spin_lock_irq(&pool->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2287
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2288	/* we are off idle list if destruction or rebind is requested */
				2289	if (unlikely(list_empty(&worker->entry))) {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2290	spin_unlock_irq(&pool->lock);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2291
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2292	/* if DIE is set, destruction is requested */
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2293	if (worker->flags & WORKER_DIE) {
				2294	worker->task->flags &= ~PF_WQ_WORKER;
				2295	return 0;
				2296	}
				2297
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2298	/* otherwise, rebind */
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2299	idle_worker_rebind(worker);
				2300	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2301	}
				2302
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2303	worker_leave_idle(worker);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	2304	recheck:
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2305	/* no more worker necessary? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2306	if (!need_more_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2307	goto sleep;
				2308
				2309	/* do we need to manage? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2310	if (unlikely(!may_start_working(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2311	goto recheck;
				2312
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2313	/*
				2314	* ->scheduled list can only be filled while a worker is
				2315	* preparing to process a work or actually processing it.
				2316	* Make sure nobody diddled with it while I was sleeping.
				2317	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2318	WARN_ON_ONCE(!list_empty(&worker->scheduled));
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2319
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2320	/*
				2321	* When control reaches this point, we're guaranteed to have
				2322	* at least one idle worker or that someone else has already
				2323	* assumed the manager role.
				2324	*/
				2325	worker_clr_flags(worker, WORKER_PREP);
				2326
				2327	do {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2328	struct work_struct *work =
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2329	list_first_entry(&pool->worklist,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2330	struct work_struct, entry);
				2331
				2332	if (likely(!(*work_data_bits(work) & WORK_STRUCT_LINKED))) {
				2333	/* optimization path, not strictly necessary */
				2334	process_one_work(worker, work);
				2335	if (unlikely(!list_empty(&worker->scheduled)))
				2336	process_scheduled_works(worker);
				2337	} else {
				2338	move_linked_works(work, &worker->scheduled, NULL);
				2339	process_scheduled_works(worker);
				2340	}
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2341	} while (keep_working(pool));
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2342
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2343	worker_set_flags(worker, WORKER_PREP, false);
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2344	sleep:
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2345	if (unlikely(need_to_manage_workers(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2346	goto recheck;
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2347
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2348	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2349	* pool->lock is held and there's no work to process and no need to
				2350	* manage, sleep. Workers are woken up only while holding
				2351	* pool->lock or from local cpu, so setting the current state
				2352	* before releasing pool->lock is enough to prevent losing any
				2353	* event.
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2354	*/
				2355	worker_enter_idle(worker);
				2356	__set_current_state(TASK_INTERRUPTIBLE);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2357	spin_unlock_irq(&pool->lock);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2358	schedule();
				2359	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2360	}
				2361
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2362	/**
				2363	* rescuer_thread - the rescuer thread function
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2364	* @__rescuer: self
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2365	*
				2366	* Workqueue rescuer thread function. There's one rescuer for each
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	2367	* workqueue which has WQ_MEM_RECLAIM set.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2368	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2369	* Regular work processing on a pool may block trying to create a new
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2370	* worker which uses GFP_KERNEL allocation which has slight chance of
				2371	* developing into deadlock if some works currently on the same queue
				2372	* need to be processed to satisfy the GFP_KERNEL allocation. This is
				2373	* the problem rescuer solves.
				2374	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2375	* When such condition is possible, the pool summons rescuers of all
				2376	* workqueues which have works queued on the pool and let them process
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2377	* those works so that forward progress can be guaranteed.
				2378	*
				2379	* This should happen rarely.
				2380	*/
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2381	static int rescuer_thread(void *__rescuer)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2382	{
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2383	struct worker *rescuer = __rescuer;
				2384	struct workqueue_struct *wq = rescuer->rescue_wq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2385	struct list_head *scheduled = &rescuer->scheduled;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2386
				2387	set_user_nice(current, RESCUER_NICE_LEVEL);
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2388
				2389	/*
				2390	* Mark rescuer as worker too. As WORKER_PREP is never cleared, it
				2391	* doesn't participate in concurrency management.
				2392	*/
				2393	rescuer->task->flags |= PF_WQ_WORKER;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2394	repeat:
				2395	set_current_state(TASK_INTERRUPTIBLE);
				2396
Mike Galbraith	412d32e	2012-11-28 07:17:18 +0100	[diff] [blame]	2397	if (kthread_should_stop()) {
				2398	__set_current_state(TASK_RUNNING);
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2399	rescuer->task->flags &= ~PF_WQ_WORKER;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2400	return 0;
Mike Galbraith	412d32e	2012-11-28 07:17:18 +0100	[diff] [blame]	2401	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2402
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2403	/* see whether any pwq is asking for help */
				2404	spin_lock_irq(&workqueue_lock);
				2405
				2406	while (!list_empty(&wq->maydays)) {
				2407	struct pool_workqueue *pwq = list_first_entry(&wq->maydays,
				2408	struct pool_workqueue, mayday_node);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2409	struct worker_pool *pool = pwq->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2410	struct work_struct *work, *n;
				2411
				2412	__set_current_state(TASK_RUNNING);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2413	list_del_init(&pwq->mayday_node);
				2414
				2415	spin_unlock_irq(&workqueue_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2416
				2417	/* migrate to the target cpu if possible */
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	2418	worker_maybe_bind_and_lock(pool);
Lai Jiangshan	b310410	2013-02-19 12:17:02 -0800	[diff] [blame]	2419	rescuer->pool = pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2420
				2421	/*
				2422	* Slurp in all works issued via this workqueue and
				2423	* process'em.
				2424	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2425	WARN_ON_ONCE(!list_empty(&rescuer->scheduled));
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2426	list_for_each_entry_safe(work, n, &pool->worklist, entry)
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2427	if (get_work_pwq(work) == pwq)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2428	move_linked_works(work, scheduled, &n);
				2429
				2430	process_scheduled_works(rescuer);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2431
				2432	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2433	* Leave this pool. If keep_working() is %true, notify a
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2434	* regular worker; otherwise, we end up with 0 concurrency
				2435	* and stalling the execution.
				2436	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2437	if (keep_working(pool))
				2438	wake_up_worker(pool);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2439
Lai Jiangshan	b310410	2013-02-19 12:17:02 -0800	[diff] [blame]	2440	rescuer->pool = NULL;
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2441	spin_unlock(&pool->lock);
				2442	spin_lock(&workqueue_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2443	}
				2444
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2445	spin_unlock_irq(&workqueue_lock);
				2446
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2447	/* rescuers should never participate in concurrency management */
				2448	WARN_ON_ONCE(!(rescuer->flags & WORKER_NOT_RUNNING));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2449	schedule();
				2450	goto repeat;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2451	}
				2452
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2453	struct wq_barrier {
				2454	struct work_struct work;
				2455	struct completion done;
				2456	};
				2457
				2458	static void wq_barrier_func(struct work_struct *work)
				2459	{
				2460	struct wq_barrier *barr = container_of(work, struct wq_barrier, work);
				2461	complete(&barr->done);
				2462	}
				2463
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2464	/**
				2465	* insert_wq_barrier - insert a barrier work
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2466	* @pwq: pwq to insert barrier into
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2467	* @barr: wq_barrier to insert
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2468	* @target: target work to attach @barr to
				2469	* @worker: worker currently executing @target, NULL if @target is not executing
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2470	*
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2471	* @barr is linked to @target such that @barr is completed only after
				2472	* @target finishes execution. Please note that the ordering
				2473	* guarantee is observed only with respect to @target and on the local
				2474	* cpu.
				2475	*
				2476	* Currently, a queued barrier can't be canceled. This is because
				2477	* try_to_grab_pending() can't determine whether the work to be
				2478	* grabbed is at the head of the queue and thus can't clear LINKED
				2479	* flag of the previous work while there must be a valid next work
				2480	* after a work with LINKED flag set.
				2481	*
				2482	* Note that when @worker is non-NULL, @target may be modified
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2483	* underneath us, so we can't reliably determine pwq from @target.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2484	*
				2485	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2486	* spin_lock_irq(pool->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2487	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2488	static void insert_wq_barrier(struct pool_workqueue *pwq,
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2489	struct wq_barrier *barr,
				2490	struct work_struct *target, struct worker *worker)
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2491	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2492	struct list_head *head;
				2493	unsigned int linked = 0;
				2494
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2495	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2496	* debugobject calls are safe here even with pool->lock locked
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2497	* as we know for sure that this will not trigger any of the
				2498	* checks and call back into the fixup functions where we
				2499	* might deadlock.
				2500	*/
Andrew Morton	ca1cab3	2010-10-26 14:22:34 -0700	[diff] [blame]	2501	INIT_WORK_ONSTACK(&barr->work, wq_barrier_func);
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2502	__set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(&barr->work));
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2503	init_completion(&barr->done);
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2504
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2505	/*
				2506	* If @target is currently being executed, schedule the
				2507	* barrier to the worker; otherwise, put it after @target.
				2508	*/
				2509	if (worker)
				2510	head = worker->scheduled.next;
				2511	else {
				2512	unsigned long *bits = work_data_bits(target);
				2513
				2514	head = target->entry.next;
				2515	/* there can already be other linked works, inherit and set */
				2516	linked = *bits & WORK_STRUCT_LINKED;
				2517	__set_bit(WORK_STRUCT_LINKED_BIT, bits);
				2518	}
				2519
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2520	debug_work_activate(&barr->work);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2521	insert_work(pwq, &barr->work, head,
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2522	work_color_to_flags(WORK_NO_COLOR) \| linked);
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2523	}
				2524
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2525	/**
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2526	* flush_workqueue_prep_pwqs - prepare pwqs for workqueue flushing
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2527	* @wq: workqueue being flushed
				2528	* @flush_color: new flush color, < 0 for no-op
				2529	* @work_color: new work color, < 0 for no-op
				2530	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2531	* Prepare pwqs for workqueue flushing.
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2532	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2533	* If @flush_color is non-negative, flush_color on all pwqs should be
				2534	* -1. If no pwq has in-flight commands at the specified color, all
				2535	* pwq->flush_color's stay at -1 and %false is returned. If any pwq
				2536	* has in flight commands, its pwq->flush_color is set to
				2537	* @flush_color, @wq->nr_pwqs_to_flush is updated accordingly, pwq
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2538	* wakeup logic is armed and %true is returned.
				2539	*
				2540	* The caller should have initialized @wq->first_flusher prior to
				2541	* calling this function with non-negative @flush_color. If
				2542	* @flush_color is negative, no flush color update is done and %false
				2543	* is returned.
				2544	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2545	* If @work_color is non-negative, all pwqs should have the same
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2546	* work_color which is previous to @work_color and all will be
				2547	* advanced to @work_color.
				2548	*
				2549	* CONTEXT:
				2550	* mutex_lock(wq->flush_mutex).
				2551	*
				2552	* RETURNS:
				2553	* %true if @flush_color >= 0 and there's something to flush. %false
				2554	* otherwise.
				2555	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2556	static bool flush_workqueue_prep_pwqs(struct workqueue_struct *wq,
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2557	int flush_color, int work_color)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2558	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2559	bool wait = false;
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2560	struct pool_workqueue *pwq;
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2561
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2562	if (flush_color >= 0) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2563	WARN_ON_ONCE(atomic_read(&wq->nr_pwqs_to_flush));
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2564	atomic_set(&wq->nr_pwqs_to_flush, 1);
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2565	}
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2566
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2567	local_irq_disable();
				2568
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2569	for_each_pwq(pwq, wq) {
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2570	struct worker_pool *pool = pwq->pool;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2571
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2572	spin_lock(&pool->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2573
				2574	if (flush_color >= 0) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2575	WARN_ON_ONCE(pwq->flush_color != -1);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2576
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2577	if (pwq->nr_in_flight[flush_color]) {
				2578	pwq->flush_color = flush_color;
				2579	atomic_inc(&wq->nr_pwqs_to_flush);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2580	wait = true;
				2581	}
				2582	}
				2583
				2584	if (work_color >= 0) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2585	WARN_ON_ONCE(work_color != work_next_color(pwq->work_color));
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2586	pwq->work_color = work_color;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2587	}
				2588
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2589	spin_unlock(&pool->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2590	}
				2591
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2592	local_irq_enable();
				2593
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2594	if (flush_color >= 0 && atomic_dec_and_test(&wq->nr_pwqs_to_flush))
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2595	complete(&wq->first_flusher->done);
				2596
				2597	return wait;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2598	}
				2599
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2600	/**
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2601	* flush_workqueue - ensure that any scheduled work has run to completion.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2602	* @wq: workqueue to flush
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2603	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	2604	* This function sleeps until all work items which were queued on entry
				2605	* have finished execution, but it is not livelocked by new incoming ones.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2606	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2607	void flush_workqueue(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2608	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2609	struct wq_flusher this_flusher = {
				2610	.list = LIST_HEAD_INIT(this_flusher.list),
				2611	.flush_color = -1,
				2612	.done = COMPLETION_INITIALIZER_ONSTACK(this_flusher.done),
				2613	};
				2614	int next_color;
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	2615
Ingo Molnar	3295f0e	2008-08-11 10:30:30 +0200	[diff] [blame]	2616	lock_map_acquire(&wq->lockdep_map);
				2617	lock_map_release(&wq->lockdep_map);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2618
				2619	mutex_lock(&wq->flush_mutex);
				2620
				2621	/*
				2622	* Start-to-wait phase
				2623	*/
				2624	next_color = work_next_color(wq->work_color);
				2625
				2626	if (next_color != wq->flush_color) {
				2627	/*
				2628	* Color space is not full. The current work_color
				2629	* becomes our flush_color and work_color is advanced
				2630	* by one.
				2631	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2632	WARN_ON_ONCE(!list_empty(&wq->flusher_overflow));
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2633	this_flusher.flush_color = wq->work_color;
				2634	wq->work_color = next_color;
				2635
				2636	if (!wq->first_flusher) {
				2637	/* no flush in progress, become the first flusher */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2638	WARN_ON_ONCE(wq->flush_color != this_flusher.flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2639
				2640	wq->first_flusher = &this_flusher;
				2641
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2642	if (!flush_workqueue_prep_pwqs(wq, wq->flush_color,
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2643	wq->work_color)) {
				2644	/* nothing to flush, done */
				2645	wq->flush_color = next_color;
				2646	wq->first_flusher = NULL;
				2647	goto out_unlock;
				2648	}
				2649	} else {
				2650	/* wait in queue */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2651	WARN_ON_ONCE(wq->flush_color == this_flusher.flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2652	list_add_tail(&this_flusher.list, &wq->flusher_queue);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2653	flush_workqueue_prep_pwqs(wq, -1, wq->work_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2654	}
				2655	} else {
				2656	/*
				2657	* Oops, color space is full, wait on overflow queue.
				2658	* The next flush completion will assign us
				2659	* flush_color and transfer to flusher_queue.
				2660	*/
				2661	list_add_tail(&this_flusher.list, &wq->flusher_overflow);
				2662	}
				2663
				2664	mutex_unlock(&wq->flush_mutex);
				2665
				2666	wait_for_completion(&this_flusher.done);
				2667
				2668	/*
				2669	* Wake-up-and-cascade phase
				2670	*
				2671	* First flushers are responsible for cascading flushes and
				2672	* handling overflow. Non-first flushers can simply return.
				2673	*/
				2674	if (wq->first_flusher != &this_flusher)
				2675	return;
				2676
				2677	mutex_lock(&wq->flush_mutex);
				2678
Tejun Heo	4ce48b3	2010-07-02 10:03:51 +0200	[diff] [blame]	2679	/* we might have raced, check again with mutex held */
				2680	if (wq->first_flusher != &this_flusher)
				2681	goto out_unlock;
				2682
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2683	wq->first_flusher = NULL;
				2684
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2685	WARN_ON_ONCE(!list_empty(&this_flusher.list));
				2686	WARN_ON_ONCE(wq->flush_color != this_flusher.flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2687
				2688	while (true) {
				2689	struct wq_flusher next, tmp;
				2690
				2691	/* complete all the flushers sharing the current flush color */
				2692	list_for_each_entry_safe(next, tmp, &wq->flusher_queue, list) {
				2693	if (next->flush_color != wq->flush_color)
				2694	break;
				2695	list_del_init(&next->list);
				2696	complete(&next->done);
				2697	}
				2698
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2699	WARN_ON_ONCE(!list_empty(&wq->flusher_overflow) &&
				2700	wq->flush_color != work_next_color(wq->work_color));
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2701
				2702	/* this flush_color is finished, advance by one */
				2703	wq->flush_color = work_next_color(wq->flush_color);
				2704
				2705	/* one color has been freed, handle overflow queue */
				2706	if (!list_empty(&wq->flusher_overflow)) {
				2707	/*
				2708	* Assign the same color to all overflowed
				2709	* flushers, advance work_color and append to
				2710	* flusher_queue. This is the start-to-wait
				2711	* phase for these overflowed flushers.
				2712	*/
				2713	list_for_each_entry(tmp, &wq->flusher_overflow, list)
				2714	tmp->flush_color = wq->work_color;
				2715
				2716	wq->work_color = work_next_color(wq->work_color);
				2717
				2718	list_splice_tail_init(&wq->flusher_overflow,
				2719	&wq->flusher_queue);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2720	flush_workqueue_prep_pwqs(wq, -1, wq->work_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2721	}
				2722
				2723	if (list_empty(&wq->flusher_queue)) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2724	WARN_ON_ONCE(wq->flush_color != wq->work_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2725	break;
				2726	}
				2727
				2728	/*
				2729	* Need to flush more colors. Make the next flusher
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2730	* the new first flusher and arm pwqs.
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2731	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2732	WARN_ON_ONCE(wq->flush_color == wq->work_color);
				2733	WARN_ON_ONCE(wq->flush_color != next->flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2734
				2735	list_del_init(&next->list);
				2736	wq->first_flusher = next;
				2737
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2738	if (flush_workqueue_prep_pwqs(wq, wq->flush_color, -1))
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2739	break;
				2740
				2741	/*
				2742	* Meh... this color is already done, clear first
				2743	* flusher and repeat cascading.
				2744	*/
				2745	wq->first_flusher = NULL;
				2746	}
				2747
				2748	out_unlock:
				2749	mutex_unlock(&wq->flush_mutex);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2750	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2751	EXPORT_SYMBOL_GPL(flush_workqueue);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2752
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2753	/**
				2754	* drain_workqueue - drain a workqueue
				2755	* @wq: workqueue to drain
				2756	*
				2757	* Wait until the workqueue becomes empty. While draining is in progress,
				2758	* only chain queueing is allowed. IOW, only currently pending or running
				2759	* work items on @wq can queue further work items on it. @wq is flushed
				2760	* repeatedly until it becomes empty. The number of flushing is detemined
				2761	* by the depth of chaining and should be relatively short. Whine if it
				2762	* takes too long.
				2763	*/
				2764	void drain_workqueue(struct workqueue_struct *wq)
				2765	{
				2766	unsigned int flush_cnt = 0;
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2767	struct pool_workqueue *pwq;
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2768
				2769	/*
				2770	* __queue_work() needs to test whether there are drainers, is much
				2771	* hotter than drain_workqueue() and already looks at @wq->flags.
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	2772	* Use __WQ_DRAINING so that queue doesn't have to check nr_drainers.
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2773	*/
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	2774	spin_lock_irq(&workqueue_lock);
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2775	if (!wq->nr_drainers++)
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	2776	wq->flags \|= __WQ_DRAINING;
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	2777	spin_unlock_irq(&workqueue_lock);
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2778	reflush:
				2779	flush_workqueue(wq);
				2780
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2781	local_irq_disable();
				2782
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2783	for_each_pwq(pwq, wq) {
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2784	bool drained;
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2785
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2786	spin_lock(&pwq->pool->lock);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2787	drained = !pwq->nr_active && list_empty(&pwq->delayed_works);
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2788	spin_unlock(&pwq->pool->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2789
				2790	if (drained)
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2791	continue;
				2792
				2793	if (++flush_cnt == 10 \|\|
				2794	(flush_cnt % 100 == 0 && flush_cnt <= 1000))
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	2795	pr_warn("workqueue %s: drain_workqueue() isn't complete after %u tries\n",
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	2796	wq->name, flush_cnt);
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2797
				2798	local_irq_enable();
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2799	goto reflush;
				2800	}
				2801
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2802	spin_lock(&workqueue_lock);
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2803	if (!--wq->nr_drainers)
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	2804	wq->flags &= ~__WQ_DRAINING;
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2805	spin_unlock(&workqueue_lock);
				2806
				2807	local_irq_enable();
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2808	}
				2809	EXPORT_SYMBOL_GPL(drain_workqueue);
				2810
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2811	static bool start_flush_work(struct work_struct work, struct wq_barrier barr)
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2812	{
				2813	struct worker *worker = NULL;
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2814	struct worker_pool *pool;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2815	struct pool_workqueue *pwq;
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2816
				2817	might_sleep();
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2818
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	2819	local_irq_disable();
				2820	pool = get_work_pool(work);
				2821	if (!pool) {
				2822	local_irq_enable();
				2823	return false;
				2824	}
				2825
				2826	spin_lock(&pool->lock);
Lai Jiangshan	0b3dae6	2013-02-06 18:04:53 -0800	[diff] [blame]	2827	/* see the comment in try_to_grab_pending() with the same code */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2828	pwq = get_work_pwq(work);
				2829	if (pwq) {
				2830	if (unlikely(pwq->pool != pool))
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2831	goto already_gone;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2832	} else {
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2833	worker = find_worker_executing_work(pool, work);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2834	if (!worker)
				2835	goto already_gone;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2836	pwq = worker->current_pwq;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2837	}
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2838
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2839	insert_wq_barrier(pwq, barr, work, worker);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2840	spin_unlock_irq(&pool->lock);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2841
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2842	/*
				2843	* If @max_active is 1 or rescuer is in use, flushing another work
				2844	* item on the same workqueue may lead to deadlock. Make sure the
				2845	* flusher is not running on the same workqueue by verifying write
				2846	* access.
				2847	*/
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	2848	if (pwq->wq->saved_max_active == 1 \|\| pwq->wq->rescuer)
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2849	lock_map_acquire(&pwq->wq->lockdep_map);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2850	else
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2851	lock_map_acquire_read(&pwq->wq->lockdep_map);
				2852	lock_map_release(&pwq->wq->lockdep_map);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2853
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2854	return true;
				2855	already_gone:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2856	spin_unlock_irq(&pool->lock);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2857	return false;
				2858	}
				2859
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2860	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2861	* flush_work - wait for a work to finish executing the last queueing instance
				2862	* @work: the work to flush
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2863	*
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2864	* Wait until @work has finished execution. @work is guaranteed to be idle
				2865	* on return if it hasn't been requeued since flush started.
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2866	*
				2867	* RETURNS:
				2868	* %true if flush_work() waited for the work to finish execution,
				2869	* %false if it was already idle.
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2870	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2871	bool flush_work(struct work_struct *work)
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2872	{
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2873	struct wq_barrier barr;
				2874
Stephen Boyd	0976dfc	2012-04-20 17:28:50 -0700	[diff] [blame]	2875	lock_map_acquire(&work->lockdep_map);
				2876	lock_map_release(&work->lockdep_map);
				2877
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2878	if (start_flush_work(work, &barr)) {
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2879	wait_for_completion(&barr.done);
				2880	destroy_work_on_stack(&barr.work);
				2881	return true;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2882	} else {
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2883	return false;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2884	}
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2885	}
				2886	EXPORT_SYMBOL_GPL(flush_work);
				2887
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	2888	static bool __cancel_work_timer(struct work_struct *work, bool is_dwork)
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2889	{
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	2890	unsigned long flags;
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2891	int ret;
				2892
				2893	do {
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	2894	ret = try_to_grab_pending(work, is_dwork, &flags);
				2895	/*
				2896	* If someone else is canceling, wait for the same event it
				2897	* would be waiting for before retrying.
				2898	*/
				2899	if (unlikely(ret == -ENOENT))
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2900	flush_work(work);
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2901	} while (unlikely(ret < 0));
				2902
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	2903	/* tell other tasks trying to grab @work to back off */
				2904	mark_work_canceling(work);
				2905	local_irq_restore(flags);
				2906
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2907	flush_work(work);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2908	clear_work_data(work);
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2909	return ret;
				2910	}
				2911
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2912	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2913	* cancel_work_sync - cancel a work and wait for it to finish
				2914	* @work: the work to cancel
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2915	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2916	* Cancel @work and wait for its execution to finish. This function
				2917	* can be used even if the work re-queues itself or migrates to
				2918	* another workqueue. On return from this function, @work is
				2919	* guaranteed to be not pending or executing on any CPU.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2920	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2921	* cancel_work_sync(&delayed_work->work) must not be used for
				2922	* delayed_work's. Use cancel_delayed_work_sync() instead.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2923	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2924	* The caller must ensure that the workqueue on which @work was last
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2925	* queued can't be destroyed before this function returns.
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2926	*
				2927	* RETURNS:
				2928	* %true if @work was pending, %false otherwise.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2929	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2930	bool cancel_work_sync(struct work_struct *work)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2931	{
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	2932	return __cancel_work_timer(work, false);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2933	}
Oleg Nesterov	28e53bd	2007-05-09 02:34:22 -0700	[diff] [blame]	2934	EXPORT_SYMBOL_GPL(cancel_work_sync);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2935
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2936	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2937	* flush_delayed_work - wait for a dwork to finish executing the last queueing
				2938	* @dwork: the delayed work to flush
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2939	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2940	* Delayed timer is cancelled and the pending work is queued for
				2941	* immediate execution. Like flush_work(), this function only
				2942	* considers the last queueing instance of @dwork.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2943	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2944	* RETURNS:
				2945	* %true if flush_work() waited for the work to finish execution,
				2946	* %false if it was already idle.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2947	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2948	bool flush_delayed_work(struct delayed_work *dwork)
				2949	{
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2950	local_irq_disable();
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2951	if (del_timer_sync(&dwork->timer))
Lai Jiangshan	60c057b	2013-02-06 18:04:53 -0800	[diff] [blame]	2952	__queue_work(dwork->cpu, dwork->wq, &dwork->work);
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2953	local_irq_enable();
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2954	return flush_work(&dwork->work);
				2955	}
				2956	EXPORT_SYMBOL(flush_delayed_work);
				2957
				2958	/**
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2959	* cancel_delayed_work - cancel a delayed work
				2960	* @dwork: delayed_work to cancel
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2961	*
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2962	* Kill off a pending delayed_work. Returns %true if @dwork was pending
				2963	* and canceled; %false if wasn't pending. Note that the work callback
				2964	* function may still be running on return, unless it returns %true and the
				2965	* work doesn't re-arm itself. Explicitly flush or use
				2966	* cancel_delayed_work_sync() to wait on it.
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2967	*
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2968	* This function is safe to call from any context including IRQ handler.
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2969	*/
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2970	bool cancel_delayed_work(struct delayed_work *dwork)
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2971	{
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2972	unsigned long flags;
				2973	int ret;
				2974
				2975	do {
				2976	ret = try_to_grab_pending(&dwork->work, true, &flags);
				2977	} while (unlikely(ret == -EAGAIN));
				2978
				2979	if (unlikely(ret < 0))
				2980	return false;
				2981
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	2982	set_work_pool_and_clear_pending(&dwork->work,
				2983	get_work_pool_id(&dwork->work));
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2984	local_irq_restore(flags);
Dan Magenheimer	c0158ca	2012-10-18 16:31:37 -0700	[diff] [blame]	2985	return ret;
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2986	}
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2987	EXPORT_SYMBOL(cancel_delayed_work);
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2988
				2989	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2990	* cancel_delayed_work_sync - cancel a delayed work and wait for it to finish
				2991	* @dwork: the delayed work cancel
				2992	*
				2993	* This is cancel_work_sync() for delayed works.
				2994	*
				2995	* RETURNS:
				2996	* %true if @dwork was pending, %false otherwise.
				2997	*/
				2998	bool cancel_delayed_work_sync(struct delayed_work *dwork)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2999	{
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	3000	return __cancel_work_timer(&dwork->work, true);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	3001	}
Oleg Nesterov	f5a421a	2007-07-15 23:41:44 -0700	[diff] [blame]	3002	EXPORT_SYMBOL(cancel_delayed_work_sync);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3003
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	3004	/**
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	3005	* schedule_work_on - put work task on a specific cpu
				3006	* @cpu: cpu to put the work task on
				3007	* @work: job to be done
				3008	*
				3009	* This puts a job on a specific cpu
				3010	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	3011	bool schedule_work_on(int cpu, struct work_struct *work)
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	3012	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3013	return queue_work_on(cpu, system_wq, work);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	3014	}
				3015	EXPORT_SYMBOL(schedule_work_on);
				3016
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	3017	/**
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	3018	* schedule_work - put work task in global workqueue
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3019	* @work: job to be done
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3020	*
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	3021	* Returns %false if @work was already on the kernel-global workqueue and
				3022	* %true otherwise.
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	3023	*
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	3024	* This puts a job in the kernel-global workqueue if it was not already
				3025	* queued and leaves it in the same position on the kernel-global
				3026	* workqueue otherwise.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3027	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	3028	bool schedule_work(struct work_struct *work)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3029	{
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	3030	return queue_work(system_wq, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3031	}
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	3032	EXPORT_SYMBOL(schedule_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3033
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	3034	/**
				3035	* schedule_delayed_work_on - queue work in global workqueue on CPU after delay
				3036	* @cpu: cpu to use
				3037	* @dwork: job to be done
				3038	* @delay: number of jiffies to wait
				3039	*
				3040	* After waiting for a given time this puts a job in the kernel-global
				3041	* workqueue on the specified CPU.
				3042	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	3043	bool schedule_delayed_work_on(int cpu, struct delayed_work *dwork,
				3044	unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3045	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3046	return queue_delayed_work_on(cpu, system_wq, dwork, delay);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3047	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	3048	EXPORT_SYMBOL(schedule_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3049
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3050	/**
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	3051	* schedule_delayed_work - put work task in global workqueue after delay
				3052	* @dwork: job to be done
				3053	* @delay: number of jiffies to wait or 0 for immediate execution
				3054	*
				3055	* After waiting for a given time this puts a job in the kernel-global
				3056	* workqueue.
				3057	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	3058	bool schedule_delayed_work(struct delayed_work *dwork, unsigned long delay)
Tejun Heo	0a13c00	2012-08-03 10:30:44 -0700	[diff] [blame]	3059	{
				3060	return queue_delayed_work(system_wq, dwork, delay);
				3061	}
				3062	EXPORT_SYMBOL(schedule_delayed_work);
				3063
				3064	/**
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	3065	* schedule_on_each_cpu - execute a function synchronously on each online CPU
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3066	* @func: the function to call
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3067	*
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	3068	* schedule_on_each_cpu() executes @func on each online CPU using the
				3069	* system workqueue and blocks until all CPUs have completed.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3070	* schedule_on_each_cpu() is very slow.
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	3071	*
				3072	* RETURNS:
				3073	* 0 on success, -errno on failure.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3074	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3075	int schedule_on_each_cpu(work_func_t func)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	3076	{
				3077	int cpu;
Namhyung Kim	38f5156	2010-08-08 14:24:09 +0200	[diff] [blame]	3078	struct work_struct __percpu *works;
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	3079
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3080	works = alloc_percpu(struct work_struct);
				3081	if (!works)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	3082	return -ENOMEM;
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3083
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3084	get_online_cpus();
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	3085
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	3086	for_each_online_cpu(cpu) {
Ingo Molnar	9bfb183	2006-12-18 20:05:09 +0100	[diff] [blame]	3087	struct work_struct *work = per_cpu_ptr(works, cpu);
				3088
				3089	INIT_WORK(work, func);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3090	schedule_work_on(cpu, work);
Andi Kleen	65a6446	2009-10-14 06:22:47 +0200	[diff] [blame]	3091	}
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	3092
				3093	for_each_online_cpu(cpu)
				3094	flush_work(per_cpu_ptr(works, cpu));
				3095
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3096	put_online_cpus();
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3097	free_percpu(works);
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	3098	return 0;
				3099	}
				3100
Alan Stern	eef6a7d	2010-02-12 17:39:21 +0900	[diff] [blame]	3101	/**
				3102	* flush_scheduled_work - ensure that any scheduled work has run to completion.
				3103	*
				3104	* Forces execution of the kernel-global workqueue and blocks until its
				3105	* completion.
				3106	*
				3107	* Think twice before calling this function! It's very easy to get into
				3108	* trouble if you don't take great care. Either of the following situations
				3109	* will lead to deadlock:
				3110	*
				3111	* One of the work items currently on the workqueue needs to acquire
				3112	* a lock held by your code or its caller.
				3113	*
				3114	* Your code is running in the context of a work routine.
				3115	*
				3116	* They will be detected by lockdep when they occur, but the first might not
				3117	* occur very often. It depends on what work items are on the workqueue and
				3118	* what locks they need, which you have no control over.
				3119	*
				3120	* In most situations flushing the entire workqueue is overkill; you merely
				3121	* need to know that a particular work item isn't queued and isn't running.
				3122	* In such cases you should use cancel_delayed_work_sync() or
				3123	* cancel_work_sync() instead.
				3124	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3125	void flush_scheduled_work(void)
				3126	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3127	flush_workqueue(system_wq);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3128	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	3129	EXPORT_SYMBOL(flush_scheduled_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3130
				3131	/**
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3132	* execute_in_process_context - reliably execute the routine with user context
				3133	* @fn: the function to execute
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3134	* @ew: guaranteed storage for the execute work structure (must
				3135	* be available when the work executes)
				3136	*
				3137	* Executes the function immediately if process context is available,
				3138	* otherwise schedules the function for delayed execution.
				3139	*
				3140	* Returns: 0 - function was executed
				3141	* 1 - function was scheduled for execution
				3142	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3143	int execute_in_process_context(work_func_t fn, struct execute_work *ew)
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3144	{
				3145	if (!in_interrupt()) {
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3146	fn(&ew->work);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3147	return 0;
				3148	}
				3149
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3150	INIT_WORK(&ew->work, fn);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3151	schedule_work(&ew->work);
				3152
				3153	return 1;
				3154	}
				3155	EXPORT_SYMBOL_GPL(execute_in_process_context);
				3156
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3157	int keventd_up(void)
				3158	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3159	return system_wq != NULL;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3160	}
				3161
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	3162	#ifdef CONFIG_SYSFS
				3163	/*
				3164	* Workqueues with WQ_SYSFS flag set is visible to userland via
				3165	* /sys/bus/workqueue/devices/WQ_NAME. All visible workqueues have the
				3166	* following attributes.
				3167	*
				3168	* per_cpu RO bool : whether the workqueue is per-cpu or unbound
				3169	* max_active RW int : maximum number of in-flight work items
				3170	*
				3171	* Unbound workqueues have the following extra attributes.
				3172	*
				3173	* id RO int : the associated pool ID
				3174	* nice RW int : nice value of the workers
				3175	* cpumask RW mask : bitmask of allowed CPUs for the workers
				3176	*/
				3177	struct wq_device {
				3178	struct workqueue_struct *wq;
				3179	struct device dev;
				3180	};
				3181
				3182	static struct workqueue_struct dev_to_wq(struct device dev)
				3183	{
				3184	struct wq_device *wq_dev = container_of(dev, struct wq_device, dev);
				3185
				3186	return wq_dev->wq;
				3187	}
				3188
				3189	static ssize_t wq_per_cpu_show(struct device *dev,
				3190	struct device_attribute attr, char buf)
				3191	{
				3192	struct workqueue_struct *wq = dev_to_wq(dev);
				3193
				3194	return scnprintf(buf, PAGE_SIZE, "%d\n", (bool)!(wq->flags & WQ_UNBOUND));
				3195	}
				3196
				3197	static ssize_t wq_max_active_show(struct device *dev,
				3198	struct device_attribute attr, char buf)
				3199	{
				3200	struct workqueue_struct *wq = dev_to_wq(dev);
				3201
				3202	return scnprintf(buf, PAGE_SIZE, "%d\n", wq->saved_max_active);
				3203	}
				3204
				3205	static ssize_t wq_max_active_store(struct device *dev,
				3206	struct device_attribute *attr,
				3207	const char *buf, size_t count)
				3208	{
				3209	struct workqueue_struct *wq = dev_to_wq(dev);
				3210	int val;
				3211
				3212	if (sscanf(buf, "%d", &val) != 1 \|\| val <= 0)
				3213	return -EINVAL;
				3214
				3215	workqueue_set_max_active(wq, val);
				3216	return count;
				3217	}
				3218
				3219	static struct device_attribute wq_sysfs_attrs[] = {
				3220	__ATTR(per_cpu, 0444, wq_per_cpu_show, NULL),
				3221	__ATTR(max_active, 0644, wq_max_active_show, wq_max_active_store),
				3222	__ATTR_NULL,
				3223	};
				3224
				3225	static ssize_t wq_pool_id_show(struct device *dev,
				3226	struct device_attribute attr, char buf)
				3227	{
				3228	struct workqueue_struct *wq = dev_to_wq(dev);
				3229	struct worker_pool *pool;
				3230	int written;
				3231
				3232	rcu_read_lock_sched();
				3233	pool = first_pwq(wq)->pool;
				3234	written = scnprintf(buf, PAGE_SIZE, "%d\n", pool->id);
				3235	rcu_read_unlock_sched();
				3236
				3237	return written;
				3238	}
				3239
				3240	static ssize_t wq_nice_show(struct device dev, struct device_attribute attr,
				3241	char *buf)
				3242	{
				3243	struct workqueue_struct *wq = dev_to_wq(dev);
				3244	int written;
				3245
				3246	rcu_read_lock_sched();
				3247	written = scnprintf(buf, PAGE_SIZE, "%d\n",
				3248	first_pwq(wq)->pool->attrs->nice);
				3249	rcu_read_unlock_sched();
				3250
				3251	return written;
				3252	}
				3253
				3254	/* prepare workqueue_attrs for sysfs store operations */
				3255	static struct workqueue_attrs wq_sysfs_prep_attrs(struct workqueue_struct wq)
				3256	{
				3257	struct workqueue_attrs *attrs;
				3258
				3259	attrs = alloc_workqueue_attrs(GFP_KERNEL);
				3260	if (!attrs)
				3261	return NULL;
				3262
				3263	rcu_read_lock_sched();
				3264	copy_workqueue_attrs(attrs, first_pwq(wq)->pool->attrs);
				3265	rcu_read_unlock_sched();
				3266	return attrs;
				3267	}
				3268
				3269	static ssize_t wq_nice_store(struct device dev, struct device_attribute attr,
				3270	const char *buf, size_t count)
				3271	{
				3272	struct workqueue_struct *wq = dev_to_wq(dev);
				3273	struct workqueue_attrs *attrs;
				3274	int ret;
				3275
				3276	attrs = wq_sysfs_prep_attrs(wq);
				3277	if (!attrs)
				3278	return -ENOMEM;
				3279
				3280	if (sscanf(buf, "%d", &attrs->nice) == 1 &&
				3281	attrs->nice >= -20 && attrs->nice <= 19)
				3282	ret = apply_workqueue_attrs(wq, attrs);
				3283	else
				3284	ret = -EINVAL;
				3285
				3286	free_workqueue_attrs(attrs);
				3287	return ret ?: count;
				3288	}
				3289
				3290	static ssize_t wq_cpumask_show(struct device *dev,
				3291	struct device_attribute attr, char buf)
				3292	{
				3293	struct workqueue_struct *wq = dev_to_wq(dev);
				3294	int written;
				3295
				3296	rcu_read_lock_sched();
				3297	written = cpumask_scnprintf(buf, PAGE_SIZE,
				3298	first_pwq(wq)->pool->attrs->cpumask);
				3299	rcu_read_unlock_sched();
				3300
				3301	written += scnprintf(buf + written, PAGE_SIZE - written, "\n");
				3302	return written;
				3303	}
				3304
				3305	static ssize_t wq_cpumask_store(struct device *dev,
				3306	struct device_attribute *attr,
				3307	const char *buf, size_t count)
				3308	{
				3309	struct workqueue_struct *wq = dev_to_wq(dev);
				3310	struct workqueue_attrs *attrs;
				3311	int ret;
				3312
				3313	attrs = wq_sysfs_prep_attrs(wq);
				3314	if (!attrs)
				3315	return -ENOMEM;
				3316
				3317	ret = cpumask_parse(buf, attrs->cpumask);
				3318	if (!ret)
				3319	ret = apply_workqueue_attrs(wq, attrs);
				3320
				3321	free_workqueue_attrs(attrs);
				3322	return ret ?: count;
				3323	}
				3324
				3325	static struct device_attribute wq_sysfs_unbound_attrs[] = {
				3326	__ATTR(pool_id, 0444, wq_pool_id_show, NULL),
				3327	__ATTR(nice, 0644, wq_nice_show, wq_nice_store),
				3328	__ATTR(cpumask, 0644, wq_cpumask_show, wq_cpumask_store),
				3329	__ATTR_NULL,
				3330	};
				3331
				3332	static struct bus_type wq_subsys = {
				3333	.name = "workqueue",
				3334	.dev_attrs = wq_sysfs_attrs,
				3335	};
				3336
				3337	static int __init wq_sysfs_init(void)
				3338	{
				3339	return subsys_virtual_register(&wq_subsys, NULL);
				3340	}
				3341	core_initcall(wq_sysfs_init);
				3342
				3343	static void wq_device_release(struct device *dev)
				3344	{
				3345	struct wq_device *wq_dev = container_of(dev, struct wq_device, dev);
				3346
				3347	kfree(wq_dev);
				3348	}
				3349
				3350	/**
				3351	* workqueue_sysfs_register - make a workqueue visible in sysfs
				3352	* @wq: the workqueue to register
				3353	*
				3354	* Expose @wq in sysfs under /sys/bus/workqueue/devices.
				3355	* alloc_workqueue*() automatically calls this function if WQ_SYSFS is set
				3356	* which is the preferred method.
				3357	*
				3358	* Workqueue user should use this function directly iff it wants to apply
				3359	* workqueue_attrs before making the workqueue visible in sysfs; otherwise,
				3360	* apply_workqueue_attrs() may race against userland updating the
				3361	* attributes.
				3362	*
				3363	* Returns 0 on success, -errno on failure.
				3364	*/
				3365	int workqueue_sysfs_register(struct workqueue_struct *wq)
				3366	{
				3367	struct wq_device *wq_dev;
				3368	int ret;
				3369
				3370	/*
				3371	* Adjusting max_active or creating new pwqs by applyting
				3372	* attributes breaks ordering guarantee. Disallow exposing ordered
				3373	* workqueues.
				3374	*/
				3375	if (WARN_ON(wq->flags & __WQ_ORDERED))
				3376	return -EINVAL;
				3377
				3378	wq->wq_dev = wq_dev = kzalloc(sizeof(*wq_dev), GFP_KERNEL);
				3379	if (!wq_dev)
				3380	return -ENOMEM;
				3381
				3382	wq_dev->wq = wq;
				3383	wq_dev->dev.bus = &wq_subsys;
				3384	wq_dev->dev.init_name = wq->name;
				3385	wq_dev->dev.release = wq_device_release;
				3386
				3387	/*
				3388	* unbound_attrs are created separately. Suppress uevent until
				3389	* everything is ready.
				3390	*/
				3391	dev_set_uevent_suppress(&wq_dev->dev, true);
				3392
				3393	ret = device_register(&wq_dev->dev);
				3394	if (ret) {
				3395	kfree(wq_dev);
				3396	wq->wq_dev = NULL;
				3397	return ret;
				3398	}
				3399
				3400	if (wq->flags & WQ_UNBOUND) {
				3401	struct device_attribute *attr;
				3402
				3403	for (attr = wq_sysfs_unbound_attrs; attr->attr.name; attr++) {
				3404	ret = device_create_file(&wq_dev->dev, attr);
				3405	if (ret) {
				3406	device_unregister(&wq_dev->dev);
				3407	wq->wq_dev = NULL;
				3408	return ret;
				3409	}
				3410	}
				3411	}
				3412
				3413	kobject_uevent(&wq_dev->dev.kobj, KOBJ_ADD);
				3414	return 0;
				3415	}
				3416
				3417	/**
				3418	* workqueue_sysfs_unregister - undo workqueue_sysfs_register()
				3419	* @wq: the workqueue to unregister
				3420	*
				3421	* If @wq is registered to sysfs by workqueue_sysfs_register(), unregister.
				3422	*/
				3423	static void workqueue_sysfs_unregister(struct workqueue_struct *wq)
				3424	{
				3425	struct wq_device *wq_dev = wq->wq_dev;
				3426
				3427	if (!wq->wq_dev)
				3428	return;
				3429
				3430	wq->wq_dev = NULL;
				3431	device_unregister(&wq_dev->dev);
				3432	}
				3433	#else /* CONFIG_SYSFS */
				3434	static void workqueue_sysfs_unregister(struct workqueue_struct *wq) { }
				3435	#endif /* CONFIG_SYSFS */
				3436
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3437	/**
				3438	* free_workqueue_attrs - free a workqueue_attrs
				3439	* @attrs: workqueue_attrs to free
				3440	*
				3441	* Undo alloc_workqueue_attrs().
				3442	*/
				3443	void free_workqueue_attrs(struct workqueue_attrs *attrs)
				3444	{
				3445	if (attrs) {
				3446	free_cpumask_var(attrs->cpumask);
				3447	kfree(attrs);
				3448	}
				3449	}
				3450
				3451	/**
				3452	* alloc_workqueue_attrs - allocate a workqueue_attrs
				3453	* @gfp_mask: allocation mask to use
				3454	*
				3455	* Allocate a new workqueue_attrs, initialize with default settings and
				3456	* return it. Returns NULL on failure.
				3457	*/
				3458	struct workqueue_attrs *alloc_workqueue_attrs(gfp_t gfp_mask)
				3459	{
				3460	struct workqueue_attrs *attrs;
				3461
				3462	attrs = kzalloc(sizeof(*attrs), gfp_mask);
				3463	if (!attrs)
				3464	goto fail;
				3465	if (!alloc_cpumask_var(&attrs->cpumask, gfp_mask))
				3466	goto fail;
				3467
				3468	cpumask_setall(attrs->cpumask);
				3469	return attrs;
				3470	fail:
				3471	free_workqueue_attrs(attrs);
				3472	return NULL;
				3473	}
				3474
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3475	static void copy_workqueue_attrs(struct workqueue_attrs *to,
				3476	const struct workqueue_attrs *from)
				3477	{
				3478	to->nice = from->nice;
				3479	cpumask_copy(to->cpumask, from->cpumask);
				3480	}
				3481
				3482	/*
				3483	* Hacky implementation of jhash of bitmaps which only considers the
				3484	* specified number of bits. We probably want a proper implementation in
				3485	* include/linux/jhash.h.
				3486	*/
				3487	static u32 jhash_bitmap(const unsigned long *bitmap, int bits, u32 hash)
				3488	{
				3489	int nr_longs = bits / BITS_PER_LONG;
				3490	int nr_leftover = bits % BITS_PER_LONG;
				3491	unsigned long leftover = 0;
				3492
				3493	if (nr_longs)
				3494	hash = jhash(bitmap, nr_longs * sizeof(long), hash);
				3495	if (nr_leftover) {
				3496	bitmap_copy(&leftover, bitmap + nr_longs, nr_leftover);
				3497	hash = jhash(&leftover, sizeof(long), hash);
				3498	}
				3499	return hash;
				3500	}
				3501
				3502	/* hash value of the content of @attr */
				3503	static u32 wqattrs_hash(const struct workqueue_attrs *attrs)
				3504	{
				3505	u32 hash = 0;
				3506
				3507	hash = jhash_1word(attrs->nice, hash);
				3508	hash = jhash_bitmap(cpumask_bits(attrs->cpumask), nr_cpu_ids, hash);
				3509	return hash;
				3510	}
				3511
				3512	/* content equality test */
				3513	static bool wqattrs_equal(const struct workqueue_attrs *a,
				3514	const struct workqueue_attrs *b)
				3515	{
				3516	if (a->nice != b->nice)
				3517	return false;
				3518	if (!cpumask_equal(a->cpumask, b->cpumask))
				3519	return false;
				3520	return true;
				3521	}
				3522
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3523	/**
				3524	* init_worker_pool - initialize a newly zalloc'd worker_pool
				3525	* @pool: worker_pool to initialize
				3526	*
				3527	* Initiailize a newly zalloc'd @pool. It also allocates @pool->attrs.
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3528	* Returns 0 on success, -errno on failure. Even on failure, all fields
				3529	* inside @pool proper are initialized and put_unbound_pool() can be called
				3530	* on @pool safely to release it.
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3531	*/
				3532	static int init_worker_pool(struct worker_pool *pool)
Tejun Heo	4e1a1f9	2013-03-12 11:30:00 -0700	[diff] [blame]	3533	{
				3534	spin_lock_init(&pool->lock);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3535	pool->id = -1;
				3536	pool->cpu = -1;
Tejun Heo	4e1a1f9	2013-03-12 11:30:00 -0700	[diff] [blame]	3537	pool->flags \|= POOL_DISASSOCIATED;
				3538	INIT_LIST_HEAD(&pool->worklist);
				3539	INIT_LIST_HEAD(&pool->idle_list);
				3540	hash_init(pool->busy_hash);
				3541
				3542	init_timer_deferrable(&pool->idle_timer);
				3543	pool->idle_timer.function = idle_worker_timeout;
				3544	pool->idle_timer.data = (unsigned long)pool;
				3545
				3546	setup_timer(&pool->mayday_timer, pool_mayday_timeout,
				3547	(unsigned long)pool);
				3548
				3549	mutex_init(&pool->manager_arb);
				3550	mutex_init(&pool->assoc_mutex);
				3551	ida_init(&pool->worker_ida);
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3552
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3553	INIT_HLIST_NODE(&pool->hash_node);
				3554	pool->refcnt = 1;
				3555
				3556	/* shouldn't fail above this point */
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3557	pool->attrs = alloc_workqueue_attrs(GFP_KERNEL);
				3558	if (!pool->attrs)
				3559	return -ENOMEM;
				3560	return 0;
Tejun Heo	4e1a1f9	2013-03-12 11:30:00 -0700	[diff] [blame]	3561	}
				3562
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3563	static void rcu_free_pool(struct rcu_head *rcu)
				3564	{
				3565	struct worker_pool *pool = container_of(rcu, struct worker_pool, rcu);
				3566
				3567	ida_destroy(&pool->worker_ida);
				3568	free_workqueue_attrs(pool->attrs);
				3569	kfree(pool);
				3570	}
				3571
				3572	/**
				3573	* put_unbound_pool - put a worker_pool
				3574	* @pool: worker_pool to put
				3575	*
				3576	* Put @pool. If its refcnt reaches zero, it gets destroyed in sched-RCU
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	3577	* safe manner. get_unbound_pool() calls this function on its failure path
				3578	* and this function should be able to release pools which went through,
				3579	* successfully or not, init_worker_pool().
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3580	*/
				3581	static void put_unbound_pool(struct worker_pool *pool)
				3582	{
				3583	struct worker *worker;
				3584
				3585	spin_lock_irq(&workqueue_lock);
				3586	if (--pool->refcnt) {
				3587	spin_unlock_irq(&workqueue_lock);
				3588	return;
				3589	}
				3590
				3591	/* sanity checks */
				3592	if (WARN_ON(!(pool->flags & POOL_DISASSOCIATED)) \|\|
				3593	WARN_ON(!list_empty(&pool->worklist))) {
				3594	spin_unlock_irq(&workqueue_lock);
				3595	return;
				3596	}
				3597
				3598	/* release id and unhash */
				3599	if (pool->id >= 0)
				3600	idr_remove(&worker_pool_idr, pool->id);
				3601	hash_del(&pool->hash_node);
				3602
				3603	spin_unlock_irq(&workqueue_lock);
				3604
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	3605	/*
				3606	* Become the manager and destroy all workers. Grabbing
				3607	* manager_arb prevents @pool's workers from blocking on
				3608	* manager_mutex.
				3609	*/
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3610	mutex_lock(&pool->manager_arb);
				3611	spin_lock_irq(&pool->lock);
				3612
				3613	while ((worker = first_worker(pool)))
				3614	destroy_worker(worker);
				3615	WARN_ON(pool->nr_workers \|\| pool->nr_idle);
				3616
				3617	spin_unlock_irq(&pool->lock);
				3618	mutex_unlock(&pool->manager_arb);
				3619
				3620	/* shut down the timers */
				3621	del_timer_sync(&pool->idle_timer);
				3622	del_timer_sync(&pool->mayday_timer);
				3623
				3624	/* sched-RCU protected to allow dereferences from get_work_pool() */
				3625	call_rcu_sched(&pool->rcu, rcu_free_pool);
				3626	}
				3627
				3628	/**
				3629	* get_unbound_pool - get a worker_pool with the specified attributes
				3630	* @attrs: the attributes of the worker_pool to get
				3631	*
				3632	* Obtain a worker_pool which has the same attributes as @attrs, bump the
				3633	* reference count and return it. If there already is a matching
				3634	* worker_pool, it will be used; otherwise, this function attempts to
				3635	* create a new one. On failure, returns NULL.
				3636	*/
				3637	static struct worker_pool get_unbound_pool(const struct workqueue_attrs attrs)
				3638	{
				3639	static DEFINE_MUTEX(create_mutex);
				3640	u32 hash = wqattrs_hash(attrs);
				3641	struct worker_pool *pool;
				3642	struct worker *worker;
				3643
				3644	mutex_lock(&create_mutex);
				3645
				3646	/* do we already have a matching pool? */
				3647	spin_lock_irq(&workqueue_lock);
				3648	hash_for_each_possible(unbound_pool_hash, pool, hash_node, hash) {
				3649	if (wqattrs_equal(pool->attrs, attrs)) {
				3650	pool->refcnt++;
				3651	goto out_unlock;
				3652	}
				3653	}
				3654	spin_unlock_irq(&workqueue_lock);
				3655
				3656	/* nope, create a new one */
				3657	pool = kzalloc(sizeof(*pool), GFP_KERNEL);
				3658	if (!pool \|\| init_worker_pool(pool) < 0)
				3659	goto fail;
				3660
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3661	lockdep_set_subclass(&pool->lock, 1); /* see put_pwq() */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3662	copy_workqueue_attrs(pool->attrs, attrs);
				3663
				3664	if (worker_pool_assign_id(pool) < 0)
				3665	goto fail;
				3666
				3667	/* create and start the initial worker */
				3668	worker = create_worker(pool);
				3669	if (!worker)
				3670	goto fail;
				3671
				3672	spin_lock_irq(&pool->lock);
				3673	start_worker(worker);
				3674	spin_unlock_irq(&pool->lock);
				3675
				3676	/* install */
				3677	spin_lock_irq(&workqueue_lock);
				3678	hash_add(unbound_pool_hash, &pool->hash_node, hash);
				3679	out_unlock:
				3680	spin_unlock_irq(&workqueue_lock);
				3681	mutex_unlock(&create_mutex);
				3682	return pool;
				3683	fail:
				3684	mutex_unlock(&create_mutex);
				3685	if (pool)
				3686	put_unbound_pool(pool);
				3687	return NULL;
				3688	}
				3689
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3690	static void rcu_free_pwq(struct rcu_head *rcu)
				3691	{
				3692	kmem_cache_free(pwq_cache,
				3693	container_of(rcu, struct pool_workqueue, rcu));
				3694	}
				3695
				3696	/*
				3697	* Scheduled on system_wq by put_pwq() when an unbound pwq hits zero refcnt
				3698	* and needs to be destroyed.
				3699	*/
				3700	static void pwq_unbound_release_workfn(struct work_struct *work)
				3701	{
				3702	struct pool_workqueue *pwq = container_of(work, struct pool_workqueue,
				3703	unbound_release_work);
				3704	struct workqueue_struct *wq = pwq->wq;
				3705	struct worker_pool *pool = pwq->pool;
				3706
				3707	if (WARN_ON_ONCE(!(wq->flags & WQ_UNBOUND)))
				3708	return;
				3709
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3710	/*
				3711	* Unlink @pwq. Synchronization against flush_mutex isn't strictly
				3712	* necessary on release but do it anyway. It's easier to verify
				3713	* and consistent with the linking path.
				3714	*/
				3715	mutex_lock(&wq->flush_mutex);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3716	spin_lock_irq(&workqueue_lock);
				3717	list_del_rcu(&pwq->pwqs_node);
				3718	spin_unlock_irq(&workqueue_lock);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3719	mutex_unlock(&wq->flush_mutex);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3720
				3721	put_unbound_pool(pool);
				3722	call_rcu_sched(&pwq->rcu, rcu_free_pwq);
				3723
				3724	/*
				3725	* If we're the last pwq going away, @wq is already dead and no one
				3726	* is gonna access it anymore. Free it.
				3727	*/
				3728	if (list_empty(&wq->pwqs))
				3729	kfree(wq);
				3730	}
				3731
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3732	/**
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3733	* pwq_adjust_max_active - update a pwq's max_active to the current setting
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3734	* @pwq: target pool_workqueue
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3735	*
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3736	* If @pwq isn't freezing, set @pwq->max_active to the associated
				3737	* workqueue's saved_max_active and activate delayed work items
				3738	* accordingly. If @pwq is freezing, clear @pwq->max_active to zero.
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3739	*/
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3740	static void pwq_adjust_max_active(struct pool_workqueue *pwq)
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3741	{
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3742	struct workqueue_struct *wq = pwq->wq;
				3743	bool freezable = wq->flags & WQ_FREEZABLE;
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3744
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3745	/* for @wq->saved_max_active */
				3746	lockdep_assert_held(&workqueue_lock);
				3747
				3748	/* fast exit for non-freezable wqs */
				3749	if (!freezable && pwq->max_active == wq->saved_max_active)
				3750	return;
				3751
				3752	spin_lock(&pwq->pool->lock);
				3753
				3754	if (!freezable \|\| !(pwq->pool->flags & POOL_FREEZING)) {
				3755	pwq->max_active = wq->saved_max_active;
				3756
				3757	while (!list_empty(&pwq->delayed_works) &&
				3758	pwq->nr_active < pwq->max_active)
				3759	pwq_activate_first_delayed(pwq);
				3760	} else {
				3761	pwq->max_active = 0;
				3762	}
				3763
				3764	spin_unlock(&pwq->pool->lock);
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3765	}
				3766
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3767	static void init_and_link_pwq(struct pool_workqueue *pwq,
				3768	struct workqueue_struct *wq,
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3769	struct worker_pool *pool,
				3770	struct pool_workqueue **p_last_pwq)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3771	{
				3772	BUG_ON((unsigned long)pwq & WORK_STRUCT_FLAG_MASK);
				3773
				3774	pwq->pool = pool;
				3775	pwq->wq = wq;
				3776	pwq->flush_color = -1;
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3777	pwq->refcnt = 1;
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3778	INIT_LIST_HEAD(&pwq->delayed_works);
				3779	INIT_LIST_HEAD(&pwq->mayday_node);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3780	INIT_WORK(&pwq->unbound_release_work, pwq_unbound_release_workfn);
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3781
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3782	mutex_lock(&wq->flush_mutex);
				3783	spin_lock_irq(&workqueue_lock);
				3784
Tejun Heo	983ca25	2013-03-13 16:51:35 -0700	[diff] [blame]	3785	/*
				3786	* Set the matching work_color. This is synchronized with
				3787	* flush_mutex to avoid confusing flush_workqueue().
				3788	*/
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3789	if (p_last_pwq)
				3790	*p_last_pwq = first_pwq(wq);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3791	pwq->work_color = wq->work_color;
Tejun Heo	983ca25	2013-03-13 16:51:35 -0700	[diff] [blame]	3792
				3793	/* sync max_active to the current setting */
				3794	pwq_adjust_max_active(pwq);
				3795
				3796	/* link in @pwq */
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3797	list_add_rcu(&pwq->pwqs_node, &wq->pwqs);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3798
				3799	spin_unlock_irq(&workqueue_lock);
				3800	mutex_unlock(&wq->flush_mutex);
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3801	}
				3802
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3803	/**
				3804	* apply_workqueue_attrs - apply new workqueue_attrs to an unbound workqueue
				3805	* @wq: the target workqueue
				3806	* @attrs: the workqueue_attrs to apply, allocated with alloc_workqueue_attrs()
				3807	*
				3808	* Apply @attrs to an unbound workqueue @wq. If @attrs doesn't match the
				3809	* current attributes, a new pwq is created and made the first pwq which
				3810	* will serve all new work items. Older pwqs are released as in-flight
				3811	* work items finish. Note that a work item which repeatedly requeues
				3812	* itself back-to-back will stay on its current pwq.
				3813	*
				3814	* Performs GFP_KERNEL allocations. Returns 0 on success and -errno on
				3815	* failure.
				3816	*/
				3817	int apply_workqueue_attrs(struct workqueue_struct *wq,
				3818	const struct workqueue_attrs *attrs)
				3819	{
				3820	struct pool_workqueue pwq, last_pwq;
				3821	struct worker_pool *pool;
				3822
Tejun Heo	8719dce	2013-03-12 11:30:04 -0700	[diff] [blame]	3823	/* only unbound workqueues can change attributes */
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3824	if (WARN_ON(!(wq->flags & WQ_UNBOUND)))
				3825	return -EINVAL;
				3826
Tejun Heo	8719dce	2013-03-12 11:30:04 -0700	[diff] [blame]	3827	/* creating multiple pwqs breaks ordering guarantee */
				3828	if (WARN_ON((wq->flags & __WQ_ORDERED) && !list_empty(&wq->pwqs)))
				3829	return -EINVAL;
				3830
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3831	pwq = kmem_cache_zalloc(pwq_cache, GFP_KERNEL);
				3832	if (!pwq)
				3833	return -ENOMEM;
				3834
				3835	pool = get_unbound_pool(attrs);
				3836	if (!pool) {
				3837	kmem_cache_free(pwq_cache, pwq);
				3838	return -ENOMEM;
				3839	}
				3840
				3841	init_and_link_pwq(pwq, wq, pool, &last_pwq);
				3842	if (last_pwq) {
				3843	spin_lock_irq(&last_pwq->pool->lock);
				3844	put_pwq(last_pwq);
				3845	spin_unlock_irq(&last_pwq->pool->lock);
				3846	}
				3847
				3848	return 0;
				3849	}
				3850
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3851	static int alloc_and_link_pwqs(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3852	{
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3853	bool highpri = wq->flags & WQ_HIGHPRI;
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3854	int cpu;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	3855
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3856	if (!(wq->flags & WQ_UNBOUND)) {
Tejun Heo	420c0dd	2013-03-12 11:29:59 -0700	[diff] [blame]	3857	wq->cpu_pwqs = alloc_percpu(struct pool_workqueue);
				3858	if (!wq->cpu_pwqs)
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3859	return -ENOMEM;
				3860
				3861	for_each_possible_cpu(cpu) {
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	3862	struct pool_workqueue *pwq =
				3863	per_cpu_ptr(wq->cpu_pwqs, cpu);
Tejun Heo	7a62c2c	2013-03-12 11:30:03 -0700	[diff] [blame]	3864	struct worker_pool *cpu_pools =
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	3865	per_cpu(cpu_worker_pools, cpu);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3866
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3867	init_and_link_pwq(pwq, wq, &cpu_pools[highpri], NULL);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3868	}
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3869	return 0;
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3870	} else {
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3871	return apply_workqueue_attrs(wq, unbound_std_wq_attrs[highpri]);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3872	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3873	}
				3874
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3875	static int wq_clamp_max_active(int max_active, unsigned int flags,
				3876	const char *name)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3877	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3878	int lim = flags & WQ_UNBOUND ? WQ_UNBOUND_MAX_ACTIVE : WQ_MAX_ACTIVE;
				3879
				3880	if (max_active < 1 \|\| max_active > lim)
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	3881	pr_warn("workqueue: max_active %d requested for %s is out of range, clamping between %d and %d\n",
				3882	max_active, name, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3883
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3884	return clamp_val(max_active, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3885	}
				3886
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3887	struct workqueue_struct __alloc_workqueue_key(const char fmt,
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3888	unsigned int flags,
				3889	int max_active,
				3890	struct lock_class_key *key,
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3891	const char *lock_name, ...)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3892	{
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3893	va_list args, args1;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3894	struct workqueue_struct *wq;
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3895	struct pool_workqueue *pwq;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3896	size_t namelen;
				3897
				3898	/* determine namelen, allocate wq and format name */
				3899	va_start(args, lock_name);
				3900	va_copy(args1, args);
				3901	namelen = vsnprintf(NULL, 0, fmt, args) + 1;
				3902
				3903	wq = kzalloc(sizeof(*wq) + namelen, GFP_KERNEL);
				3904	if (!wq)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3905	return NULL;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3906
				3907	vsnprintf(wq->name, namelen, fmt, args1);
				3908	va_end(args);
				3909	va_end(args1);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3910
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3911	max_active = max_active ?: WQ_DFL_ACTIVE;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3912	max_active = wq_clamp_max_active(max_active, flags, wq->name);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3913
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3914	/* init wq */
Tejun Heo	97e37d7	2010-06-29 10:07:10 +0200	[diff] [blame]	3915	wq->flags = flags;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3916	wq->saved_max_active = max_active;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3917	mutex_init(&wq->flush_mutex);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	3918	atomic_set(&wq->nr_pwqs_to_flush, 0);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3919	INIT_LIST_HEAD(&wq->pwqs);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3920	INIT_LIST_HEAD(&wq->flusher_queue);
				3921	INIT_LIST_HEAD(&wq->flusher_overflow);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	3922	INIT_LIST_HEAD(&wq->maydays);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3923
Johannes Berg	eb13ba8	2008-01-16 09:51:58 +0100	[diff] [blame]	3924	lockdep_init_map(&wq->lockdep_map, lock_name, key, 0);
Oleg Nesterov	cce1a16	2007-05-09 02:34:13 -0700	[diff] [blame]	3925	INIT_LIST_HEAD(&wq->list);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3926
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3927	if (alloc_and_link_pwqs(wq) < 0)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3928	goto err_free_wq;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3929
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	3930	/*
				3931	* Workqueues which may be used during memory reclaim should
				3932	* have a rescuer to guarantee forward progress.
				3933	*/
				3934	if (flags & WQ_MEM_RECLAIM) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3935	struct worker *rescuer;
				3936
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3937	rescuer = alloc_worker();
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3938	if (!rescuer)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3939	goto err_destroy;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3940
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	3941	rescuer->rescue_wq = wq;
				3942	rescuer->task = kthread_create(rescuer_thread, rescuer, "%s",
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3943	wq->name);
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3944	if (IS_ERR(rescuer->task)) {
				3945	kfree(rescuer);
				3946	goto err_destroy;
				3947	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3948
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3949	wq->rescuer = rescuer;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3950	rescuer->task->flags \|= PF_THREAD_BOUND;
				3951	wake_up_process(rescuer->task);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3952	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3953
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	3954	if ((wq->flags & WQ_SYSFS) && workqueue_sysfs_register(wq))
				3955	goto err_destroy;
				3956
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3957	/*
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3958	* workqueue_lock protects global freeze state and workqueues list.
				3959	* Grab it, adjust max_active and add the new workqueue to
				3960	* workqueues list.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3961	*/
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	3962	spin_lock_irq(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3963
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3964	for_each_pwq(pwq, wq)
				3965	pwq_adjust_max_active(pwq);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3966
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3967	list_add(&wq->list, &workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3968
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	3969	spin_unlock_irq(&workqueue_lock);
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3970
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3971	return wq;
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3972
				3973	err_free_wq:
				3974	kfree(wq);
				3975	return NULL;
				3976	err_destroy:
				3977	destroy_workqueue(wq);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3978	return NULL;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3979	}
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3980	EXPORT_SYMBOL_GPL(__alloc_workqueue_key);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3981
				3982	/**
				3983	* destroy_workqueue - safely terminate a workqueue
				3984	* @wq: target workqueue
				3985	*
				3986	* Safely destroy a workqueue. All work currently pending will be done first.
				3987	*/
				3988	void destroy_workqueue(struct workqueue_struct *wq)
				3989	{
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3990	struct pool_workqueue *pwq;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3991
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	3992	/* drain it before proceeding with destruction */
				3993	drain_workqueue(wq);
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	3994
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	3995	spin_lock_irq(&workqueue_lock);
				3996
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3997	/* sanity checks */
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3998	for_each_pwq(pwq, wq) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3999	int i;
				4000
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4001	for (i = 0; i < WORK_NR_COLORS; i++) {
				4002	if (WARN_ON(pwq->nr_in_flight[i])) {
				4003	spin_unlock_irq(&workqueue_lock);
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4004	return;
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4005	}
				4006	}
				4007
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	4008	if (WARN_ON(pwq->refcnt > 1) \|\|
				4009	WARN_ON(pwq->nr_active) \|\|
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4010	WARN_ON(!list_empty(&pwq->delayed_works))) {
				4011	spin_unlock_irq(&workqueue_lock);
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4012	return;
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4013	}
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4014	}
				4015
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4016	/*
				4017	* wq list is used to freeze wq, remove from list after
				4018	* flushing is complete in case freeze races us.
				4019	*/
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	4020	list_del_init(&wq->list);
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4021
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4022	spin_unlock_irq(&workqueue_lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	4023
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	4024	workqueue_sysfs_unregister(wq);
				4025
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	4026	if (wq->rescuer) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4027	kthread_stop(wq->rescuer->task);
Xiaotian Feng	8d9df9f	2010-08-16 09:54:28 +0200	[diff] [blame]	4028	kfree(wq->rescuer);
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	4029	wq->rescuer = NULL;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4030	}
				4031
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	4032	if (!(wq->flags & WQ_UNBOUND)) {
				4033	/*
				4034	* The base ref is never dropped on per-cpu pwqs. Directly
				4035	* free the pwqs and wq.
				4036	*/
				4037	free_percpu(wq->cpu_pwqs);
				4038	kfree(wq);
				4039	} else {
				4040	/*
				4041	* We're the sole accessor of @wq at this point. Directly
				4042	* access the first pwq and put the base ref. As both pwqs
				4043	* and pools are sched-RCU protected, the lock operations
				4044	* are safe. @wq will be freed when the last pwq is
				4045	* released.
				4046	*/
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4047	pwq = list_first_entry(&wq->pwqs, struct pool_workqueue,
				4048	pwqs_node);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	4049	spin_lock_irq(&pwq->pool->lock);
				4050	put_pwq(pwq);
				4051	spin_unlock_irq(&pwq->pool->lock);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4052	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	4053	}
				4054	EXPORT_SYMBOL_GPL(destroy_workqueue);
				4055
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4056	/**
				4057	* workqueue_set_max_active - adjust max_active of a workqueue
				4058	* @wq: target workqueue
				4059	* @max_active: new max_active value.
				4060	*
				4061	* Set max_active of @wq to @max_active.
				4062	*
				4063	* CONTEXT:
				4064	* Don't call from IRQ context.
				4065	*/
				4066	void workqueue_set_max_active(struct workqueue_struct *wq, int max_active)
				4067	{
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	4068	struct pool_workqueue *pwq;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4069
Tejun Heo	8719dce	2013-03-12 11:30:04 -0700	[diff] [blame]	4070	/* disallow meddling with max_active for ordered workqueues */
				4071	if (WARN_ON(wq->flags & __WQ_ORDERED))
				4072	return;
				4073
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	4074	max_active = wq_clamp_max_active(max_active, wq->flags, wq->name);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4075
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4076	spin_lock_irq(&workqueue_lock);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4077
				4078	wq->saved_max_active = max_active;
				4079
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	4080	for_each_pwq(pwq, wq)
				4081	pwq_adjust_max_active(pwq);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4082
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4083	spin_unlock_irq(&workqueue_lock);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4084	}
				4085	EXPORT_SYMBOL_GPL(workqueue_set_max_active);
				4086
				4087	/**
Tejun Heo	e626761	2013-03-12 17:41:37 -0700	[diff] [blame]	4088	* current_is_workqueue_rescuer - is %current workqueue rescuer?
				4089	*
				4090	* Determine whether %current is a workqueue rescuer. Can be used from
				4091	* work functions to determine whether it's being run off the rescuer task.
				4092	*/
				4093	bool current_is_workqueue_rescuer(void)
				4094	{
				4095	struct worker *worker = current_wq_worker();
				4096
				4097	return worker && worker == worker->current_pwq->wq->rescuer;
				4098	}
				4099
				4100	/**
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4101	* workqueue_congested - test whether a workqueue is congested
				4102	* @cpu: CPU in question
				4103	* @wq: target workqueue
				4104	*
				4105	* Test whether @wq's cpu workqueue for @cpu is congested. There is
				4106	* no synchronization around this function and the test result is
				4107	* unreliable and only useful as advisory hints or for debugging.
				4108	*
				4109	* RETURNS:
				4110	* %true if congested, %false otherwise.
				4111	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4112	bool workqueue_congested(int cpu, struct workqueue_struct *wq)
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4113	{
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	4114	struct pool_workqueue *pwq;
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4115	bool ret;
				4116
				4117	preempt_disable();
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	4118
				4119	if (!(wq->flags & WQ_UNBOUND))
				4120	pwq = per_cpu_ptr(wq->cpu_pwqs, cpu);
				4121	else
				4122	pwq = first_pwq(wq);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4123
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4124	ret = !list_empty(&pwq->delayed_works);
				4125	preempt_enable();
				4126
				4127	return ret;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4128	}
				4129	EXPORT_SYMBOL_GPL(workqueue_congested);
				4130
				4131	/**
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4132	* work_busy - test whether a work is currently pending or running
				4133	* @work: the work to be tested
				4134	*
				4135	* Test whether @work is currently pending or running. There is no
				4136	* synchronization around this function and the test result is
				4137	* unreliable and only useful as advisory hints or for debugging.
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4138	*
				4139	* RETURNS:
				4140	* OR'd bitmask of WORK_BUSY_* bits.
				4141	*/
				4142	unsigned int work_busy(struct work_struct *work)
				4143	{
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4144	struct worker_pool *pool;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4145	unsigned long flags;
				4146	unsigned int ret = 0;
				4147
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4148	if (work_pending(work))
				4149	ret \|= WORK_BUSY_PENDING;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4150
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4151	local_irq_save(flags);
				4152	pool = get_work_pool(work);
Lai Jiangshan	038366c	2013-02-06 18:04:53 -0800	[diff] [blame]	4153	if (pool) {
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4154	spin_lock(&pool->lock);
Lai Jiangshan	038366c	2013-02-06 18:04:53 -0800	[diff] [blame]	4155	if (find_worker_executing_work(pool, work))
				4156	ret \|= WORK_BUSY_RUNNING;
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4157	spin_unlock(&pool->lock);
Lai Jiangshan	038366c	2013-02-06 18:04:53 -0800	[diff] [blame]	4158	}
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4159	local_irq_restore(flags);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4160
				4161	return ret;
				4162	}
				4163	EXPORT_SYMBOL_GPL(work_busy);
				4164
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4165	/*
				4166	* CPU hotplug.
				4167	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4168	* There are two challenges in supporting CPU hotplug. Firstly, there
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	4169	* are a lot of assumptions on strong associations among work, pwq and
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4170	* pool which make migrating pending and scheduled works very
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4171	* difficult to implement without impacting hot paths. Secondly,
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4172	* worker pools serve mix of short, long and very long running works making
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4173	* blocked draining impractical.
				4174	*
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	4175	* This is solved by allowing the pools to be disassociated from the CPU
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	4176	* running as an unbound one and allowing it to be reattached later if the
				4177	* cpu comes back online.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4178	*/
				4179
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4180	static void wq_unbind_fn(struct work_struct *work)
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4181	{
Tejun Heo	38db41d	2013-01-24 11:01:34 -0800	[diff] [blame]	4182	int cpu = smp_processor_id();
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4183	struct worker_pool *pool;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4184	struct worker *worker;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4185	int i;
				4186
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4187	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4188	WARN_ON_ONCE(cpu != smp_processor_id());
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4189
				4190	mutex_lock(&pool->assoc_mutex);
				4191	spin_lock_irq(&pool->lock);
				4192
				4193	/*
				4194	* We've claimed all manager positions. Make all workers
				4195	* unbound and set DISASSOCIATED. Before this, all workers
				4196	* except for the ones which are still executing works from
				4197	* before the last CPU down must be on the cpu. After
				4198	* this, they may become diasporas.
				4199	*/
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4200	list_for_each_entry(worker, &pool->idle_list, entry)
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	4201	worker->flags \|= WORKER_UNBOUND;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4202
Sasha Levin	b67bfe0	2013-02-27 17:06:00 -0800	[diff] [blame]	4203	for_each_busy_worker(worker, i, pool)
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	4204	worker->flags \|= WORKER_UNBOUND;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4205
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	4206	pool->flags \|= POOL_DISASSOCIATED;
Tejun Heo	f2d5a0e	2012-07-17 12:39:26 -0700	[diff] [blame]	4207
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4208	spin_unlock_irq(&pool->lock);
				4209	mutex_unlock(&pool->assoc_mutex);
				4210	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4211
				4212	/*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	4213	* Call schedule() so that we cross rq->lock and thus can guarantee
				4214	* sched callbacks see the %WORKER_UNBOUND flag. This is necessary
				4215	* as scheduler callbacks may be invoked from other cpus.
				4216	*/
				4217	schedule();
				4218
				4219	/*
				4220	* Sched callbacks are disabled now. Zap nr_running. After this,
				4221	* nr_running stays zero and need_more_worker() and keep_working()
Tejun Heo	38db41d	2013-01-24 11:01:34 -0800	[diff] [blame]	4222	* are always true as long as the worklist is not empty. Pools on
				4223	* @cpu now behave as unbound (in terms of concurrency management)
				4224	* pools which are served by workers tied to the CPU.
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	4225	*
				4226	* On return from this function, the current worker would trigger
				4227	* unbound chain execution of pending work items if other workers
				4228	* didn't already.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4229	*/
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4230	for_each_cpu_worker_pool(pool, cpu)
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	4231	atomic_set(&pool->nr_running, 0);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4232	}
				4233
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4234	/*
				4235	* Workqueues should be brought up before normal priority CPU notifiers.
				4236	* This will be registered high priority CPU notifier.
				4237	*/
Lai Jiangshan	9fdf9b7	2012-09-18 09:59:23 -0700	[diff] [blame]	4238	static int __cpuinit workqueue_cpu_up_callback(struct notifier_block *nfb,
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4239	unsigned long action,
				4240	void *hcpu)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	4241	{
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4242	int cpu = (unsigned long)hcpu;
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4243	struct worker_pool *pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4244
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4245	switch (action & ~CPU_TASKS_FROZEN) {
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4246	case CPU_UP_PREPARE:
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4247	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	3ce6337	2012-07-17 12:39:27 -0700	[diff] [blame]	4248	struct worker *worker;
				4249
				4250	if (pool->nr_workers)
				4251	continue;
				4252
				4253	worker = create_worker(pool);
				4254	if (!worker)
				4255	return NOTIFY_BAD;
				4256
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	4257	spin_lock_irq(&pool->lock);
Tejun Heo	3ce6337	2012-07-17 12:39:27 -0700	[diff] [blame]	4258	start_worker(worker);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	4259	spin_unlock_irq(&pool->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4260	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4261	break;
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	4262
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4263	case CPU_DOWN_FAILED:
				4264	case CPU_ONLINE:
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4265	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4266	mutex_lock(&pool->assoc_mutex);
				4267	spin_lock_irq(&pool->lock);
				4268
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	4269	pool->flags &= ~POOL_DISASSOCIATED;
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4270	rebind_workers(pool);
				4271
				4272	spin_unlock_irq(&pool->lock);
				4273	mutex_unlock(&pool->assoc_mutex);
				4274	}
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4275	break;
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4276	}
				4277	return NOTIFY_OK;
				4278	}
				4279
				4280	/*
				4281	* Workqueues should be brought down after normal priority CPU notifiers.
				4282	* This will be registered as low priority CPU notifier.
				4283	*/
Lai Jiangshan	9fdf9b7	2012-09-18 09:59:23 -0700	[diff] [blame]	4284	static int __cpuinit workqueue_cpu_down_callback(struct notifier_block *nfb,
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4285	unsigned long action,
				4286	void *hcpu)
				4287	{
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4288	int cpu = (unsigned long)hcpu;
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4289	struct work_struct unbind_work;
				4290
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4291	switch (action & ~CPU_TASKS_FROZEN) {
				4292	case CPU_DOWN_PREPARE:
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4293	/* unbinding should happen on the local CPU */
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4294	INIT_WORK_ONSTACK(&unbind_work, wq_unbind_fn);
Joonsoo Kim	7635d2f	2012-08-15 23:25:41 +0900	[diff] [blame]	4295	queue_work_on(cpu, system_highpri_wq, &unbind_work);
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4296	flush_work(&unbind_work);
				4297	break;
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4298	}
				4299	return NOTIFY_OK;
				4300	}
				4301
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4302	#ifdef CONFIG_SMP
Rusty Russell	8ccad40	2009-01-16 15:31:15 -0800	[diff] [blame]	4303
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4304	struct work_for_cpu {
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4305	struct work_struct work;
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4306	long (fn)(void );
				4307	void *arg;
				4308	long ret;
				4309	};
				4310
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4311	static void work_for_cpu_fn(struct work_struct *work)
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4312	{
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4313	struct work_for_cpu *wfc = container_of(work, struct work_for_cpu, work);
				4314
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4315	wfc->ret = wfc->fn(wfc->arg);
				4316	}
				4317
				4318	/**
				4319	* work_on_cpu - run a function in user context on a particular cpu
				4320	* @cpu: the cpu to run on
				4321	* @fn: the function to run
				4322	* @arg: the function arg
				4323	*
Rusty Russell	31ad908	2009-01-16 15:31:15 -0800	[diff] [blame]	4324	* This will return the value @fn returns.
				4325	* It is up to the caller to ensure that the cpu doesn't go offline.
Andrew Morton	6b44003	2009-04-09 09:50:37 -0600	[diff] [blame]	4326	* The caller must not hold any locks which would prevent @fn from completing.
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4327	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4328	long work_on_cpu(int cpu, long (fn)(void ), void *arg)
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4329	{
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4330	struct work_for_cpu wfc = { .fn = fn, .arg = arg };
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4331
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4332	INIT_WORK_ONSTACK(&wfc.work, work_for_cpu_fn);
				4333	schedule_work_on(cpu, &wfc.work);
				4334	flush_work(&wfc.work);
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4335	return wfc.ret;
				4336	}
				4337	EXPORT_SYMBOL_GPL(work_on_cpu);
				4338	#endif /* CONFIG_SMP */
				4339
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4340	#ifdef CONFIG_FREEZER
Rusty Russell	e7577c5	2009-01-01 10:12:25 +1030	[diff] [blame]	4341
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4342	/**
				4343	* freeze_workqueues_begin - begin freezing workqueues
				4344	*
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	4345	* Start freezing workqueues. After this function returns, all freezable
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	4346	* workqueues will queue new works to their delayed_works list instead of
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4347	* pool->worklist.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4348	*
				4349	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	4350	* Grabs and releases workqueue_lock and pool->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4351	*/
				4352	void freeze_workqueues_begin(void)
				4353	{
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	4354	struct worker_pool *pool;
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4355	struct workqueue_struct *wq;
				4356	struct pool_workqueue *pwq;
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame^]	4357	int pi;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4358
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4359	spin_lock_irq(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4360
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4361	WARN_ON_ONCE(workqueue_freezing);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4362	workqueue_freezing = true;
				4363
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4364	/* set FREEZING */
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame^]	4365	for_each_pool(pool, pi) {
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	4366	spin_lock(&pool->lock);
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	4367	WARN_ON_ONCE(pool->flags & POOL_FREEZING);
				4368	pool->flags |= POOL_FREEZING;
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	4369	spin_unlock(&pool->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4370	}
				4371
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4372	/* suppress further executions by setting max_active to zero */
				4373	list_for_each_entry(wq, &workqueues, list) {
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	4374	for_each_pwq(pwq, wq)
				4375	pwq_adjust_max_active(pwq);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4376	}
				4377
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4378	spin_unlock_irq(&workqueue_lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4379	}
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4380
				4381	/**
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	4382	* freeze_workqueues_busy - are freezable workqueues still busy?
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4383	*
				4384	* Check whether freezing is complete. This function must be called
				4385	* between freeze_workqueues_begin() and thaw_workqueues().
				4386	*
				4387	* CONTEXT:
				4388	* Grabs and releases workqueue_lock.
				4389	*
				4390	* RETURNS:
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	4391	* %true if some freezable workqueues are still busy. %false if freezing
				4392	* is complete.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4393	*/
				4394	bool freeze_workqueues_busy(void)
				4395	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4396	bool busy = false;
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4397	struct workqueue_struct *wq;
				4398	struct pool_workqueue *pwq;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4399
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4400	spin_lock_irq(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4401
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4402	WARN_ON_ONCE(!workqueue_freezing);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4403
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4404	list_for_each_entry(wq, &workqueues, list) {
				4405	if (!(wq->flags & WQ_FREEZABLE))
				4406	continue;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4407	/*
				4408	* nr_active is monotonically decreasing. It's safe
				4409	* to peek without lock.
				4410	*/
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4411	for_each_pwq(pwq, wq) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4412	WARN_ON_ONCE(pwq->nr_active < 0);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	4413	if (pwq->nr_active) {
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4414	busy = true;
				4415	goto out_unlock;
				4416	}
				4417	}
				4418	}
				4419	out_unlock:
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4420	spin_unlock_irq(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4421	return busy;
				4422	}
				4423
				4424	/**
				4425	* thaw_workqueues - thaw workqueues
				4426	*
				4427	* Thaw workqueues. Normal queueing is restored and all collected
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4428	* frozen works are transferred to their respective pool worklists.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4429	*
				4430	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	4431	* Grabs and releases workqueue_lock and pool->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4432	*/
				4433	void thaw_workqueues(void)
				4434	{
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4435	struct workqueue_struct *wq;
				4436	struct pool_workqueue *pwq;
				4437	struct worker_pool *pool;
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame^]	4438	int pi;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4439
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4440	spin_lock_irq(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4441
				4442	if (!workqueue_freezing)
				4443	goto out_unlock;
				4444
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4445	/* clear FREEZING */
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame^]	4446	for_each_pool(pool, pi) {
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4447	spin_lock(&pool->lock);
				4448	WARN_ON_ONCE(!(pool->flags & POOL_FREEZING));
				4449	pool->flags &= ~POOL_FREEZING;
				4450	spin_unlock(&pool->lock);
				4451	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4452
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4453	/* restore max_active and repopulate worklist */
				4454	list_for_each_entry(wq, &workqueues, list) {
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	4455	for_each_pwq(pwq, wq)
				4456	pwq_adjust_max_active(pwq);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4457	}
				4458
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4459	/* kick workers */
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame^]	4460	for_each_pool(pool, pi) {
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4461	spin_lock(&pool->lock);
				4462	wake_up_worker(pool);
				4463	spin_unlock(&pool->lock);
				4464	}
				4465
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4466	workqueue_freezing = false;
				4467	out_unlock:
Tejun Heo	e98d5b1	2013-03-12 11:29:57 -0700	[diff] [blame]	4468	spin_unlock_irq(&workqueue_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4469	}
				4470	#endif /* CONFIG_FREEZER */
				4471
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	4472	static int __init init_workqueues(void)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4473	{
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4474	int std_nice[NR_STD_WORKER_POOLS] = { 0, HIGHPRI_NICE_LEVEL };
				4475	int i, cpu;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	4476
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	4477	/* make sure we have enough bits for OFFQ pool ID */
				4478	BUILD_BUG_ON((1LU << (BITS_PER_LONG - WORK_OFFQ_POOL_SHIFT)) <
Lai Jiangshan	6be1958	2013-02-06 18:04:53 -0800	[diff] [blame]	4479	WORK_CPU_END * NR_STD_WORKER_POOLS);
Tejun Heo	b549007	2012-08-03 10:30:46 -0700	[diff] [blame]	4480
Tejun Heo	e904e6c	2013-03-12 11:29:57 -0700	[diff] [blame]	4481	WARN_ON(__alignof__(struct pool_workqueue) < __alignof__(long long));
				4482
				4483	pwq_cache = KMEM_CACHE(pool_workqueue, SLAB_PANIC);
				4484
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4485	cpu_notifier(workqueue_cpu_up_callback, CPU_PRI_WORKQUEUE_UP);
Lai Jiangshan	a5b4e57	2012-09-18 09:59:23 -0700	[diff] [blame]	4486	hotcpu_notifier(workqueue_cpu_down_callback, CPU_PRI_WORKQUEUE_DOWN);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4487
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4488	/* initialize CPU pools */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4489	for_each_possible_cpu(cpu) {
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4490	struct worker_pool *pool;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4491
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4492	i = 0;
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4493	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4494	BUG_ON(init_worker_pool(pool));
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	4495	pool->cpu = cpu;
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4496	cpumask_copy(pool->attrs->cpumask, cpumask_of(cpu));
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4497	pool->attrs->nice = std_nice[i++];
				4498
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	4499	/* alloc pool ID */
				4500	BUG_ON(worker_pool_assign_id(pool));
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4501	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4502	}
				4503
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4504	/* create the initial worker */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4505	for_each_online_cpu(cpu) {
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4506	struct worker_pool *pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4507
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4508	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4509	struct worker *worker;
				4510
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4511	pool->flags &= ~POOL_DISASSOCIATED;
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	4512
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	4513	worker = create_worker(pool);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4514	BUG_ON(!worker);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	4515	spin_lock_irq(&pool->lock);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4516	start_worker(worker);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	4517	spin_unlock_irq(&pool->lock);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4518	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4519	}
				4520
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4521	/* create default unbound wq attrs */
				4522	for (i = 0; i < NR_STD_WORKER_POOLS; i++) {
				4523	struct workqueue_attrs *attrs;
				4524
				4525	BUG_ON(!(attrs = alloc_workqueue_attrs(GFP_KERNEL)));
				4526
				4527	attrs->nice = std_nice[i];
				4528	cpumask_setall(attrs->cpumask);
				4529
				4530	unbound_std_wq_attrs[i] = attrs;
				4531	}
				4532
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	4533	system_wq = alloc_workqueue("events", 0, 0);
Joonsoo Kim	1aabe90	2012-08-15 23:25:39 +0900	[diff] [blame]	4534	system_highpri_wq = alloc_workqueue("events_highpri", WQ_HIGHPRI, 0);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	4535	system_long_wq = alloc_workqueue("events_long", 0, 0);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	4536	system_unbound_wq = alloc_workqueue("events_unbound", WQ_UNBOUND,
				4537	WQ_UNBOUND_MAX_ACTIVE);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	4538	system_freezable_wq = alloc_workqueue("events_freezable",
				4539	WQ_FREEZABLE, 0);
Joonsoo Kim	1aabe90	2012-08-15 23:25:39 +0900	[diff] [blame]	4540	BUG_ON(!system_wq || !system_highpri_wq || !system_long_wq ||
Tejun Heo	ae930e0	2012-08-20 14:51:23 -0700	[diff] [blame]	4541	!system_unbound_wq || !system_freezable_wq);
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	4542	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4543	}
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	4544	early_initcall(init_workqueues);