Blame - kernel/workqueue.c - linux-4.4

blob: 3e297c574be86bc32c0bd34fd6526c51a426db1c [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	2	* kernel/workqueue.c - generic async execution with shared worker pool
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	4	* Copyright (C) 2002 Ingo Molnar
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	5	*
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	6	* Derived from the taskqueue/keventd code by:
				7	* David Woodhouse <dwmw2@infradead.org>
				8	* Andrew Morton
				9	* Kai Petzke <wpp@marie.physik.tu-berlin.de>
				10	* Theodore Ts'o <tytso@mit.edu>
Christoph Lameter	89ada67	2005-10-30 15:01:59 -0800	[diff] [blame]	11	*
Christoph Lameter	cde5353	2008-07-04 09:59:22 -0700	[diff] [blame]	12	* Made to use alloc_percpu by Christoph Lameter.
Tejun Heo	c54fce6	2010-09-10 16:51:36 +0200	[diff] [blame]	13	*
				14	* Copyright (C) 2010 SUSE Linux Products GmbH
				15	* Copyright (C) 2010 Tejun Heo <tj@kernel.org>
				16	*
				17	* This is the generic async execution mechanism. Work items are
				18	* executed in process context. The worker pool is shared and
				19	* automatically managed. There is one worker pool for each CPU and
				20	* one extra for works which are better served by workers which are
				21	* not bound to any specific CPU.
				22	*
				23	* Please read Documentation/workqueue.txt for details.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	24	*/
				25
Paul Gortmaker	9984de1	2011-05-23 14:51:41 -0400	[diff] [blame]	26	#include <linux/export.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	27	#include <linux/kernel.h>
				28	#include <linux/sched.h>
				29	#include <linux/init.h>
				30	#include <linux/signal.h>
				31	#include <linux/completion.h>
				32	#include <linux/workqueue.h>
				33	#include <linux/slab.h>
				34	#include <linux/cpu.h>
				35	#include <linux/notifier.h>
				36	#include <linux/kthread.h>
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	37	#include <linux/hardirq.h>
Christoph Lameter	4693402	2006-10-11 01:21:26 -0700	[diff] [blame]	38	#include <linux/mempolicy.h>
Rafael J. Wysocki	341a595	2006-12-06 20:34:49 -0800	[diff] [blame]	39	#include <linux/freezer.h>
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	40	#include <linux/kallsyms.h>
				41	#include <linux/debug_locks.h>
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	42	#include <linux/lockdep.h>
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	43	#include <linux/idr.h>
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	44	#include <linux/jhash.h>
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	45	#include <linux/hashtable.h>
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	46	#include <linux/rculist.h>
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	47
Tejun Heo	ea13844	2013-01-18 14:05:55 -0800	[diff] [blame]	48	#include "workqueue_internal.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	49
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	50	enum {
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	51	/*
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	52	* worker_pool flags
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	53	*
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	54	* A bound pool is either associated or disassociated with its CPU.
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	55	* While associated (!DISASSOCIATED), all workers are bound to the
				56	* CPU and none has %WORKER_UNBOUND set and concurrency management
				57	* is in effect.
				58	*
				59	* While DISASSOCIATED, the cpu may be offline and all workers have
				60	* %WORKER_UNBOUND set and concurrency management disabled, and may
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	61	* be executing on any CPU. The pool behaves as an unbound one.
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	62	*
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	63	* Note that DISASSOCIATED should be flipped only while holding
				64	* manager_mutex to avoid changing binding state while
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	65	* create_worker() is in progress.
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	66	*/
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	67	POOL_MANAGE_WORKERS = 1 << 0, /* need to manage workers */
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	68	POOL_DISASSOCIATED = 1 << 2, /* cpu can't serve workers */
Tejun Heo	35b6bb6	2013-01-24 11:01:33 -0800	[diff] [blame]	69	POOL_FREEZING = 1 << 3, /* freeze in progress */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	70
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	71	/* worker flags */
				72	WORKER_STARTED = 1 << 0, /* started */
				73	WORKER_DIE = 1 << 1, /* die die die */
				74	WORKER_IDLE = 1 << 2, /* is idle */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	75	WORKER_PREP = 1 << 3, /* preparing to run works */
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	76	WORKER_CPU_INTENSIVE = 1 << 6, /* cpu intensive */
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	77	WORKER_UNBOUND = 1 << 7, /* worker is unbound */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	78
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	79	WORKER_NOT_RUNNING = WORKER_PREP | WORKER_UNBOUND |
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	80	WORKER_CPU_INTENSIVE,
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	81
Tejun Heo	e34cdddb	2013-01-24 11:01:33 -0800	[diff] [blame]	82	NR_STD_WORKER_POOLS = 2, /* # standard pools per cpu */
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	83
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	84	UNBOUND_POOL_HASH_ORDER = 6, /* hashed by pool->attrs */
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	85	BUSY_WORKER_HASH_ORDER = 6, /* 64 pointers */
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	86
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	87	MAX_IDLE_WORKERS_RATIO = 4, /* 1/4 of busy can be idle */
				88	IDLE_WORKER_TIMEOUT = 300 * HZ, /* keep idle ones for 5 mins */
				89
Tejun Heo	3233cdb	2011-02-16 18:10:19 +0100	[diff] [blame]	90	MAYDAY_INITIAL_TIMEOUT = HZ / 100 >= 2 ? HZ / 100 : 2,
				91	/* call for help after 10ms
				92	(min two ticks) */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	93	MAYDAY_INTERVAL = HZ / 10, /* and then every 100ms */
				94	CREATE_COOLDOWN = HZ, /* time to breathe after fail */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	95
				96	/*
				97	* Rescue workers are used only on emergencies and shared by
				98	* all cpus. Give -20.
				99	*/
				100	RESCUER_NICE_LEVEL = -20,
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	101	HIGHPRI_NICE_LEVEL = -20,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	102	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	103
				104	/*
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	105	* Structure fields follow one of the following exclusion rules.
				106	*
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	107	* I: Modifiable by initialization/destruction paths and read-only for
				108	* everyone else.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	109	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	110	* P: Preemption protected. Disabling preemption is enough and should
				111	* only be modified and accessed from the local cpu.
				112	*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	113	* L: pool->lock protected. Access with pool->lock held.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	114	*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	115	* X: During normal operation, modification requires pool->lock and should
				116	* be done only from local cpu. Either disabling preemption on local
				117	* cpu or grabbing pool->lock is enough for read access. If
				118	* POOL_DISASSOCIATED is set, it's identical to L.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	119	*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	120	* F: wq->flush_mutex protected.
				121	*
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	122	* MG: pool->manager_mutex and pool->lock protected. Writes require both
				123	* locks. Reads can happen under either lock.
				124	*
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	125	* WQ: wq_mutex protected.
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	126	*
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	127	* WR: wq_mutex protected for writes. Sched-RCU protected for reads.
				128	*
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	129	* PW: pwq_lock protected.
				130	*
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	131	* FR: wq->flush_mutex and pwq_lock protected for writes. Sched-RCU
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	132	* protected for reads.
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	133	*
				134	* MD: wq_mayday_lock protected.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	135	*/
				136
Tejun Heo	2eaebdb	2013-01-18 14:05:55 -0800	[diff] [blame]	137	/* struct worker is defined in workqueue_internal.h */
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	138
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	139	struct worker_pool {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	140	spinlock_t lock; /* the pool lock */
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	141	int cpu; /* I: the associated cpu */
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	142	int id; /* I: pool ID */
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	143	unsigned int flags; /* X: flags */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	144
				145	struct list_head worklist; /* L: list of pending works */
				146	int nr_workers; /* L: total number of workers */
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	147
				148	/* nr_idle includes the ones off idle_list for rebinding */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	149	int nr_idle; /* L: currently idle ones */
				150
				151	struct list_head idle_list; /* X: list of idle workers */
				152	struct timer_list idle_timer; /* L: worker idle timeout */
				153	struct timer_list mayday_timer; /* L: SOS timer for workers */
				154
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	155	/* a worker is either on busy_hash or idle_list, or the manager */
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	156	DECLARE_HASHTABLE(busy_hash, BUSY_WORKER_HASH_ORDER);
				157	/* L: hash of busy workers */
				158
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	159	/* see manage_workers() for details on the two manager mutexes */
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	160	struct mutex manager_arb; /* manager arbitration */
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	161	struct mutex manager_mutex; /* manager exclusion */
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	162	struct idr worker_idr; /* MG: worker IDs and iteration */
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	163
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	164	struct workqueue_attrs *attrs; /* I: worker attributes */
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	165	struct hlist_node hash_node; /* WQ: unbound_pool_hash node */
				166	int refcnt; /* WQ: refcnt for unbound pools */
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	167
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	168	/*
				169	* The current concurrency level. As it's likely to be accessed
				170	* from other CPUs during try_to_wake_up(), put it in a separate
				171	* cacheline.
				172	*/
				173	atomic_t nr_running ____cacheline_aligned_in_smp;
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	174
				175	/*
				176	* Destruction of pool is sched-RCU protected to allow dereferences
				177	* from get_work_pool().
				178	*/
				179	struct rcu_head rcu;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	180	} ____cacheline_aligned_in_smp;
				181
				182	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	183	* The per-pool workqueue. While queued, the lower WORK_STRUCT_FLAG_BITS
				184	* of work_struct->data are used for flags and the remaining high bits
				185	* point to the pwq; thus, pwqs need to be aligned at two's power of the
				186	* number of flag bits.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	187	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	188	struct pool_workqueue {
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	189	struct worker_pool *pool; /* I: the associated pool */
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	190	struct workqueue_struct *wq; /* I: the owning workqueue */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	191	int work_color; /* L: current color */
				192	int flush_color; /* L: flushing color */
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	193	int refcnt; /* L: reference count */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	194	int nr_in_flight[WORK_NR_COLORS];
				195	/* L: nr of in_flight works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	196	int nr_active; /* L: nr of active works */
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	197	int max_active; /* L: max active works */
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	198	struct list_head delayed_works; /* L: delayed works */
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	199	struct list_head pwqs_node; /* FR: node on wq->pwqs */
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	200	struct list_head mayday_node; /* MD: node on wq->maydays */
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	201
				202	/*
				203	* Release of unbound pwq is punted to system_wq. See put_pwq()
				204	* and pwq_unbound_release_workfn() for details. pool_workqueue
				205	* itself is also sched-RCU protected so that the first pwq can be
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	206	* determined without grabbing pwq_lock.
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	207	*/
				208	struct work_struct unbound_release_work;
				209	struct rcu_head rcu;
Tejun Heo	e904e6c	2013-03-12 11:29:57 -0700	[diff] [blame]	210	} __aligned(1 << WORK_STRUCT_FLAG_BITS);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	211
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	212	/*
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	213	* Structure used to wait for workqueue flush.
				214	*/
				215	struct wq_flusher {
				216	struct list_head list; /* F: list of flushers */
				217	int flush_color; /* F: flush color waiting for */
				218	struct completion done; /* flush completion */
				219	};
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	220
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	221	struct wq_device;
				222
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	223	/*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	224	* The externally visible workqueue. It relays the issued work items to
				225	* the appropriate worker_pool through its pool_workqueues.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	226	*/
				227	struct workqueue_struct {
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	228	unsigned int flags; /* WQ: WQ_* flags */
Tejun Heo	420c0dd	2013-03-12 11:29:59 -0700	[diff] [blame]	229	struct pool_workqueue __percpu *cpu_pwqs; /* I: per-cpu pwq's */
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	230	struct list_head pwqs; /* FR: all pwqs of this wq */
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	231	struct list_head list; /* WQ: list of all workqueues */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	232
				233	struct mutex flush_mutex; /* protects wq flushing */
				234	int work_color; /* F: current work color */
				235	int flush_color; /* F: current flush color */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	236	atomic_t nr_pwqs_to_flush; /* flush in progress */
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	237	struct wq_flusher *first_flusher; /* F: first flusher */
				238	struct list_head flusher_queue; /* F: flush waiters */
				239	struct list_head flusher_overflow; /* F: flush overflow list */
				240
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	241	struct list_head maydays; /* MD: pwqs requesting rescue */
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	242	struct worker *rescuer; /* I: rescue worker */
				243
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	244	int nr_drainers; /* WQ: drain in progress */
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	245	int saved_max_active; /* PW: saved pwq max_active */
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	246
				247	#ifdef CONFIG_SYSFS
				248	struct wq_device *wq_dev; /* I: for sysfs interface */
				249	#endif
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	250	#ifdef CONFIG_LOCKDEP
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	251	struct lockdep_map lockdep_map;
Johannes Berg	4e6045f	2007-10-18 23:39:55 -0700	[diff] [blame]	252	#endif
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	253	char name[]; /* I: workqueue name */
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	254	};
				255
Tejun Heo	e904e6c	2013-03-12 11:29:57 -0700	[diff] [blame]	256	static struct kmem_cache *pwq_cache;
				257
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	258	static DEFINE_MUTEX(wq_mutex); /* protects workqueues and pools */
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	259	static DEFINE_SPINLOCK(pwq_lock); /* protects pool_workqueues */
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	260	static DEFINE_SPINLOCK(wq_mayday_lock); /* protects wq->maydays list */
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	261
				262	static LIST_HEAD(workqueues); /* WQ: list of all workqueues */
				263	static bool workqueue_freezing; /* WQ: have wqs started freezing? */
Tejun Heo	7d19c5c	2013-03-13 19:47:40 -0700	[diff] [blame]	264
				265	/* the per-cpu worker pools */
				266	static DEFINE_PER_CPU_SHARED_ALIGNED(struct worker_pool [NR_STD_WORKER_POOLS],
				267	cpu_worker_pools);
				268
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	269	static DEFINE_IDR(worker_pool_idr); /* WR: idr of all pools */
Tejun Heo	7d19c5c	2013-03-13 19:47:40 -0700	[diff] [blame]	270
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	271	/* WQ: hash of all unbound pools keyed by pool->attrs */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	272	static DEFINE_HASHTABLE(unbound_pool_hash, UNBOUND_POOL_HASH_ORDER);
				273
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	274	/* I: attributes used when instantiating standard unbound pools on demand */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	275	static struct workqueue_attrs *unbound_std_wq_attrs[NR_STD_WORKER_POOLS];
				276
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	277	struct workqueue_struct *system_wq __read_mostly;
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	278	EXPORT_SYMBOL_GPL(system_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	279	struct workqueue_struct *system_highpri_wq __read_mostly;
Joonsoo Kim	1aabe90	2012-08-15 23:25:39 +0900	[diff] [blame]	280	EXPORT_SYMBOL_GPL(system_highpri_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	281	struct workqueue_struct *system_long_wq __read_mostly;
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	282	EXPORT_SYMBOL_GPL(system_long_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	283	struct workqueue_struct *system_unbound_wq __read_mostly;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	284	EXPORT_SYMBOL_GPL(system_unbound_wq);
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	285	struct workqueue_struct *system_freezable_wq __read_mostly;
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	286	EXPORT_SYMBOL_GPL(system_freezable_wq);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	287
Tejun Heo	7d19c5c	2013-03-13 19:47:40 -0700	[diff] [blame]	288	static int worker_thread(void *__worker);
				289	static void copy_workqueue_attrs(struct workqueue_attrs *to,
				290	const struct workqueue_attrs *from);
				291
Tejun Heo	97bd234	2010-10-05 10:41:14 +0200	[diff] [blame]	292	#define CREATE_TRACE_POINTS
				293	#include <trace/events/workqueue.h>
				294
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	295	#define assert_rcu_or_wq_mutex() \
				296	rcu_lockdep_assert(rcu_read_lock_sched_held() || \
				297	lockdep_is_held(&wq_mutex), \
				298	"sched RCU or wq_mutex should be held")
				299
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	300	#define assert_rcu_or_pwq_lock() \
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	301	rcu_lockdep_assert(rcu_read_lock_sched_held() || \
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	302	lockdep_is_held(&pwq_lock), \
				303	"sched RCU or pwq_lock should be held")
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	304
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	305	#ifdef CONFIG_LOCKDEP
				306	#define assert_manager_or_pool_lock(pool) \
				307	WARN_ONCE(!lockdep_is_held(&(pool)->manager_mutex) && \
				308	!lockdep_is_held(&(pool)->lock), \
				309	"pool->manager_mutex or ->lock should be held")
				310	#else
				311	#define assert_manager_or_pool_lock(pool) do { } while (0)
				312	#endif
				313
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	314	#define for_each_cpu_worker_pool(pool, cpu) \
				315	for ((pool) = &per_cpu(cpu_worker_pools, cpu)[0]; \
				316	(pool) < &per_cpu(cpu_worker_pools, cpu)[NR_STD_WORKER_POOLS]; \
Tejun Heo	7a62c2c	2013-03-12 11:30:03 -0700	[diff] [blame]	317	(pool)++)
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	318
Sasha Levin	b67bfe0	2013-02-27 17:06:00 -0800	[diff] [blame]	319	#define for_each_busy_worker(worker, i, pool) \
				320	hash_for_each(pool->busy_hash, i, worker, hentry)
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	321
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	322	/**
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	323	* for_each_pool - iterate through all worker_pools in the system
				324	* @pool: iteration cursor
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame]	325	* @pi: integer used for iteration
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	326	*
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	327	* This must be called either with wq_mutex held or sched RCU read locked.
				328	* If the pool needs to be used beyond the locking in effect, the caller is
				329	* responsible for guaranteeing that the pool stays online.
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	330	*
				331	* The if/else clause exists only for the lockdep assertion and can be
				332	* ignored.
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	333	*/
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame]	334	#define for_each_pool(pool, pi) \
				335	idr_for_each_entry(&worker_pool_idr, pool, pi) \
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	336	if (({ assert_rcu_or_wq_mutex(); false; })) { } \
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	337	else
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	338
				339	/**
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	340	* for_each_pool_worker - iterate through all workers of a worker_pool
				341	* @worker: iteration cursor
				342	* @wi: integer used for iteration
				343	* @pool: worker_pool to iterate workers of
				344	*
				345	* This must be called with either @pool->manager_mutex or ->lock held.
				346	*
				347	* The if/else clause exists only for the lockdep assertion and can be
				348	* ignored.
				349	*/
				350	#define for_each_pool_worker(worker, wi, pool) \
				351	idr_for_each_entry(&(pool)->worker_idr, (worker), (wi)) \
				352	if (({ assert_manager_or_pool_lock((pool)); false; })) { } \
				353	else
				354
				355	/**
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	356	* for_each_pwq - iterate through all pool_workqueues of the specified workqueue
				357	* @pwq: iteration cursor
				358	* @wq: the target workqueue
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	359	*
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	360	* This must be called either with pwq_lock held or sched RCU read locked.
				361	* If the pwq needs to be used beyond the locking in effect, the caller is
				362	* responsible for guaranteeing that the pwq stays online.
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	363	*
				364	* The if/else clause exists only for the lockdep assertion and can be
				365	* ignored.
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	366	*/
				367	#define for_each_pwq(pwq, wq) \
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	368	list_for_each_entry_rcu((pwq), &(wq)->pwqs, pwqs_node) \
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	369	if (({ assert_rcu_or_pwq_lock(); false; })) { } \
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	370	else
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	371
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	372	#ifdef CONFIG_DEBUG_OBJECTS_WORK
				373
				374	static struct debug_obj_descr work_debug_descr;
				375
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	376	static void *work_debug_hint(void *addr)
				377	{
				378	return ((struct work_struct *) addr)->func;
				379	}
				380
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	381	/*
				382	* fixup_init is called when:
				383	* - an active object is initialized
				384	*/
				385	static int work_fixup_init(void *addr, enum debug_obj_state state)
				386	{
				387	struct work_struct *work = addr;
				388
				389	switch (state) {
				390	case ODEBUG_STATE_ACTIVE:
				391	cancel_work_sync(work);
				392	debug_object_init(work, &work_debug_descr);
				393	return 1;
				394	default:
				395	return 0;
				396	}
				397	}
				398
				399	/*
				400	* fixup_activate is called when:
				401	* - an active object is activated
				402	* - an unknown object is activated (might be a statically initialized object)
				403	*/
				404	static int work_fixup_activate(void *addr, enum debug_obj_state state)
				405	{
				406	struct work_struct *work = addr;
				407
				408	switch (state) {
				409
				410	case ODEBUG_STATE_NOTAVAILABLE:
				411	/*
				412	* This is not really a fixup. The work struct was
				413	* statically initialized. We just make sure that it
				414	* is tracked in the object tracker.
				415	*/
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	416	if (test_bit(WORK_STRUCT_STATIC_BIT, work_data_bits(work))) {
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	417	debug_object_init(work, &work_debug_descr);
				418	debug_object_activate(work, &work_debug_descr);
				419	return 0;
				420	}
				421	WARN_ON_ONCE(1);
				422	return 0;
				423
				424	case ODEBUG_STATE_ACTIVE:
				425	WARN_ON(1);
				426
				427	default:
				428	return 0;
				429	}
				430	}
				431
				432	/*
				433	* fixup_free is called when:
				434	* - an active object is freed
				435	*/
				436	static int work_fixup_free(void *addr, enum debug_obj_state state)
				437	{
				438	struct work_struct *work = addr;
				439
				440	switch (state) {
				441	case ODEBUG_STATE_ACTIVE:
				442	cancel_work_sync(work);
				443	debug_object_free(work, &work_debug_descr);
				444	return 1;
				445	default:
				446	return 0;
				447	}
				448	}
				449
				450	static struct debug_obj_descr work_debug_descr = {
				451	.name = "work_struct",
Stanislaw Gruszka	9977728	2011-03-07 09:58:33 +0100	[diff] [blame]	452	.debug_hint = work_debug_hint,
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	453	.fixup_init = work_fixup_init,
				454	.fixup_activate = work_fixup_activate,
				455	.fixup_free = work_fixup_free,
				456	};
				457
				458	static inline void debug_work_activate(struct work_struct *work)
				459	{
				460	debug_object_activate(work, &work_debug_descr);
				461	}
				462
				463	static inline void debug_work_deactivate(struct work_struct *work)
				464	{
				465	debug_object_deactivate(work, &work_debug_descr);
				466	}
				467
				468	void __init_work(struct work_struct *work, int onstack)
				469	{
				470	if (onstack)
				471	debug_object_init_on_stack(work, &work_debug_descr);
				472	else
				473	debug_object_init(work, &work_debug_descr);
				474	}
				475	EXPORT_SYMBOL_GPL(__init_work);
				476
				477	void destroy_work_on_stack(struct work_struct *work)
				478	{
				479	debug_object_free(work, &work_debug_descr);
				480	}
				481	EXPORT_SYMBOL_GPL(destroy_work_on_stack);
				482
				483	#else
				484	static inline void debug_work_activate(struct work_struct *work) { }
				485	static inline void debug_work_deactivate(struct work_struct *work) { }
				486	#endif
				487
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	488	/* allocate ID and assign it to @pool */
				489	static int worker_pool_assign_id(struct worker_pool *pool)
				490	{
				491	int ret;
				492
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	493	lockdep_assert_held(&wq_mutex);
				494
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	495	do {
				496	if (!idr_pre_get(&worker_pool_idr, GFP_KERNEL))
				497	return -ENOMEM;
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	498	ret = idr_get_new(&worker_pool_idr, pool, &pool->id);
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	499	} while (ret == -EAGAIN);
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	500
				501	return ret;
				502	}
				503
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	504	/**
				505	* first_pwq - return the first pool_workqueue of the specified workqueue
				506	* @wq: the target workqueue
				507	*
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	508	* This must be called either with pwq_lock held or sched RCU read locked.
				509	* If the pwq needs to be used beyond the locking in effect, the caller is
				510	* responsible for guaranteeing that the pwq stays online.
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	511	*/
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	512	static struct pool_workqueue *first_pwq(struct workqueue_struct *wq)
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	513	{
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	514	assert_rcu_or_pwq_lock();
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	515	return list_first_or_null_rcu(&wq->pwqs, struct pool_workqueue,
				516	pwqs_node);
Oleg Nesterov	a848e3b	2007-05-09 02:34:17 -0700	[diff] [blame]	517	}
				518
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	519	static unsigned int work_color_to_flags(int color)
				520	{
				521	return color << WORK_STRUCT_COLOR_SHIFT;
				522	}
				523
				524	static int get_work_color(struct work_struct *work)
				525	{
				526	return (*work_data_bits(work) >> WORK_STRUCT_COLOR_SHIFT) &
				527	((1 << WORK_STRUCT_COLOR_BITS) - 1);
				528	}
				529
				530	static int work_next_color(int color)
				531	{
				532	return (color + 1) % WORK_NR_COLORS;
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	533	}
				534
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	535	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	536	* While queued, %WORK_STRUCT_PWQ is set and non flag bits of a work's data
				537	* contain the pointer to the queued pwq. Once execution starts, the flag
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	538	* is cleared and the high bits contain OFFQ flags and pool ID.
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	539	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	540	* set_work_pwq(), set_work_pool_and_clear_pending(), mark_work_canceling()
				541	* and clear_work_data() can be used to set the pwq, pool or clear
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	542	* work->data. These functions should only be called while the work is
				543	* owned - ie. while the PENDING bit is set.
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	544	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	545	* get_work_pool() and get_work_pwq() can be used to obtain the pool or pwq
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	546	* corresponding to a work. Pool is available once the work has been
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	547	* queued anywhere after initialization until it is sync canceled. pwq is
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	548	* available only while the work item is queued.
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	549	*
				550	* %WORK_OFFQ_CANCELING is used to mark a work item which is being
				551	* canceled. While being canceled, a work item may have its PENDING set
				552	* but stay off timer and worklist for arbitrarily long and nobody should
				553	* try to steal the PENDING bit.
David Howells	4594bf1	2006-12-07 11:33:26 +0000	[diff] [blame]	554	*/
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	555	static inline void set_work_data(struct work_struct *work, unsigned long data,
				556	unsigned long flags)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	557	{
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	558	WARN_ON_ONCE(!work_pending(work));
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	559	atomic_long_set(&work->data, data \| flags \| work_static(work));
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	560	}
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	561
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	562	static void set_work_pwq(struct work_struct work, struct pool_workqueue pwq,
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	563	unsigned long extra_flags)
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	564	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	565	set_work_data(work, (unsigned long)pwq,
				566	WORK_STRUCT_PENDING \| WORK_STRUCT_PWQ \| extra_flags);
Oleg Nesterov	4d707b9	2010-04-23 17:40:40 +0200	[diff] [blame]	567	}
				568
Lai Jiangshan	4468a00	2013-02-06 18:04:53 -0800	[diff] [blame]	569	static void set_work_pool_and_keep_pending(struct work_struct *work,
				570	int pool_id)
				571	{
				572	set_work_data(work, (unsigned long)pool_id << WORK_OFFQ_POOL_SHIFT,
				573	WORK_STRUCT_PENDING);
				574	}
				575
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	576	static void set_work_pool_and_clear_pending(struct work_struct *work,
				577	int pool_id)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	578	{
Tejun Heo	23657bb	2012-08-13 17:08:19 -0700	[diff] [blame]	579	/*
				580	* The following wmb is paired with the implied mb in
				581	* test_and_set_bit(PENDING) and ensures all updates to @work made
				582	* here are visible to and precede any updates by the next PENDING
				583	* owner.
				584	*/
				585	smp_wmb();
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	586	set_work_data(work, (unsigned long)pool_id << WORK_OFFQ_POOL_SHIFT, 0);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	587	}
				588
				589	static void clear_work_data(struct work_struct *work)
				590	{
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	591	smp_wmb(); /* see set_work_pool_and_clear_pending() */
				592	set_work_data(work, WORK_STRUCT_NO_POOL, 0);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	593	}
				594
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	595	static struct pool_workqueue get_work_pwq(struct work_struct work)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	596	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	597	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	598
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	599	if (data & WORK_STRUCT_PWQ)
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	600	return (void *)(data & WORK_STRUCT_WQ_DATA_MASK);
				601	else
				602	return NULL;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	603	}
				604
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	605	/**
				606	* get_work_pool - return the worker_pool a given work was associated with
				607	* @work: the work item of interest
				608	*
				609	* Return the worker_pool @work was last associated with. %NULL if none.
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	610	*
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	611	* Pools are created and destroyed under wq_mutex, and allows read access
				612	* under sched-RCU read lock. As such, this function should be called
				613	* under wq_mutex or with preemption disabled.
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	614	*
				615	* All fields of the returned pool are accessible as long as the above
				616	* mentioned locking is in effect. If the returned pool needs to be used
				617	* beyond the critical section, the caller is responsible for ensuring the
				618	* returned pool is and stays online.
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	619	*/
				620	static struct worker_pool get_work_pool(struct work_struct work)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	621	{
Tejun Heo	e120153	2010-07-22 14:14:25 +0200	[diff] [blame]	622	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	623	int pool_id;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	624
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	625	assert_rcu_or_wq_mutex();
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	626
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	627	if (data & WORK_STRUCT_PWQ)
				628	return ((struct pool_workqueue *)
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	629	(data & WORK_STRUCT_WQ_DATA_MASK))->pool;
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	630
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	631	pool_id = data >> WORK_OFFQ_POOL_SHIFT;
				632	if (pool_id == WORK_OFFQ_POOL_NONE)
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	633	return NULL;
				634
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	635	return idr_find(&worker_pool_idr, pool_id);
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	636	}
				637
				638	/**
				639	* get_work_pool_id - return the worker pool ID a given work is associated with
				640	* @work: the work item of interest
				641	*
				642	* Return the worker_pool ID @work was last associated with.
				643	* %WORK_OFFQ_POOL_NONE if none.
				644	*/
				645	static int get_work_pool_id(struct work_struct *work)
				646	{
Lai Jiangshan	54d5b7d	2013-02-07 13:14:20 -0800	[diff] [blame]	647	unsigned long data = atomic_long_read(&work->data);
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	648
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	649	if (data & WORK_STRUCT_PWQ)
				650	return ((struct pool_workqueue *)
Lai Jiangshan	54d5b7d	2013-02-07 13:14:20 -0800	[diff] [blame]	651	(data & WORK_STRUCT_WQ_DATA_MASK))->pool->id;
				652
				653	return data >> WORK_OFFQ_POOL_SHIFT;
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	654	}
				655
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	656	static void mark_work_canceling(struct work_struct *work)
				657	{
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	658	unsigned long pool_id = get_work_pool_id(work);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	659
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	660	pool_id <<= WORK_OFFQ_POOL_SHIFT;
				661	set_work_data(work, pool_id \| WORK_OFFQ_CANCELING, WORK_STRUCT_PENDING);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	662	}
				663
				664	static bool work_is_canceling(struct work_struct *work)
				665	{
				666	unsigned long data = atomic_long_read(&work->data);
				667
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	668	return !(data & WORK_STRUCT_PWQ) && (data & WORK_OFFQ_CANCELING);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	669	}
				670
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	671	/*
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	672	* Policy functions. These define the policies on how the global worker
				673	* pools are managed. Unless noted otherwise, these functions assume that
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	674	* they're being called with pool->lock held.
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	675	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	676
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	677	static bool __need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	678	{
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	679	return !atomic_read(&pool->nr_running);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	680	}
				681
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	682	/*
				683	* Need to wake up a worker? Called from anything but currently
				684	* running workers.
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	685	*
				686	* Note that, because unbound workers never contribute to nr_running, this
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	687	* function will always return %true for unbound pools as long as the
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	688	* worklist isn't empty.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	689	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	690	static bool need_more_worker(struct worker_pool *pool)
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	691	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	692	return !list_empty(&pool->worklist) && __need_more_worker(pool);
David Howells	365970a	2006-11-22 14:54:49 +0000	[diff] [blame]	693	}
				694
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	695	/* Can I start working? Called from busy but !running workers. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	696	static bool may_start_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	697	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	698	return pool->nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	699	}
				700
				701	/* Do I need to keep working? Called from currently running workers. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	702	static bool keep_working(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	703	{
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	704	return !list_empty(&pool->worklist) &&
				705	atomic_read(&pool->nr_running) <= 1;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	706	}
				707
				708	/* Do we need a new worker? Called from manager. */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	709	static bool need_to_create_worker(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	710	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	711	return need_more_worker(pool) && !may_start_working(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	712	}
				713
				714	/* Do I need to be the manager? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	715	static bool need_to_manage_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	716	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	717	return need_to_create_worker(pool) \|\|
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	718	(pool->flags & POOL_MANAGE_WORKERS);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	719	}
				720
				721	/* Do we have too many workers and should some go away? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	722	static bool too_many_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	723	{
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	724	bool managing = mutex_is_locked(&pool->manager_arb);
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	725	int nr_idle = pool->nr_idle + managing; /* manager is considered idle */
				726	int nr_busy = pool->nr_workers - nr_idle;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	727
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	728	/*
				729	* nr_idle and idle_list may disagree if idle rebinding is in
				730	* progress. Never return %true if idle_list is empty.
				731	*/
				732	if (list_empty(&pool->idle_list))
				733	return false;
				734
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	735	return nr_idle > 2 && (nr_idle - 2) * MAX_IDLE_WORKERS_RATIO >= nr_busy;
				736	}
				737
				738	/*
				739	* Wake up functions.
				740	*/
				741
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	742	/* Return the first worker. Safe with preemption disabled */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	743	static struct worker first_worker(struct worker_pool pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	744	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	745	if (unlikely(list_empty(&pool->idle_list)))
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	746	return NULL;
				747
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	748	return list_first_entry(&pool->idle_list, struct worker, entry);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	749	}
				750
				751	/**
				752	* wake_up_worker - wake up an idle worker
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	753	* @pool: worker pool to wake worker from
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	754	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	755	* Wake up the first idle worker of @pool.
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	756	*
				757	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	758	* spin_lock_irq(pool->lock).
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	759	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	760	static void wake_up_worker(struct worker_pool *pool)
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	761	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	762	struct worker *worker = first_worker(pool);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	763
				764	if (likely(worker))
				765	wake_up_process(worker->task);
				766	}
				767
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	768	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	769	* wq_worker_waking_up - a worker is waking up
				770	* @task: task waking up
				771	* @cpu: CPU @task is waking up to
				772	*
				773	* This function is called during try_to_wake_up() when a worker is
				774	* being awoken.
				775	*
				776	* CONTEXT:
				777	* spin_lock_irq(rq->lock)
				778	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	779	void wq_worker_waking_up(struct task_struct *task, int cpu)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	780	{
				781	struct worker *worker = kthread_data(task);
				782
Joonsoo Kim	3657600	2012-10-26 23:03:49 +0900	[diff] [blame]	783	if (!(worker->flags & WORKER_NOT_RUNNING)) {
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	784	WARN_ON_ONCE(worker->pool->cpu != cpu);
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	785	atomic_inc(&worker->pool->nr_running);
Joonsoo Kim	3657600	2012-10-26 23:03:49 +0900	[diff] [blame]	786	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	787	}
				788
				789	/**
				790	* wq_worker_sleeping - a worker is going to sleep
				791	* @task: task going to sleep
				792	* @cpu: CPU in question, must be the current CPU number
				793	*
				794	* This function is called during schedule() when a busy worker is
				795	* going to sleep. Worker on the same cpu can be woken up by
				796	* returning pointer to its task.
				797	*
				798	* CONTEXT:
				799	* spin_lock_irq(rq->lock)
				800	*
				801	* RETURNS:
				802	* Worker task on @cpu to wake up, %NULL if none.
				803	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	804	struct task_struct wq_worker_sleeping(struct task_struct task, int cpu)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	805	{
				806	struct worker worker = kthread_data(task), to_wakeup = NULL;
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	807	struct worker_pool *pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	808
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	809	/*
				810	* Rescuers, which may not have all the fields set up like normal
				811	* workers, also reach here, let's not access anything before
				812	* checking NOT_RUNNING.
				813	*/
Steven Rostedt	2d64672	2010-12-03 23:12:33 -0500	[diff] [blame]	814	if (worker->flags & WORKER_NOT_RUNNING)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	815	return NULL;
				816
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	817	pool = worker->pool;
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	818
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	819	/* this can only happen on the local cpu */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	820	if (WARN_ON_ONCE(cpu != raw_smp_processor_id()))
				821	return NULL;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	822
				823	/*
				824	* The counterpart of the following dec_and_test, implied mb,
				825	* worklist not empty test sequence is in insert_work().
				826	* Please read comment there.
				827	*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	828	* NOT_RUNNING is clear. This means that we're bound to and
				829	* running on the local cpu w/ rq lock held and preemption
				830	* disabled, which in turn means that none else could be
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	831	* manipulating idle_list, so dereferencing idle_list without pool
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	832	* lock is safe.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	833	*/
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	834	if (atomic_dec_and_test(&pool->nr_running) &&
				835	!list_empty(&pool->worklist))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	836	to_wakeup = first_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	837	return to_wakeup ? to_wakeup->task : NULL;
				838	}
				839
				840	/**
				841	* worker_set_flags - set worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	842	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	843	* @flags: flags to set
				844	* @wakeup: wakeup an idle worker if necessary
				845	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	846	* Set @flags in @worker->flags and adjust nr_running accordingly. If
				847	* nr_running becomes zero and @wakeup is %true, an idle worker is
				848	* woken up.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	849	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	850	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	851	* spin_lock_irq(pool->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	852	*/
				853	static inline void worker_set_flags(struct worker *worker, unsigned int flags,
				854	bool wakeup)
				855	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	856	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	857
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	858	WARN_ON_ONCE(worker->task != current);
				859
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	860	/*
				861	* If transitioning into NOT_RUNNING, adjust nr_running and
				862	* wake up an idle worker as necessary if requested by
				863	* @wakeup.
				864	*/
				865	if ((flags & WORKER_NOT_RUNNING) &&
				866	!(worker->flags & WORKER_NOT_RUNNING)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	867	if (wakeup) {
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	868	if (atomic_dec_and_test(&pool->nr_running) &&
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	869	!list_empty(&pool->worklist))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	870	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	871	} else
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	872	atomic_dec(&pool->nr_running);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	873	}
				874
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	875	worker->flags \|= flags;
				876	}
				877
				878	/**
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	879	* worker_clr_flags - clear worker flags and adjust nr_running accordingly
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	880	* @worker: self
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	881	* @flags: flags to clear
				882	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	883	* Clear @flags in @worker->flags and adjust nr_running accordingly.
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	884	*
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	885	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	886	* spin_lock_irq(pool->lock)
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	887	*/
				888	static inline void worker_clr_flags(struct worker *worker, unsigned int flags)
				889	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	890	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	891	unsigned int oflags = worker->flags;
				892
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	893	WARN_ON_ONCE(worker->task != current);
				894
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	895	worker->flags &= ~flags;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	896
Tejun Heo	42c025f	2011-01-11 15:58:49 +0100	[diff] [blame]	897	/*
				898	* If transitioning out of NOT_RUNNING, increment nr_running. Note
				899	* that the nested NOT_RUNNING is not a noop. NOT_RUNNING is mask
				900	* of multiple flags, not a single flag.
				901	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	902	if ((flags & WORKER_NOT_RUNNING) && (oflags & WORKER_NOT_RUNNING))
				903	if (!(worker->flags & WORKER_NOT_RUNNING))
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	904	atomic_inc(&pool->nr_running);
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	905	}
				906
				907	/**
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	908	* find_worker_executing_work - find worker which is executing a work
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	909	* @pool: pool of interest
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	910	* @work: work to find worker for
				911	*
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	912	* Find a worker which is executing @work on @pool by searching
				913	* @pool->busy_hash which is keyed by the address of @work. For a worker
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	914	* to match, its current execution should match the address of @work and
				915	* its work function. This is to avoid unwanted dependency between
				916	* unrelated work executions through a work item being recycled while still
				917	* being executed.
				918	*
				919	* This is a bit tricky. A work item may be freed once its execution
				920	* starts and nothing prevents the freed area from being recycled for
				921	* another work item. If the same work item address ends up being reused
				922	* before the original execution finishes, workqueue will identify the
				923	* recycled work item as currently executing and make it wait until the
				924	* current execution finishes, introducing an unwanted dependency.
				925	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	926	* This function checks the work item address and work function to avoid
				927	* false positives. Note that this isn't complete as one may construct a
				928	* work function which can introduce dependency onto itself through a
				929	* recycled work item. Well, if somebody wants to shoot oneself in the
				930	* foot that badly, there's only so much we can do, and if such deadlock
				931	* actually occurs, it should be easy to locate the culprit work function.
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	932	*
				933	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	934	* spin_lock_irq(pool->lock).
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	935	*
				936	* RETURNS:
				937	* Pointer to worker which is executing @work if found, NULL
				938	* otherwise.
				939	*/
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	940	static struct worker find_worker_executing_work(struct worker_pool pool,
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	941	struct work_struct *work)
				942	{
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	943	struct worker *worker;
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	944
Sasha Levin	b67bfe0	2013-02-27 17:06:00 -0800	[diff] [blame]	945	hash_for_each_possible(pool->busy_hash, worker, hentry,
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	946	(unsigned long)work)
				947	if (worker->current_work == work &&
				948	worker->current_func == work->func)
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	949	return worker;
				950
				951	return NULL;
Tejun Heo	8cca0ee	2010-06-29 10:07:13 +0200	[diff] [blame]	952	}
				953
				954	/**
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	955	* move_linked_works - move linked works to a list
				956	* @work: start of series of works to be scheduled
				957	* @head: target list to append @work to
				958	* @nextp: out paramter for nested worklist walking
				959	*
				960	* Schedule linked works starting from @work to @head. Work series to
				961	* be scheduled starts at @work and includes any consecutive work with
				962	* WORK_STRUCT_LINKED set in its predecessor.
				963	*
				964	* If @nextp is not NULL, it's updated to point to the next work of
				965	* the last scheduled work. This allows move_linked_works() to be
				966	* nested inside outer list_for_each_entry_safe().
				967	*
				968	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	969	* spin_lock_irq(pool->lock).
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	970	*/
				971	static void move_linked_works(struct work_struct work, struct list_head head,
				972	struct work_struct **nextp)
				973	{
				974	struct work_struct *n;
				975
				976	/*
				977	* Linked worklist will always end before the end of the list,
				978	* use NULL for list head.
				979	*/
				980	list_for_each_entry_safe_from(work, n, NULL, entry) {
				981	list_move_tail(&work->entry, head);
				982	if (!(*work_data_bits(work) & WORK_STRUCT_LINKED))
				983	break;
				984	}
				985
				986	/*
				987	* If we're already inside safe list traversal and have moved
				988	* multiple works to the scheduled queue, the next position
				989	* needs to be updated.
				990	*/
				991	if (nextp)
				992	*nextp = n;
				993	}
				994
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	995	/**
				996	* get_pwq - get an extra reference on the specified pool_workqueue
				997	* @pwq: pool_workqueue to get
				998	*
				999	* Obtain an extra reference on @pwq. The caller should guarantee that
				1000	* @pwq has positive refcnt and be holding the matching pool->lock.
				1001	*/
				1002	static void get_pwq(struct pool_workqueue *pwq)
				1003	{
				1004	lockdep_assert_held(&pwq->pool->lock);
				1005	WARN_ON_ONCE(pwq->refcnt <= 0);
				1006	pwq->refcnt++;
				1007	}
				1008
				1009	/**
				1010	* put_pwq - put a pool_workqueue reference
				1011	* @pwq: pool_workqueue to put
				1012	*
				1013	* Drop a reference of @pwq. If its refcnt reaches zero, schedule its
				1014	* destruction. The caller should be holding the matching pool->lock.
				1015	*/
				1016	static void put_pwq(struct pool_workqueue *pwq)
				1017	{
				1018	lockdep_assert_held(&pwq->pool->lock);
				1019	if (likely(--pwq->refcnt))
				1020	return;
				1021	if (WARN_ON_ONCE(!(pwq->wq->flags & WQ_UNBOUND)))
				1022	return;
				1023	/*
				1024	* @pwq can't be released under pool->lock, bounce to
				1025	* pwq_unbound_release_workfn(). This never recurses on the same
				1026	* pool->lock as this path is taken only for unbound workqueues and
				1027	* the release work item is scheduled on a per-cpu workqueue. To
				1028	* avoid lockdep warning, unbound pool->locks are given lockdep
				1029	* subclass of 1 in get_unbound_pool().
				1030	*/
				1031	schedule_work(&pwq->unbound_release_work);
				1032	}
				1033
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1034	static void pwq_activate_delayed_work(struct work_struct *work)
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1035	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1036	struct pool_workqueue *pwq = get_work_pwq(work);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1037
				1038	trace_workqueue_activate_work(work);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1039	move_linked_works(work, &pwq->pool->worklist, NULL);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1040	__clear_bit(WORK_STRUCT_DELAYED_BIT, work_data_bits(work));
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1041	pwq->nr_active++;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1042	}
				1043
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1044	static void pwq_activate_first_delayed(struct pool_workqueue *pwq)
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1045	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1046	struct work_struct *work = list_first_entry(&pwq->delayed_works,
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1047	struct work_struct, entry);
				1048
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1049	pwq_activate_delayed_work(work);
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1050	}
				1051
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1052	/**
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1053	* pwq_dec_nr_in_flight - decrement pwq's nr_in_flight
				1054	* @pwq: pwq of interest
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1055	* @color: color of work which left the queue
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1056	*
				1057	* A work either has completed or is removed from pending queue,
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1058	* decrement nr_in_flight of its pwq and handle workqueue flushing.
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1059	*
				1060	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1061	* spin_lock_irq(pool->lock).
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1062	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1063	static void pwq_dec_nr_in_flight(struct pool_workqueue *pwq, int color)
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1064	{
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1065	/* uncolored work items don't participate in flushing or nr_active */
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1066	if (color == WORK_NO_COLOR)
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1067	goto out_put;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1068
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1069	pwq->nr_in_flight[color]--;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1070
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1071	pwq->nr_active--;
				1072	if (!list_empty(&pwq->delayed_works)) {
Lai Jiangshan	b3f9f40	2012-09-18 10:40:00 -0700	[diff] [blame]	1073	/* one down, submit a delayed one */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1074	if (pwq->nr_active < pwq->max_active)
				1075	pwq_activate_first_delayed(pwq);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1076	}
				1077
				1078	/* is flush in progress and are we at the flushing tip? */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1079	if (likely(pwq->flush_color != color))
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1080	goto out_put;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1081
				1082	/* are there still in-flight works? */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1083	if (pwq->nr_in_flight[color])
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1084	goto out_put;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1085
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1086	/* this pwq is done, clear flush_color */
				1087	pwq->flush_color = -1;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1088
				1089	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1090	* If this was the last pwq, wake up the first flusher. It
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1091	* will handle the rest.
				1092	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1093	if (atomic_dec_and_test(&pwq->wq->nr_pwqs_to_flush))
				1094	complete(&pwq->wq->first_flusher->done);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1095	out_put:
				1096	put_pwq(pwq);
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1097	}
				1098
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1099	/**
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1100	* try_to_grab_pending - steal work item from worklist and disable irq
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1101	* @work: work item to steal
				1102	* @is_dwork: @work is a delayed_work
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1103	* @flags: place to store irq state
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1104	*
				1105	* Try to grab PENDING bit of @work. This function can handle @work in any
				1106	* stable state - idle, on timer or on worklist. Return values are
				1107	*
				1108	* 1 if @work was pending and we successfully stole PENDING
				1109	* 0 if @work was idle and we claimed PENDING
				1110	* -EAGAIN if PENDING couldn't be grabbed at the moment, safe to busy-retry
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1111	* -ENOENT if someone else is canceling @work, this state may persist
				1112	* for arbitrarily long
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1113	*
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1114	* On >= 0 return, the caller owns @work's PENDING bit. To avoid getting
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1115	* interrupted while holding PENDING and @work off queue, irq must be
				1116	* disabled on entry. This, combined with delayed_work->timer being
				1117	* irqsafe, ensures that we return -EAGAIN for finite short period of time.
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1118	*
				1119	* On successful return, >= 0, irq is disabled and the caller is
				1120	* responsible for releasing it using local_irq_restore(*@flags).
				1121	*
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1122	* This function is safe to call from any context including IRQ handler.
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1123	*/
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1124	static int try_to_grab_pending(struct work_struct *work, bool is_dwork,
				1125	unsigned long *flags)
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1126	{
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1127	struct worker_pool *pool;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1128	struct pool_workqueue *pwq;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1129
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1130	local_irq_save(*flags);
				1131
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1132	/* try to steal the timer if it exists */
				1133	if (is_dwork) {
				1134	struct delayed_work *dwork = to_delayed_work(work);
				1135
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1136	/*
				1137	* dwork->timer is irqsafe. If del_timer() fails, it's
				1138	* guaranteed that the timer is not queued anywhere and not
				1139	* running on the local CPU.
				1140	*/
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1141	if (likely(del_timer(&dwork->timer)))
				1142	return 1;
				1143	}
				1144
				1145	/* try to claim PENDING the normal way */
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1146	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work)))
				1147	return 0;
				1148
				1149	/*
				1150	* The queueing is in progress, or it is already queued. Try to
				1151	* steal it from ->worklist without clearing WORK_STRUCT_PENDING.
				1152	*/
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1153	pool = get_work_pool(work);
				1154	if (!pool)
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1155	goto fail;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1156
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1157	spin_lock(&pool->lock);
Lai Jiangshan	0b3dae6	2013-02-06 18:04:53 -0800	[diff] [blame]	1158	/*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1159	* work->data is guaranteed to point to pwq only while the work
				1160	* item is queued on pwq->wq, and both updating work->data to point
				1161	* to pwq on queueing and to pool on dequeueing are done under
				1162	* pwq->pool->lock. This in turn guarantees that, if work->data
				1163	* points to pwq which is associated with a locked pool, the work
Lai Jiangshan	0b3dae6	2013-02-06 18:04:53 -0800	[diff] [blame]	1164	* item is currently queued on that pool.
				1165	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1166	pwq = get_work_pwq(work);
				1167	if (pwq && pwq->pool == pool) {
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1168	debug_work_deactivate(work);
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1169
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1170	/*
				1171	* A delayed work item cannot be grabbed directly because
				1172	* it might have linked NO_COLOR work items which, if left
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1173	* on the delayed_list, will confuse pwq->nr_active
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1174	* management later on and cause stall. Make sure the work
				1175	* item is activated before grabbing.
				1176	*/
				1177	if (*work_data_bits(work) & WORK_STRUCT_DELAYED)
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1178	pwq_activate_delayed_work(work);
Lai Jiangshan	3aa6249	2012-09-18 10:40:00 -0700	[diff] [blame]	1179
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1180	list_del_init(&work->entry);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1181	pwq_dec_nr_in_flight(get_work_pwq(work), get_work_color(work));
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1182
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1183	/* work->data points to pwq iff queued, point to pool */
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1184	set_work_pool_and_keep_pending(work, pool->id);
Lai Jiangshan	4468a00	2013-02-06 18:04:53 -0800	[diff] [blame]	1185
Tejun Heo	1606283	2013-02-06 18:04:53 -0800	[diff] [blame]	1186	spin_unlock(&pool->lock);
				1187	return 1;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1188	}
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1189	spin_unlock(&pool->lock);
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	1190	fail:
				1191	local_irq_restore(*flags);
				1192	if (work_is_canceling(work))
				1193	return -ENOENT;
				1194	cpu_relax();
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	1195	return -EAGAIN;
Tejun Heo	bf4ede0	2012-08-03 10:30:46 -0700	[diff] [blame]	1196	}
				1197
				1198	/**
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1199	* insert_work - insert a work into a pool
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1200	* @pwq: pwq @work belongs to
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1201	* @work: work to insert
				1202	* @head: insertion point
				1203	* @extra_flags: extra WORK_STRUCT_* flags to set
				1204	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1205	* Insert @work which belongs to @pwq after @head. @extra_flags is or'd to
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1206	* work_struct flags.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1207	*
				1208	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1209	* spin_lock_irq(pool->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1210	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1211	static void insert_work(struct pool_workqueue pwq, struct work_struct work,
				1212	struct list_head *head, unsigned int extra_flags)
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	1213	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1214	struct worker_pool *pool = pwq->pool;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	1215
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1216	/* we own @work, set data and link */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1217	set_work_pwq(work, pwq, extra_flags);
Oleg Nesterov	1a4d9b0	2008-07-25 01:47:47 -0700	[diff] [blame]	1218	list_add_tail(&work->entry, head);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	1219	get_pwq(pwq);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1220
				1221	/*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1222	* Ensure either wq_worker_sleeping() sees the above
				1223	* list_add_tail() or we see zero nr_running to avoid workers lying
				1224	* around lazily while there are works to be processed.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1225	*/
				1226	smp_mb();
				1227
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1228	if (__need_more_worker(pool))
				1229	wake_up_worker(pool);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	1230	}
				1231
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1232	/*
				1233	* Test whether @work is being queued from another work executing on the
Tejun Heo	8d03ecf	2013-02-13 19:29:10 -0800	[diff] [blame]	1234	* same workqueue.
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1235	*/
				1236	static bool is_chained_work(struct workqueue_struct *wq)
				1237	{
Tejun Heo	8d03ecf	2013-02-13 19:29:10 -0800	[diff] [blame]	1238	struct worker *worker;
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1239
Tejun Heo	8d03ecf	2013-02-13 19:29:10 -0800	[diff] [blame]	1240	worker = current_wq_worker();
				1241	/*
				1242	* Return %true iff I'm a worker execuing a work item on @wq. If
				1243	* I'm @worker, it's safe to dereference it without locking.
				1244	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1245	return worker && worker->current_pwq->wq == wq;
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1246	}
				1247
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	1248	static void __queue_work(int cpu, struct workqueue_struct *wq,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1249	struct work_struct *work)
				1250	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1251	struct pool_workqueue *pwq;
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1252	struct worker_pool *last_pool;
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1253	struct list_head *worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1254	unsigned int work_flags;
Joonsoo Kim	b75cac9	2012-08-15 23:25:37 +0900	[diff] [blame]	1255	unsigned int req_cpu = cpu;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1256
				1257	/*
				1258	* While a work item is PENDING && off queue, a task trying to
				1259	* steal the PENDING will busy-loop waiting for it to either get
				1260	* queued or lose PENDING. Grabbing PENDING and queueing should
				1261	* happen with IRQ disabled.
				1262	*/
				1263	WARN_ON_ONCE(!irqs_disabled());
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1264
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	1265	debug_work_activate(work);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1266
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1267	/* if dying, only works from the same workqueue are allowed */
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	1268	if (unlikely(wq->flags & __WQ_DRAINING) &&
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	1269	WARN_ON_ONCE(!is_chained_work(wq)))
Tejun Heo	e41e704	2010-08-24 14:22:47 +0200	[diff] [blame]	1270	return;
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	1271	retry:
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1272	/* pwq which will be used unless @work is executing elsewhere */
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1273	if (!(wq->flags & WQ_UNBOUND)) {
Tejun Heo	5746982	2012-08-03 10:30:45 -0700	[diff] [blame]	1274	if (cpu == WORK_CPU_UNBOUND)
Tejun Heo	c7fc77f	2010-07-02 10:03:51 +0200	[diff] [blame]	1275	cpu = raw_smp_processor_id();
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	1276	pwq = per_cpu_ptr(wq->cpu_pwqs, cpu);
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1277	} else {
				1278	pwq = first_pwq(wq);
				1279	}
Tejun Heo	dbf2576	2012-08-20 14:51:23 -0700	[diff] [blame]	1280
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1281	/*
				1282	* If @work was previously on a different pool, it might still be
				1283	* running there, in which case the work needs to be queued on that
				1284	* pool to guarantee non-reentrancy.
				1285	*/
				1286	last_pool = get_work_pool(work);
				1287	if (last_pool && last_pool != pwq->pool) {
				1288	struct worker *worker;
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1289
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1290	spin_lock(&last_pool->lock);
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1291
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1292	worker = find_worker_executing_work(last_pool, work);
Tejun Heo	18aa9ef	2010-06-29 10:07:13 +0200	[diff] [blame]	1293
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1294	if (worker && worker->current_pwq->wq == wq) {
				1295	pwq = worker->current_pwq;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1296	} else {
Tejun Heo	c917808	2013-03-12 11:30:04 -0700	[diff] [blame]	1297	/* meh... not running there, queue here */
				1298	spin_unlock(&last_pool->lock);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1299	spin_lock(&pwq->pool->lock);
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1300	}
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1301	} else {
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1302	spin_lock(&pwq->pool->lock);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1303	}
				1304
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	1305	/*
				1306	* pwq is determined and locked. For unbound pools, we could have
				1307	* raced with pwq release and it could already be dead. If its
				1308	* refcnt is zero, repeat pwq selection. Note that pwqs never die
				1309	* without another pwq replacing it as the first pwq or while a
				1310	* work item is executing on it, so the retying is guaranteed to
				1311	* make forward-progress.
				1312	*/
				1313	if (unlikely(!pwq->refcnt)) {
				1314	if (wq->flags & WQ_UNBOUND) {
				1315	spin_unlock(&pwq->pool->lock);
				1316	cpu_relax();
				1317	goto retry;
				1318	}
				1319	/* oops */
				1320	WARN_ONCE(true, "workqueue: per-cpu pwq for %s on cpu%d has 0 refcnt",
				1321	wq->name, cpu);
				1322	}
				1323
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1324	/* pwq determined, queue */
				1325	trace_workqueue_queue_work(req_cpu, pwq, work);
Tejun Heo	502ca9d	2010-06-29 10:07:13 +0200	[diff] [blame]	1326
Dan Carpenter	f5b2552	2012-04-13 22:06:58 +0300	[diff] [blame]	1327	if (WARN_ON(!list_empty(&work->entry))) {
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1328	spin_unlock(&pwq->pool->lock);
Dan Carpenter	f5b2552	2012-04-13 22:06:58 +0300	[diff] [blame]	1329	return;
				1330	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1331
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1332	pwq->nr_in_flight[pwq->work_color]++;
				1333	work_flags = work_color_to_flags(pwq->work_color);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1334
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1335	if (likely(pwq->nr_active < pwq->max_active)) {
Tejun Heo	cdadf00	2010-10-05 10:49:55 +0200	[diff] [blame]	1336	trace_workqueue_activate_work(work);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1337	pwq->nr_active++;
				1338	worklist = &pwq->pool->worklist;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1339	} else {
				1340	work_flags \|= WORK_STRUCT_DELAYED;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1341	worklist = &pwq->delayed_works;
Tejun Heo	8a2e8e5d	2010-08-25 10:33:56 +0200	[diff] [blame]	1342	}
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1343
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1344	insert_work(pwq, work, worklist, work_flags);
Tejun Heo	1e19ffc	2010-06-29 10:07:12 +0200	[diff] [blame]	1345
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1346	spin_unlock(&pwq->pool->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1347	}
				1348
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1349	/**
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1350	* queue_work_on - queue work on specific cpu
				1351	* @cpu: CPU number to execute work on
				1352	* @wq: workqueue to use
				1353	* @work: work to queue
				1354	*
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1355	* Returns %false if @work was already on a queue, %true otherwise.
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1356	*
				1357	* We queue the work to a specific CPU, the caller must ensure it
				1358	* can't go away.
				1359	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1360	bool queue_work_on(int cpu, struct workqueue_struct *wq,
				1361	struct work_struct *work)
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1362	{
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1363	bool ret = false;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1364	unsigned long flags;
				1365
				1366	local_irq_save(flags);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1367
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1368	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	1369	__queue_work(cpu, wq, work);
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1370	ret = true;
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1371	}
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1372
				1373	local_irq_restore(flags);
Zhang Rui	c1a220e	2008-07-23 21:28:39 -0700	[diff] [blame]	1374	return ret;
				1375	}
				1376	EXPORT_SYMBOL_GPL(queue_work_on);
				1377
Tejun Heo	d8e794d	2012-08-03 10:30:45 -0700	[diff] [blame]	1378	void delayed_work_timer_fn(unsigned long __data)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1379	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1380	struct delayed_work dwork = (struct delayed_work )__data;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1381
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1382	/* should have been called from irqsafe timer with irq already off */
Lai Jiangshan	60c057b	2013-02-06 18:04:53 -0800	[diff] [blame]	1383	__queue_work(dwork->cpu, dwork->wq, &dwork->work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1384	}
Konstantin Khlebnikov	1438ade5	2013-01-24 16:36:31 +0400	[diff] [blame]	1385	EXPORT_SYMBOL(delayed_work_timer_fn);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1386
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1387	static void __queue_delayed_work(int cpu, struct workqueue_struct *wq,
				1388	struct delayed_work *dwork, unsigned long delay)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1389	{
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1390	struct timer_list *timer = &dwork->timer;
				1391	struct work_struct *work = &dwork->work;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1392
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1393	WARN_ON_ONCE(timer->function != delayed_work_timer_fn \|\|
				1394	timer->data != (unsigned long)dwork);
Tejun Heo	fc4b514	2012-12-04 07:40:39 -0800	[diff] [blame]	1395	WARN_ON_ONCE(timer_pending(timer));
				1396	WARN_ON_ONCE(!list_empty(&work->entry));
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1397
Tejun Heo	8852aac	2012-12-01 16:23:42 -0800	[diff] [blame]	1398	/*
				1399	* If @delay is 0, queue @dwork->work immediately. This is for
				1400	* both optimization and correctness. The earliest @timer can
				1401	* expire is on the closest next tick and delayed_work users depend
				1402	* on that there's no such delay when @delay is 0.
				1403	*/
				1404	if (!delay) {
				1405	__queue_work(cpu, wq, &dwork->work);
				1406	return;
				1407	}
				1408
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1409	timer_stats_timer_set_start_info(&dwork->timer);
				1410
Lai Jiangshan	60c057b	2013-02-06 18:04:53 -0800	[diff] [blame]	1411	dwork->wq = wq;
Tejun Heo	1265057	2012-08-08 09:38:42 -0700	[diff] [blame]	1412	dwork->cpu = cpu;
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1413	timer->expires = jiffies + delay;
				1414
				1415	if (unlikely(cpu != WORK_CPU_UNBOUND))
				1416	add_timer_on(timer, cpu);
				1417	else
				1418	add_timer(timer);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1419	}
				1420
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1421	/**
				1422	* queue_delayed_work_on - queue work on specific CPU after delay
				1423	* @cpu: CPU number to execute work on
				1424	* @wq: workqueue to use
Randy Dunlap	af9997e	2006-12-22 01:06:52 -0800	[diff] [blame]	1425	* @dwork: work to queue
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1426	* @delay: number of jiffies to wait before queueing
				1427	*
Tejun Heo	715f130	2012-08-03 10:30:46 -0700	[diff] [blame]	1428	* Returns %false if @work was already on a queue, %true otherwise. If
				1429	* @delay is zero and @dwork is idle, it will be scheduled for immediate
				1430	* execution.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	1431	*/
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1432	bool queue_delayed_work_on(int cpu, struct workqueue_struct *wq,
				1433	struct delayed_work *dwork, unsigned long delay)
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1434	{
David Howells	52bad64	2006-11-22 14:54:01 +0000	[diff] [blame]	1435	struct work_struct *work = &dwork->work;
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1436	bool ret = false;
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1437	unsigned long flags;
				1438
				1439	/* read the comment in __queue_work() */
				1440	local_irq_save(flags);
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1441
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	1442	if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
Tejun Heo	7beb2ed	2012-08-03 10:30:46 -0700	[diff] [blame]	1443	__queue_delayed_work(cpu, wq, dwork, delay);
Tejun Heo	d4283e9	2012-08-03 10:30:44 -0700	[diff] [blame]	1444	ret = true;
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1445	}
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	1446
				1447	local_irq_restore(flags);
Venkatesh Pallipadi	7a6bc1c	2006-06-28 13:50:33 -0700	[diff] [blame]	1448	return ret;
				1449	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	1450	EXPORT_SYMBOL_GPL(queue_delayed_work_on);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1451
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1452	/**
Tejun Heo	8376fe2	2012-08-03 10:30:47 -0700	[diff] [blame]	1453	* mod_delayed_work_on - modify delay of or queue a delayed work on specific CPU
				1454	* @cpu: CPU number to execute work on
				1455	* @wq: workqueue to use
				1456	* @dwork: work to queue
				1457	* @delay: number of jiffies to wait before queueing
				1458	*
				1459	* If @dwork is idle, equivalent to queue_delayed_work_on(); otherwise,
				1460	* modify @dwork's timer so that it expires after @delay. If @delay is
				1461	* zero, @work is guaranteed to be scheduled immediately regardless of its
				1462	* current state.
				1463	*
				1464	* Returns %false if @dwork was idle and queued, %true if @dwork was
				1465	* pending and its timer was modified.
				1466	*
Tejun Heo	e0aecdd	2012-08-21 13:18:24 -0700	[diff] [blame]	1467	* This function is safe to call from any context including IRQ handler.
Tejun Heo	8376fe2	2012-08-03 10:30:47 -0700	[diff] [blame]	1468	* See try_to_grab_pending() for details.
				1469	*/
				1470	bool mod_delayed_work_on(int cpu, struct workqueue_struct *wq,
				1471	struct delayed_work *dwork, unsigned long delay)
				1472	{
				1473	unsigned long flags;
				1474	int ret;
				1475
				1476	do {
				1477	ret = try_to_grab_pending(&dwork->work, true, &flags);
				1478	} while (unlikely(ret == -EAGAIN));
				1479
				1480	if (likely(ret >= 0)) {
				1481	__queue_delayed_work(cpu, wq, dwork, delay);
				1482	local_irq_restore(flags);
				1483	}
				1484
				1485	/* -ENOENT from try_to_grab_pending() becomes %true */
				1486	return ret;
				1487	}
				1488	EXPORT_SYMBOL_GPL(mod_delayed_work_on);
				1489
				1490	/**
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1491	* worker_enter_idle - enter idle state
				1492	* @worker: worker which is entering idle state
				1493	*
				1494	* @worker is entering idle state. Update stats and idle timer if
				1495	* necessary.
				1496	*
				1497	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1498	* spin_lock_irq(pool->lock).
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1499	*/
				1500	static void worker_enter_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1501	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1502	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1503
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1504	if (WARN_ON_ONCE(worker->flags & WORKER_IDLE) \|\|
				1505	WARN_ON_ONCE(!list_empty(&worker->entry) &&
				1506	(worker->hentry.next \|\| worker->hentry.pprev)))
				1507	return;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1508
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1509	/* can't use worker_set_flags(), also called from start_worker() */
				1510	worker->flags \|= WORKER_IDLE;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1511	pool->nr_idle++;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1512	worker->last_active = jiffies;
Peter Zijlstra	d5abe66	2006-12-06 20:37:26 -0800	[diff] [blame]	1513
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1514	/* idle_list is LIFO */
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1515	list_add(&worker->entry, &pool->idle_list);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	1516
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	1517	if (too_many_workers(pool) && !timer_pending(&pool->idle_timer))
				1518	mod_timer(&pool->idle_timer, jiffies + IDLE_WORKER_TIMEOUT);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1519
Tejun Heo	544ecf3	2012-05-14 15:04:50 -0700	[diff] [blame]	1520	/*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1521	* Sanity check nr_running. Because wq_unbind_fn() releases
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1522	* pool->lock between setting %WORKER_UNBOUND and zapping
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	1523	* nr_running, the warning may trigger spuriously. Check iff
				1524	* unbind is not in progress.
Tejun Heo	544ecf3	2012-05-14 15:04:50 -0700	[diff] [blame]	1525	*/
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1526	WARN_ON_ONCE(!(pool->flags & POOL_DISASSOCIATED) &&
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1527	pool->nr_workers == pool->nr_idle &&
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	1528	atomic_read(&pool->nr_running));
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1529	}
				1530
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1531	/**
				1532	* worker_leave_idle - leave idle state
				1533	* @worker: worker which is leaving idle state
				1534	*
				1535	* @worker is leaving idle state. Update stats.
				1536	*
				1537	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1538	* spin_lock_irq(pool->lock).
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1539	*/
				1540	static void worker_leave_idle(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1541	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1542	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1543
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1544	if (WARN_ON_ONCE(!(worker->flags & WORKER_IDLE)))
				1545	return;
Tejun Heo	d302f01	2010-06-29 10:07:13 +0200	[diff] [blame]	1546	worker_clr_flags(worker, WORKER_IDLE);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1547	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1548	list_del_init(&worker->entry);
				1549	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1550
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1551	/**
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1552	* worker_maybe_bind_and_lock - try to bind %current to worker_pool and lock it
				1553	* @pool: target worker_pool
				1554	*
				1555	* Bind %current to the cpu of @pool if it is associated and lock @pool.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1556	*
				1557	* Works which are scheduled while the cpu is online must at least be
				1558	* scheduled to a worker which is bound to the cpu so that if they are
				1559	* flushed from cpu callbacks while cpu is going down, they are
				1560	* guaranteed to execute on the cpu.
				1561	*
Lai Jiangshan	f5faa07	2013-02-19 12:17:02 -0800	[diff] [blame]	1562	* This function is to be used by unbound workers and rescuers to bind
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1563	* themselves to the target cpu and may race with cpu going down or
				1564	* coming online. kthread_bind() can't be used because it may put the
				1565	* worker to already dead cpu and set_cpus_allowed_ptr() can't be used
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1566	* verbatim as it's best effort and blocking and pool may be
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1567	* [dis]associated in the meantime.
				1568	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1569	* This function tries set_cpus_allowed() and locks pool and verifies the
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1570	* binding against %POOL_DISASSOCIATED which is set during
Tejun Heo	f2d5a0e	2012-07-17 12:39:26 -0700	[diff] [blame]	1571	* %CPU_DOWN_PREPARE and cleared during %CPU_ONLINE, so if the worker
				1572	* enters idle state or fetches works without dropping lock, it can
				1573	* guarantee the scheduling requirement described in the first paragraph.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1574	*
				1575	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1576	* Might sleep. Called without any lock but returns with pool->lock
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1577	* held.
				1578	*
				1579	* RETURNS:
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1580	* %true if the associated pool is online (@worker is successfully
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1581	* bound), %false if offline.
				1582	*/
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1583	static bool worker_maybe_bind_and_lock(struct worker_pool *pool)
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1584	__acquires(&pool->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1585	{
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1586	while (true) {
				1587	/*
				1588	* The following call may fail, succeed or succeed
				1589	* without actually migrating the task to the cpu if
				1590	* it races with cpu hotunplug operation. Verify
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1591	* against POOL_DISASSOCIATED.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1592	*/
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1593	if (!(pool->flags & POOL_DISASSOCIATED))
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1594	set_cpus_allowed_ptr(current, pool->attrs->cpumask);
Oleg Nesterov	85f4186	2007-05-09 02:34:20 -0700	[diff] [blame]	1595
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1596	spin_lock_irq(&pool->lock);
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	1597	if (pool->flags & POOL_DISASSOCIATED)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1598	return false;
Lai Jiangshan	f5faa07	2013-02-19 12:17:02 -0800	[diff] [blame]	1599	if (task_cpu(current) == pool->cpu &&
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1600	cpumask_equal(&current->cpus_allowed, pool->attrs->cpumask))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1601	return true;
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1602	spin_unlock_irq(&pool->lock);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1603
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1604	/*
				1605	* We've raced with CPU hot[un]plug. Give it a breather
				1606	* and retry migration. cond_resched() is required here;
				1607	* otherwise, we might deadlock against cpu_stop trying to
				1608	* bring down the CPU on non-preemptive kernel.
				1609	*/
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1610	cpu_relax();
Tejun Heo	5035b20	2011-04-29 18:08:37 +0200	[diff] [blame]	1611	cond_resched();
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1612	}
				1613	}
				1614
				1615	/*
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1616	* Rebind an idle @worker to its CPU. worker_thread() will test
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	1617	* list_empty(@worker->entry) before leaving idle and call this function.
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1618	*/
				1619	static void idle_worker_rebind(struct worker *worker)
				1620	{
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	1621	/* CPU may go down again inbetween, clear UNBOUND only on success */
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1622	if (worker_maybe_bind_and_lock(worker->pool))
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	1623	worker_clr_flags(worker, WORKER_UNBOUND);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1624
Lai Jiangshan	ea1abd6	2012-09-18 09:59:22 -0700	[diff] [blame]	1625	/* rebind complete, become available again */
				1626	list_add(&worker->entry, &worker->pool->idle_list);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1627	spin_unlock_irq(&worker->pool->lock);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1628	}
				1629
				1630	/*
				1631	* Function for @worker->rebind.work used to rebind unbound busy workers to
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	1632	* the associated cpu which is coming back online. This is scheduled by
				1633	* cpu up but can race with other cpu hotplug operations and may be
				1634	* executed twice without intervening cpu down.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1635	*/
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1636	static void busy_worker_rebind_fn(struct work_struct *work)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1637	{
				1638	struct worker *worker = container_of(work, struct worker, rebind_work);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1639
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	1640	if (worker_maybe_bind_and_lock(worker->pool))
Lai Jiangshan	eab6d82	2012-09-18 09:59:22 -0700	[diff] [blame]	1641	worker_clr_flags(worker, WORKER_UNBOUND);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1642
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1643	spin_unlock_irq(&worker->pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1644	}
				1645
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1646	static struct worker *alloc_worker(void)
				1647	{
				1648	struct worker *worker;
				1649
				1650	worker = kzalloc(sizeof(*worker), GFP_KERNEL);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1651	if (worker) {
				1652	INIT_LIST_HEAD(&worker->entry);
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	1653	INIT_LIST_HEAD(&worker->scheduled);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	1654	INIT_WORK(&worker->rebind_work, busy_worker_rebind_fn);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1655	/* on creation a worker is in !idle && prep state */
				1656	worker->flags = WORKER_PREP;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1657	}
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1658	return worker;
				1659	}
				1660
				1661	/**
				1662	* create_worker - create a new workqueue worker
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1663	* @pool: pool the new worker will belong to
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1664	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1665	* Create a new worker which is bound to @pool. The returned worker
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1666	* can be started by calling start_worker() or destroyed using
				1667	* destroy_worker().
				1668	*
				1669	* CONTEXT:
				1670	* Might sleep. Does GFP_KERNEL allocations.
				1671	*
				1672	* RETURNS:
				1673	* Pointer to the newly created worker.
				1674	*/
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1675	static struct worker create_worker(struct worker_pool pool)
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1676	{
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1677	const char *pri = pool->attrs->nice < 0 ? "H" : "";
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1678	struct worker *worker = NULL;
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1679	int id = -1;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1680
Tejun Heo	cd54968	2013-03-13 19:47:39 -0700	[diff] [blame]	1681	lockdep_assert_held(&pool->manager_mutex);
				1682
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	1683	/*
				1684	* ID is needed to determine kthread name. Allocate ID first
				1685	* without installing the pointer.
				1686	*/
				1687	idr_preload(GFP_KERNEL);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1688	spin_lock_irq(&pool->lock);
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	1689
				1690	id = idr_alloc(&pool->worker_idr, NULL, 0, 0, GFP_NOWAIT);
				1691
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1692	spin_unlock_irq(&pool->lock);
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	1693	idr_preload_end();
				1694	if (id < 0)
				1695	goto fail;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1696
				1697	worker = alloc_worker();
				1698	if (!worker)
				1699	goto fail;
				1700
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1701	worker->pool = pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1702	worker->id = id;
				1703
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	1704	if (pool->cpu >= 0)
Eric Dumazet	94dcf29	2011-03-22 16:30:45 -0700	[diff] [blame]	1705	worker->task = kthread_create_on_node(worker_thread,
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	1706	worker, cpu_to_node(pool->cpu),
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	1707	"kworker/%d:%d%s", pool->cpu, id, pri);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	1708	else
				1709	worker->task = kthread_create(worker_thread, worker,
Tejun Heo	ac6104c	2013-03-12 11:30:03 -0700	[diff] [blame]	1710	"kworker/u%d:%d%s",
				1711	pool->id, id, pri);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1712	if (IS_ERR(worker->task))
				1713	goto fail;
				1714
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1715	/*
				1716	* set_cpus_allowed_ptr() will fail if the cpumask doesn't have any
				1717	* online CPUs. It'll be re-applied when any of the CPUs come up.
				1718	*/
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1719	set_user_nice(worker->task, pool->attrs->nice);
				1720	set_cpus_allowed_ptr(worker->task, pool->attrs->cpumask);
Tejun Heo	3270476	2012-07-13 22:16:45 -0700	[diff] [blame]	1721
Tejun Heo	14a40ff	2013-03-19 13:45:20 -0700	[diff] [blame]	1722	/* prevent userland from meddling with cpumask of workqueue workers */
				1723	worker->task->flags \|= PF_NO_SETAFFINITY;
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	1724
				1725	/*
				1726	* The caller is responsible for ensuring %POOL_DISASSOCIATED
				1727	* remains stable across this function. See the comments above the
				1728	* flag definition for details.
				1729	*/
				1730	if (pool->flags & POOL_DISASSOCIATED)
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1731	worker->flags \|= WORKER_UNBOUND;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	1732
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	1733	/* successful, commit the pointer to idr */
				1734	spin_lock_irq(&pool->lock);
				1735	idr_replace(&pool->worker_idr, worker, worker->id);
				1736	spin_unlock_irq(&pool->lock);
				1737
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1738	return worker;
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	1739
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1740	fail:
				1741	if (id >= 0) {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1742	spin_lock_irq(&pool->lock);
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	1743	idr_remove(&pool->worker_idr, id);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1744	spin_unlock_irq(&pool->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1745	}
				1746	kfree(worker);
				1747	return NULL;
				1748	}
				1749
				1750	/**
				1751	* start_worker - start a newly created worker
				1752	* @worker: worker to start
				1753	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1754	* Make the pool aware of @worker and start it.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1755	*
				1756	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1757	* spin_lock_irq(pool->lock).
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1758	*/
				1759	static void start_worker(struct worker *worker)
				1760	{
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1761	worker->flags \|= WORKER_STARTED;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1762	worker->pool->nr_workers++;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1763	worker_enter_idle(worker);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1764	wake_up_process(worker->task);
				1765	}
				1766
				1767	/**
Tejun Heo	ebf44d1	2013-03-13 19:47:39 -0700	[diff] [blame]	1768	* create_and_start_worker - create and start a worker for a pool
				1769	* @pool: the target pool
				1770	*
Tejun Heo	cd54968	2013-03-13 19:47:39 -0700	[diff] [blame]	1771	* Grab the managership of @pool and create and start a new worker for it.
Tejun Heo	ebf44d1	2013-03-13 19:47:39 -0700	[diff] [blame]	1772	*/
				1773	static int create_and_start_worker(struct worker_pool *pool)
				1774	{
				1775	struct worker *worker;
				1776
Tejun Heo	cd54968	2013-03-13 19:47:39 -0700	[diff] [blame]	1777	mutex_lock(&pool->manager_mutex);
				1778
Tejun Heo	ebf44d1	2013-03-13 19:47:39 -0700	[diff] [blame]	1779	worker = create_worker(pool);
				1780	if (worker) {
				1781	spin_lock_irq(&pool->lock);
				1782	start_worker(worker);
				1783	spin_unlock_irq(&pool->lock);
				1784	}
				1785
Tejun Heo	cd54968	2013-03-13 19:47:39 -0700	[diff] [blame]	1786	mutex_unlock(&pool->manager_mutex);
				1787
Tejun Heo	ebf44d1	2013-03-13 19:47:39 -0700	[diff] [blame]	1788	return worker ? 0 : -ENOMEM;
				1789	}
				1790
				1791	/**
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1792	* destroy_worker - destroy a workqueue worker
				1793	* @worker: worker to be destroyed
				1794	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1795	* Destroy @worker and adjust @pool stats accordingly.
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1796	*
				1797	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1798	* spin_lock_irq(pool->lock) which is released and regrabbed.
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1799	*/
				1800	static void destroy_worker(struct worker *worker)
				1801	{
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1802	struct worker_pool *pool = worker->pool;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1803
Tejun Heo	cd54968	2013-03-13 19:47:39 -0700	[diff] [blame]	1804	lockdep_assert_held(&pool->manager_mutex);
				1805	lockdep_assert_held(&pool->lock);
				1806
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1807	/* sanity check frenzy */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1808	if (WARN_ON(worker->current_work) \|\|
				1809	WARN_ON(!list_empty(&worker->scheduled)))
				1810	return;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1811
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1812	if (worker->flags & WORKER_STARTED)
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1813	pool->nr_workers--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1814	if (worker->flags & WORKER_IDLE)
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	1815	pool->nr_idle--;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1816
				1817	list_del_init(&worker->entry);
Tejun Heo	cb44476	2010-07-02 10:03:50 +0200	[diff] [blame]	1818	worker->flags \|= WORKER_DIE;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1819
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	1820	idr_remove(&pool->worker_idr, worker->id);
				1821
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1822	spin_unlock_irq(&pool->lock);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	1823
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1824	kthread_stop(worker->task);
				1825	kfree(worker);
				1826
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1827	spin_lock_irq(&pool->lock);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	1828	}
				1829
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1830	static void idle_worker_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1831	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1832	struct worker_pool pool = (void )__pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1833
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1834	spin_lock_irq(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1835
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1836	if (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1837	struct worker *worker;
				1838	unsigned long expires;
				1839
				1840	/* idle_list is kept in LIFO order, check the last one */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1841	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1842	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1843
				1844	if (time_before(jiffies, expires))
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1845	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1846	else {
				1847	/* it's been idle for too long, wake up manager */
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	1848	pool->flags \|= POOL_MANAGE_WORKERS;
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1849	wake_up_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1850	}
				1851	}
				1852
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1853	spin_unlock_irq(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1854	}
				1855
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1856	static void send_mayday(struct work_struct *work)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1857	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	1858	struct pool_workqueue *pwq = get_work_pwq(work);
				1859	struct workqueue_struct *wq = pwq->wq;
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1860
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	1861	lockdep_assert_held(&wq_mayday_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1862
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	1863	if (!wq->rescuer)
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1864	return;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1865
				1866	/* mayday mayday mayday */
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1867	if (list_empty(&pwq->mayday_node)) {
				1868	list_add_tail(&pwq->mayday_node, &wq->maydays);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1869	wake_up_process(wq->rescuer->task);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1870	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1871	}
				1872
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	1873	static void pool_mayday_timeout(unsigned long __pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1874	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1875	struct worker_pool pool = (void )__pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1876	struct work_struct *work;
				1877
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	1878	spin_lock_irq(&wq_mayday_lock); /* for wq->maydays */
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1879	spin_lock(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1880
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1881	if (need_to_create_worker(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1882	/*
				1883	* We've been trying to create a new worker but
				1884	* haven't been successful. We might be hitting an
				1885	* allocation deadlock. Send distress signals to
				1886	* rescuers.
				1887	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1888	list_for_each_entry(work, &pool->worklist, entry)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1889	send_mayday(work);
				1890	}
				1891
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	1892	spin_unlock(&pool->lock);
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	1893	spin_unlock_irq(&wq_mayday_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1894
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1895	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INTERVAL);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1896	}
				1897
				1898	/**
				1899	* maybe_create_worker - create a new worker if necessary
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1900	* @pool: pool to create a new worker for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1901	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1902	* Create a new worker for @pool if necessary. @pool is guaranteed to
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1903	* have at least one idle worker on return from this function. If
				1904	* creating a new worker takes longer than MAYDAY_INTERVAL, mayday is
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1905	* sent to all rescuers with works scheduled on @pool to resolve
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1906	* possible allocation deadlock.
				1907	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1908	* On return, need_to_create_worker() is guaranteed to be %false and
				1909	* may_start_working() %true.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1910	*
				1911	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1912	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1913	* multiple times. Does GFP_KERNEL allocations. Called only from
				1914	* manager.
				1915	*
				1916	* RETURNS:
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1917	* %false if no action was taken and pool->lock stayed locked, %true
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1918	* otherwise.
				1919	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1920	static bool maybe_create_worker(struct worker_pool *pool)
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1921	__releases(&pool->lock)
				1922	__acquires(&pool->lock)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1923	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1924	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1925	return false;
				1926	restart:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1927	spin_unlock_irq(&pool->lock);
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1928
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1929	/* if we don't make progress in MAYDAY_INITIAL_TIMEOUT, call for help */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1930	mod_timer(&pool->mayday_timer, jiffies + MAYDAY_INITIAL_TIMEOUT);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1931
				1932	while (true) {
				1933	struct worker *worker;
				1934
Tejun Heo	bc2ae0f	2012-07-17 12:39:27 -0700	[diff] [blame]	1935	worker = create_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1936	if (worker) {
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1937	del_timer_sync(&pool->mayday_timer);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1938	spin_lock_irq(&pool->lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1939	start_worker(worker);
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	1940	if (WARN_ON_ONCE(need_to_create_worker(pool)))
				1941	goto restart;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1942	return true;
				1943	}
				1944
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1945	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1946	break;
				1947
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1948	__set_current_state(TASK_INTERRUPTIBLE);
				1949	schedule_timeout(CREATE_COOLDOWN);
Tejun Heo	9f9c236	2010-07-14 11:31:20 +0200	[diff] [blame]	1950
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1951	if (!need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1952	break;
				1953	}
				1954
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1955	del_timer_sync(&pool->mayday_timer);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1956	spin_lock_irq(&pool->lock);
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1957	if (need_to_create_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1958	goto restart;
				1959	return true;
				1960	}
				1961
				1962	/**
				1963	* maybe_destroy_worker - destroy workers which have been idle for a while
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1964	* @pool: pool to destroy workers for
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1965	*
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1966	* Destroy @pool workers which have been idle for longer than
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1967	* IDLE_WORKER_TIMEOUT.
				1968	*
				1969	* LOCKING:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	1970	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1971	* multiple times. Called only from manager.
				1972	*
				1973	* RETURNS:
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	1974	* %false if no action was taken and pool->lock stayed locked, %true
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1975	* otherwise.
				1976	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1977	static bool maybe_destroy_workers(struct worker_pool *pool)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1978	{
				1979	bool ret = false;
				1980
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1981	while (too_many_workers(pool)) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1982	struct worker *worker;
				1983	unsigned long expires;
				1984
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1985	worker = list_entry(pool->idle_list.prev, struct worker, entry);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1986	expires = worker->last_active + IDLE_WORKER_TIMEOUT;
				1987
				1988	if (time_before(jiffies, expires)) {
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	1989	mod_timer(&pool->idle_timer, expires);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	1990	break;
				1991	}
				1992
				1993	destroy_worker(worker);
				1994	ret = true;
				1995	}
				1996
				1997	return ret;
				1998	}
				1999
				2000	/**
				2001	* manage_workers - manage worker pool
				2002	* @worker: self
				2003	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2004	* Assume the manager role and manage the worker pool @worker belongs
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2005	* to. At any given time, there can be only zero or one manager per
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2006	* pool. The exclusion is handled automatically by this function.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2007	*
				2008	* The caller can safely start processing works on false return. On
				2009	* true return, it's guaranteed that need_to_create_worker() is false
				2010	* and may_start_working() is true.
				2011	*
				2012	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2013	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2014	* multiple times. Does GFP_KERNEL allocations.
				2015	*
				2016	* RETURNS:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2017	* spin_lock_irq(pool->lock) which may be released and regrabbed
				2018	* multiple times. Does GFP_KERNEL allocations.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2019	*/
				2020	static bool manage_workers(struct worker *worker)
				2021	{
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2022	struct worker_pool *pool = worker->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2023	bool ret = false;
				2024
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	2025	/*
				2026	* Managership is governed by two mutexes - manager_arb and
				2027	* manager_mutex. manager_arb handles arbitration of manager role.
				2028	* Anyone who successfully grabs manager_arb wins the arbitration
				2029	* and becomes the manager. mutex_trylock() on pool->manager_arb
				2030	* failure while holding pool->lock reliably indicates that someone
				2031	* else is managing the pool and the worker which failed trylock
				2032	* can proceed to executing work items. This means that anyone
				2033	* grabbing manager_arb is responsible for actually performing
				2034	* manager duties. If manager_arb is grabbed and released without
				2035	* actual management, the pool may stall indefinitely.
				2036	*
				2037	* manager_mutex is used for exclusion of actual management
				2038	* operations. The holder of manager_mutex can be sure that none
				2039	* of the management operations, including creation and destruction
				2040	* of workers, will take place until the mutex is released. Because
				2041	* manager_mutex doesn't interfere with manager role arbitration,
				2042	* it is guaranteed that the pool's management, while it may be
				2043	* delayed, won't be disturbed by someone else grabbing
				2044	* manager_mutex.
				2045	*/
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	2046	if (!mutex_trylock(&pool->manager_arb))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2047	return ret;
				2048
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2049	/*
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	2050	* With manager arbitration won, manager_mutex would be free in
				2051	* most cases. trylock first without dropping @pool->lock.
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2052	*/
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	2053	if (unlikely(!mutex_trylock(&pool->manager_mutex))) {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2054	spin_unlock_irq(&pool->lock);
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	2055	mutex_lock(&pool->manager_mutex);
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2056	/*
				2057	* CPU hotplug could have happened while we were waiting
Lai Jiangshan	b2eb83d	2012-09-18 09:59:23 -0700	[diff] [blame]	2058	* for manager_mutex. Hotplug itself can't handle us
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2059	* because manager isn't either on idle or busy list, and
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2060	* @pool's state and ours could have deviated.
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2061	*
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	2062	* As hotplug is now excluded via manager_mutex, we can
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2063	* simply try to bind. It will succeed or fail depending
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2064	* on @pool's current state. Try it and adjust
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2065	* %WORKER_UNBOUND accordingly.
				2066	*/
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	2067	if (worker_maybe_bind_and_lock(pool))
Lai Jiangshan	ee378aa	2012-09-10 10:03:44 -0700	[diff] [blame]	2068	worker->flags &= ~WORKER_UNBOUND;
				2069	else
				2070	worker->flags |= WORKER_UNBOUND;
				2071
				2072	ret = true;
				2073	}
				2074
Tejun Heo	11ebea5	2012-07-12 14:46:37 -0700	[diff] [blame]	2075	pool->flags &= ~POOL_MANAGE_WORKERS;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2076
				2077	/*
				2078	* Destroy and then create so that may_start_working() is true
				2079	* on return.
				2080	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2081	ret |= maybe_destroy_workers(pool);
				2082	ret |= maybe_create_worker(pool);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2083
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	2084	mutex_unlock(&pool->manager_mutex);
Tejun Heo	34a06bd	2013-03-12 11:30:00 -0700	[diff] [blame]	2085	mutex_unlock(&pool->manager_arb);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2086	return ret;
				2087	}
				2088
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2089	/**
				2090	* process_one_work - process single work
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2091	* @worker: self
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2092	* @work: work to process
				2093	*
				2094	* Process @work. This function contains all the logics necessary to
				2095	* process a single work including synchronization against and
				2096	* interaction with other workers on the same cpu, queueing and
				2097	* flushing. As long as context requirement is met, any worker can
				2098	* call this function to process a work.
				2099	*
				2100	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2101	* spin_lock_irq(pool->lock) which is released and regrabbed.
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2102	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2103	static void process_one_work(struct worker *worker, struct work_struct *work)
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2104	__releases(&pool->lock)
				2105	__acquires(&pool->lock)
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2106	{
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2107	struct pool_workqueue *pwq = get_work_pwq(work);
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2108	struct worker_pool *pool = worker->pool;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2109	bool cpu_intensive = pwq->wq->flags & WQ_CPU_INTENSIVE;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2110	int work_color;
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	2111	struct worker *collision;
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2112	#ifdef CONFIG_LOCKDEP
				2113	/*
				2114	* It is permissible to free the struct work_struct from
				2115	* inside the function that is called from it, this we need to
				2116	* take into account for lockdep too. To avoid bogus "held
				2117	* lock freed" warnings as well as problems when looking into
				2118	* work->lockdep_map, make a copy and use that here.
				2119	*/
Peter Zijlstra	4d82a1d	2012-05-15 08:06:19 -0700	[diff] [blame]	2120	struct lockdep_map lockdep_map;
				2121
				2122	lockdep_copy_map(&lockdep_map, &work->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2123	#endif
Tejun Heo	6fec10a	2012-07-22 10:16:34 -0700	[diff] [blame]	2124	/*
				2125	* Ensure we're on the correct CPU. DISASSOCIATED test is
				2126	* necessary to avoid spurious warnings from rescuers servicing the
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	2127	* unbound or a disassociated pool.
Tejun Heo	6fec10a	2012-07-22 10:16:34 -0700	[diff] [blame]	2128	*/
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2129	WARN_ON_ONCE(!(worker->flags & WORKER_UNBOUND) &&
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	2130	!(pool->flags & POOL_DISASSOCIATED) &&
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	2131	raw_smp_processor_id() != pool->cpu);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2132
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	2133	/*
				2134	* A single work shouldn't be executed concurrently by
				2135	* multiple workers on a single cpu. Check whether anyone is
				2136	* already processing the work. If so, defer the work to the
				2137	* currently executing one.
				2138	*/
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2139	collision = find_worker_executing_work(pool, work);
Tejun Heo	7e11629	2010-06-29 10:07:13 +0200	[diff] [blame]	2140	if (unlikely(collision)) {
				2141	move_linked_works(work, &collision->scheduled, NULL);
				2142	return;
				2143	}
				2144
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2145	/* claim and dequeue */
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2146	debug_work_deactivate(work);
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2147	hash_add(pool->busy_hash, &worker->hentry, (unsigned long)work);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2148	worker->current_work = work;
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2149	worker->current_func = work->func;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2150	worker->current_pwq = pwq;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2151	work_color = get_work_color(work);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2152
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2153	list_del_init(&work->entry);
				2154
Tejun Heo	649027d	2010-06-29 10:07:14 +0200	[diff] [blame]	2155	/*
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	2156	* CPU intensive works don't participate in concurrency
				2157	* management. They're the scheduler's responsibility.
				2158	*/
				2159	if (unlikely(cpu_intensive))
				2160	worker_set_flags(worker, WORKER_CPU_INTENSIVE, true);
				2161
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	2162	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2163	* Unbound pool isn't concurrency managed and work items should be
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	2164	* executed ASAP. Wake up another worker if necessary.
				2165	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2166	if ((worker->flags & WORKER_UNBOUND) && need_more_worker(pool))
				2167	wake_up_worker(pool);
Tejun Heo	974271c	2012-07-12 14:46:37 -0700	[diff] [blame]	2168
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2169	/*
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	2170	* Record the last pool and clear PENDING which should be the last
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2171	* update to @work. Also, do this inside @pool->lock so that
Tejun Heo	23657bb	2012-08-13 17:08:19 -0700	[diff] [blame]	2172	* PENDING and queued state changes happen together while IRQ is
				2173	* disabled.
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2174	*/
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	2175	set_work_pool_and_clear_pending(work, pool->id);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2176
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2177	spin_unlock_irq(&pool->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2178
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2179	lock_map_acquire_read(&pwq->wq->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2180	lock_map_acquire(&lockdep_map);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	2181	trace_workqueue_execute_start(work);
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2182	worker->current_func(work);
Arjan van de Ven	e36c886	2010-08-21 13:07:26 -0700	[diff] [blame]	2183	/*
				2184	* While we must be careful to not use "work" after this, the trace
				2185	* point will only record its address.
				2186	*/
				2187	trace_workqueue_execute_end(work);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2188	lock_map_release(&lockdep_map);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2189	lock_map_release(&pwq->wq->lockdep_map);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2190
				2191	if (unlikely(in_atomic() || lockdep_depth(current) > 0)) {
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	2192	pr_err("BUG: workqueue leaked lock or atomic: %s/0x%08x/%d\n"
				2193	" last function: %pf\n",
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2194	current->comm, preempt_count(), task_pid_nr(current),
				2195	worker->current_func);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2196	debug_show_held_locks(current);
				2197	dump_stack();
				2198	}
				2199
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2200	spin_lock_irq(&pool->lock);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2201
Tejun Heo	fb0e7be	2010-06-29 10:07:15 +0200	[diff] [blame]	2202	/* clear cpu intensive status */
				2203	if (unlikely(cpu_intensive))
				2204	worker_clr_flags(worker, WORKER_CPU_INTENSIVE);
				2205
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2206	/* we're done with it, release */
Sasha Levin	42f8570	2012-12-17 10:01:23 -0500	[diff] [blame]	2207	hash_del(&worker->hentry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2208	worker->current_work = NULL;
Tejun Heo	a2c1c57	2012-12-18 10:35:02 -0800	[diff] [blame]	2209	worker->current_func = NULL;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2210	worker->current_pwq = NULL;
				2211	pwq_dec_nr_in_flight(pwq, work_color);
Tejun Heo	a62428c	2010-06-29 10:07:10 +0200	[diff] [blame]	2212	}
				2213
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2214	/**
				2215	* process_scheduled_works - process scheduled works
				2216	* @worker: self
				2217	*
				2218	* Process all scheduled works. Please note that the scheduled list
				2219	* may change while processing a work, so this function repeatedly
				2220	* fetches a work from the top and executes it.
				2221	*
				2222	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2223	* spin_lock_irq(pool->lock) which may be released and regrabbed
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2224	* multiple times.
				2225	*/
				2226	static void process_scheduled_works(struct worker *worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2227	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2228	while (!list_empty(&worker->scheduled)) {
				2229	struct work_struct *work = list_first_entry(&worker->scheduled,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2230	struct work_struct, entry);
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2231	process_one_work(worker, work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2232	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2233	}
				2234
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2235	/**
				2236	* worker_thread - the worker thread function
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2237	* @__worker: self
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2238	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	2239	* The worker thread function. All workers belong to a worker_pool -
				2240	* either a per-cpu one or dynamic unbound one. These workers process all
				2241	* work items regardless of their specific target workqueue. The only
				2242	* exception is work items which belong to workqueues with a rescuer which
				2243	* will be explained in rescuer_thread().
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2244	*/
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2245	static int worker_thread(void *__worker)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2246	{
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	2247	struct worker *worker = __worker;
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2248	struct worker_pool *pool = worker->pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2249
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2250	/* tell the scheduler that this is a workqueue worker */
				2251	worker->task->flags |= PF_WQ_WORKER;
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2252	woke_up:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2253	spin_lock_irq(&pool->lock);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2254
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2255	/* we are off idle list if destruction or rebind is requested */
				2256	if (unlikely(list_empty(&worker->entry))) {
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2257	spin_unlock_irq(&pool->lock);
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2258
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2259	/* if DIE is set, destruction is requested */
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2260	if (worker->flags & WORKER_DIE) {
				2261	worker->task->flags &= ~PF_WQ_WORKER;
				2262	return 0;
				2263	}
				2264
Lai Jiangshan	5f7dabf	2012-09-18 09:59:23 -0700	[diff] [blame]	2265	/* otherwise, rebind */
Tejun Heo	25511a4	2012-07-17 12:39:27 -0700	[diff] [blame]	2266	idle_worker_rebind(worker);
				2267	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2268	}
				2269
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2270	worker_leave_idle(worker);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	2271	recheck:
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2272	/* no more worker necessary? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2273	if (!need_more_worker(pool))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2274	goto sleep;
				2275
				2276	/* do we need to manage? */
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2277	if (unlikely(!may_start_working(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2278	goto recheck;
				2279
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2280	/*
				2281	* ->scheduled list can only be filled while a worker is
				2282	* preparing to process a work or actually processing it.
				2283	* Make sure nobody diddled with it while I was sleeping.
				2284	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2285	WARN_ON_ONCE(!list_empty(&worker->scheduled));
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2286
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2287	/*
				2288	* When control reaches this point, we're guaranteed to have
				2289	* at least one idle worker or that someone else has already
				2290	* assumed the manager role.
				2291	*/
				2292	worker_clr_flags(worker, WORKER_PREP);
				2293
				2294	do {
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2295	struct work_struct *work =
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2296	list_first_entry(&pool->worklist,
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2297	struct work_struct, entry);
				2298
				2299	if (likely(!(*work_data_bits(work) & WORK_STRUCT_LINKED))) {
				2300	/* optimization path, not strictly necessary */
				2301	process_one_work(worker, work);
				2302	if (unlikely(!list_empty(&worker->scheduled)))
				2303	process_scheduled_works(worker);
				2304	} else {
				2305	move_linked_works(work, &worker->scheduled, NULL);
				2306	process_scheduled_works(worker);
				2307	}
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2308	} while (keep_working(pool));
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2309
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2310	worker_set_flags(worker, WORKER_PREP, false);
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2311	sleep:
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2312	if (unlikely(need_to_manage_workers(pool)) && manage_workers(worker))
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2313	goto recheck;
Tejun Heo	d313dd8	2010-07-02 10:03:51 +0200	[diff] [blame]	2314
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2315	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2316	* pool->lock is held and there's no work to process and no need to
				2317	* manage, sleep. Workers are woken up only while holding
				2318	* pool->lock or from local cpu, so setting the current state
				2319	* before releasing pool->lock is enough to prevent losing any
				2320	* event.
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2321	*/
				2322	worker_enter_idle(worker);
				2323	__set_current_state(TASK_INTERRUPTIBLE);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2324	spin_unlock_irq(&pool->lock);
Tejun Heo	c8e55f3	2010-06-29 10:07:12 +0200	[diff] [blame]	2325	schedule();
				2326	goto woke_up;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2327	}
				2328
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2329	/**
				2330	* rescuer_thread - the rescuer thread function
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2331	* @__rescuer: self
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2332	*
				2333	* Workqueue rescuer thread function. There's one rescuer for each
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	2334	* workqueue which has WQ_MEM_RECLAIM set.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2335	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2336	* Regular work processing on a pool may block trying to create a new
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2337	* worker which uses GFP_KERNEL allocation which has slight chance of
				2338	* developing into deadlock if some works currently on the same queue
				2339	* need to be processed to satisfy the GFP_KERNEL allocation. This is
				2340	* the problem rescuer solves.
				2341	*
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	2342	* When such a condition is possible, the pool summons rescuers of all
				2343	* workqueues which have works queued on the pool and lets them process
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2344	* those works so that forward progress can be guaranteed.
				2345	*
				2346	* This should happen rarely.
				2347	*/
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2348	static int rescuer_thread(void *__rescuer)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2349	{
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2350	struct worker *rescuer = __rescuer;
				2351	struct workqueue_struct *wq = rescuer->rescue_wq;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2352	struct list_head *scheduled = &rescuer->scheduled;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2353
				2354	set_user_nice(current, RESCUER_NICE_LEVEL);
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2355
				2356	/*
				2357	* Mark rescuer as worker too. As WORKER_PREP is never cleared, it
				2358	* doesn't participate in concurrency management.
				2359	*/
				2360	rescuer->task->flags |= PF_WQ_WORKER;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2361	repeat:
				2362	set_current_state(TASK_INTERRUPTIBLE);
				2363
Mike Galbraith	412d32e	2012-11-28 07:17:18 +0100	[diff] [blame]	2364	if (kthread_should_stop()) {
				2365	__set_current_state(TASK_RUNNING);
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2366	rescuer->task->flags &= ~PF_WQ_WORKER;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2367	return 0;
Mike Galbraith	412d32e	2012-11-28 07:17:18 +0100	[diff] [blame]	2368	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2369
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2370	/* see whether any pwq is asking for help */
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	2371	spin_lock_irq(&wq_mayday_lock);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2372
				2373	while (!list_empty(&wq->maydays)) {
				2374	struct pool_workqueue *pwq = list_first_entry(&wq->maydays,
				2375	struct pool_workqueue, mayday_node);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2376	struct worker_pool *pool = pwq->pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2377	struct work_struct *work, *n;
				2378
				2379	__set_current_state(TASK_RUNNING);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2380	list_del_init(&pwq->mayday_node);
				2381
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	2382	spin_unlock_irq(&wq_mayday_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2383
				2384	/* migrate to the target cpu if possible */
Lai Jiangshan	f36dc67	2013-02-19 12:17:02 -0800	[diff] [blame]	2385	worker_maybe_bind_and_lock(pool);
Lai Jiangshan	b310410	2013-02-19 12:17:02 -0800	[diff] [blame]	2386	rescuer->pool = pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2387
				2388	/*
				2389	* Slurp in all works issued via this workqueue and
				2390	* process'em.
				2391	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2392	WARN_ON_ONCE(!list_empty(&rescuer->scheduled));
Tejun Heo	bd7bdd4	2012-07-12 14:46:37 -0700	[diff] [blame]	2393	list_for_each_entry_safe(work, n, &pool->worklist, entry)
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2394	if (get_work_pwq(work) == pwq)
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2395	move_linked_works(work, scheduled, &n);
				2396
				2397	process_scheduled_works(rescuer);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2398
				2399	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2400	* Leave this pool. If keep_working() is %true, notify a
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2401	* regular worker; otherwise, we end up with 0 concurrency
				2402	* and stalling the execution.
				2403	*/
Tejun Heo	63d95a9	2012-07-12 14:46:37 -0700	[diff] [blame]	2404	if (keep_working(pool))
				2405	wake_up_worker(pool);
Tejun Heo	7576958	2011-02-14 14:04:46 +0100	[diff] [blame]	2406
Lai Jiangshan	b310410	2013-02-19 12:17:02 -0800	[diff] [blame]	2407	rescuer->pool = NULL;
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2408	spin_unlock(&pool->lock);
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	2409	spin_lock(&wq_mayday_lock);
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2410	}
				2411
Tejun Heo	2e109a2	2013-03-13 19:47:40 -0700	[diff] [blame]	2412	spin_unlock_irq(&wq_mayday_lock);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	2413
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	2414	/* rescuers should never participate in concurrency management */
				2415	WARN_ON_ONCE(!(rescuer->flags & WORKER_NOT_RUNNING));
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	2416	schedule();
				2417	goto repeat;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2418	}
				2419
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2420	struct wq_barrier {
				2421	struct work_struct work;
				2422	struct completion done;
				2423	};
				2424
				2425	static void wq_barrier_func(struct work_struct *work)
				2426	{
				2427	struct wq_barrier *barr = container_of(work, struct wq_barrier, work);
				2428	complete(&barr->done);
				2429	}
				2430
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2431	/**
				2432	* insert_wq_barrier - insert a barrier work
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2433	* @pwq: pwq to insert barrier into
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2434	* @barr: wq_barrier to insert
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2435	* @target: target work to attach @barr to
				2436	* @worker: worker currently executing @target, NULL if @target is not executing
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2437	*
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2438	* @barr is linked to @target such that @barr is completed only after
				2439	* @target finishes execution. Please note that the ordering
				2440	* guarantee is observed only with respect to @target and on the local
				2441	* cpu.
				2442	*
				2443	* Currently, a queued barrier can't be canceled. This is because
				2444	* try_to_grab_pending() can't determine whether the work to be
				2445	* grabbed is at the head of the queue and thus can't clear LINKED
				2446	* flag of the previous work while there must be a valid next work
				2447	* after a work with LINKED flag set.
				2448	*
				2449	* Note that when @worker is non-NULL, @target may be modified
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2450	* underneath us, so we can't reliably determine pwq from @target.
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2451	*
				2452	* CONTEXT:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2453	* spin_lock_irq(pool->lock).
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	2454	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2455	static void insert_wq_barrier(struct pool_workqueue *pwq,
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2456	struct wq_barrier *barr,
				2457	struct work_struct *target, struct worker *worker)
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2458	{
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2459	struct list_head *head;
				2460	unsigned int linked = 0;
				2461
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2462	/*
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2463	* debugobject calls are safe here even with pool->lock locked
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2464	* as we know for sure that this will not trigger any of the
				2465	* checks and call back into the fixup functions where we
				2466	* might deadlock.
				2467	*/
Andrew Morton	ca1cab3	2010-10-26 14:22:34 -0700	[diff] [blame]	2468	INIT_WORK_ONSTACK(&barr->work, wq_barrier_func);
Tejun Heo	22df02b	2010-06-29 10:07:10 +0200	[diff] [blame]	2469	__set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(&barr->work));
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2470	init_completion(&barr->done);
Oleg Nesterov	83c2252	2007-05-09 02:33:54 -0700	[diff] [blame]	2471
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2472	/*
				2473	* If @target is currently being executed, schedule the
				2474	* barrier to the worker; otherwise, put it after @target.
				2475	*/
				2476	if (worker)
				2477	head = worker->scheduled.next;
				2478	else {
				2479	unsigned long *bits = work_data_bits(target);
				2480
				2481	head = target->entry.next;
				2482	/* there can already be other linked works, inherit and set */
				2483	linked = *bits & WORK_STRUCT_LINKED;
				2484	__set_bit(WORK_STRUCT_LINKED_BIT, bits);
				2485	}
				2486
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2487	debug_work_activate(&barr->work);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2488	insert_work(pwq, &barr->work, head,
Tejun Heo	affee4b	2010-06-29 10:07:12 +0200	[diff] [blame]	2489	work_color_to_flags(WORK_NO_COLOR) | linked);
Oleg Nesterov	fc2e4d7	2007-05-09 02:33:51 -0700	[diff] [blame]	2490	}
				2491
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2492	/**
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2493	* flush_workqueue_prep_pwqs - prepare pwqs for workqueue flushing
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2494	* @wq: workqueue being flushed
				2495	* @flush_color: new flush color, < 0 for no-op
				2496	* @work_color: new work color, < 0 for no-op
				2497	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2498	* Prepare pwqs for workqueue flushing.
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2499	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2500	* If @flush_color is non-negative, flush_color on all pwqs should be
				2501	* -1. If no pwq has in-flight commands at the specified color, all
				2502	* pwq->flush_color's stay at -1 and %false is returned. If any pwq
				2503	* has in flight commands, its pwq->flush_color is set to
				2504	* @flush_color, @wq->nr_pwqs_to_flush is updated accordingly, pwq
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2505	* wakeup logic is armed and %true is returned.
				2506	*
				2507	* The caller should have initialized @wq->first_flusher prior to
				2508	* calling this function with non-negative @flush_color. If
				2509	* @flush_color is negative, no flush color update is done and %false
				2510	* is returned.
				2511	*
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2512	* If @work_color is non-negative, all pwqs should have the same
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2513	* work_color which is previous to @work_color and all will be
				2514	* advanced to @work_color.
				2515	*
				2516	* CONTEXT:
				2517	* mutex_lock(wq->flush_mutex).
				2518	*
				2519	* RETURNS:
				2520	* %true if @flush_color >= 0 and there's something to flush. %false
				2521	* otherwise.
				2522	*/
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2523	static bool flush_workqueue_prep_pwqs(struct workqueue_struct *wq,
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2524	int flush_color, int work_color)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2525	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2526	bool wait = false;
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2527	struct pool_workqueue *pwq;
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2528
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2529	if (flush_color >= 0) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2530	WARN_ON_ONCE(atomic_read(&wq->nr_pwqs_to_flush));
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2531	atomic_set(&wq->nr_pwqs_to_flush, 1);
Thomas Gleixner	dc186ad	2009-11-16 01:09:48 +0900	[diff] [blame]	2532	}
Oleg Nesterov	1444196	2007-05-23 13:57:57 -0700	[diff] [blame]	2533
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2534	local_irq_disable();
				2535
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2536	for_each_pwq(pwq, wq) {
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2537	struct worker_pool *pool = pwq->pool;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2538
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2539	spin_lock(&pool->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2540
				2541	if (flush_color >= 0) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2542	WARN_ON_ONCE(pwq->flush_color != -1);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2543
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2544	if (pwq->nr_in_flight[flush_color]) {
				2545	pwq->flush_color = flush_color;
				2546	atomic_inc(&wq->nr_pwqs_to_flush);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2547	wait = true;
				2548	}
				2549	}
				2550
				2551	if (work_color >= 0) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2552	WARN_ON_ONCE(work_color != work_next_color(pwq->work_color));
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2553	pwq->work_color = work_color;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2554	}
				2555
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2556	spin_unlock(&pool->lock);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2557	}
				2558
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2559	local_irq_enable();
				2560
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2561	if (flush_color >= 0 && atomic_dec_and_test(&wq->nr_pwqs_to_flush))
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2562	complete(&wq->first_flusher->done);
				2563
				2564	return wait;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2565	}
				2566
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2567	/**
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2568	* flush_workqueue - ensure that any scheduled work has run to completion.
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2569	* @wq: workqueue to flush
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2570	*
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	2571	* This function sleeps until all work items which were queued on entry
				2572	* have finished execution, but it is not livelocked by new incoming ones.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2573	*/
Harvey Harrison	7ad5b3a	2008-02-08 04:19:53 -0800	[diff] [blame]	2574	void flush_workqueue(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2575	{
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2576	struct wq_flusher this_flusher = {
				2577	.list = LIST_HEAD_INIT(this_flusher.list),
				2578	.flush_color = -1,
				2579	.done = COMPLETION_INITIALIZER_ONSTACK(this_flusher.done),
				2580	};
				2581	int next_color;
Oleg Nesterov	b1f4ec1	2007-05-09 02:34:12 -0700	[diff] [blame]	2582
Ingo Molnar	3295f0e	2008-08-11 10:30:30 +0200	[diff] [blame]	2583	lock_map_acquire(&wq->lockdep_map);
				2584	lock_map_release(&wq->lockdep_map);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2585
				2586	mutex_lock(&wq->flush_mutex);
				2587
				2588	/*
				2589	* Start-to-wait phase
				2590	*/
				2591	next_color = work_next_color(wq->work_color);
				2592
				2593	if (next_color != wq->flush_color) {
				2594	/*
				2595	* Color space is not full. The current work_color
				2596	* becomes our flush_color and work_color is advanced
				2597	* by one.
				2598	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2599	WARN_ON_ONCE(!list_empty(&wq->flusher_overflow));
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2600	this_flusher.flush_color = wq->work_color;
				2601	wq->work_color = next_color;
				2602
				2603	if (!wq->first_flusher) {
				2604	/* no flush in progress, become the first flusher */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2605	WARN_ON_ONCE(wq->flush_color != this_flusher.flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2606
				2607	wq->first_flusher = &this_flusher;
				2608
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2609	if (!flush_workqueue_prep_pwqs(wq, wq->flush_color,
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2610	wq->work_color)) {
				2611	/* nothing to flush, done */
				2612	wq->flush_color = next_color;
				2613	wq->first_flusher = NULL;
				2614	goto out_unlock;
				2615	}
				2616	} else {
				2617	/* wait in queue */
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2618	WARN_ON_ONCE(wq->flush_color == this_flusher.flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2619	list_add_tail(&this_flusher.list, &wq->flusher_queue);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2620	flush_workqueue_prep_pwqs(wq, -1, wq->work_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2621	}
				2622	} else {
				2623	/*
				2624	* Oops, color space is full, wait on overflow queue.
				2625	* The next flush completion will assign us
				2626	* flush_color and transfer to flusher_queue.
				2627	*/
				2628	list_add_tail(&this_flusher.list, &wq->flusher_overflow);
				2629	}
				2630
				2631	mutex_unlock(&wq->flush_mutex);
				2632
				2633	wait_for_completion(&this_flusher.done);
				2634
				2635	/*
				2636	* Wake-up-and-cascade phase
				2637	*
				2638	* First flushers are responsible for cascading flushes and
				2639	* handling overflow. Non-first flushers can simply return.
				2640	*/
				2641	if (wq->first_flusher != &this_flusher)
				2642	return;
				2643
				2644	mutex_lock(&wq->flush_mutex);
				2645
Tejun Heo	4ce48b3	2010-07-02 10:03:51 +0200	[diff] [blame]	2646	/* we might have raced, check again with mutex held */
				2647	if (wq->first_flusher != &this_flusher)
				2648	goto out_unlock;
				2649
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2650	wq->first_flusher = NULL;
				2651
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2652	WARN_ON_ONCE(!list_empty(&this_flusher.list));
				2653	WARN_ON_ONCE(wq->flush_color != this_flusher.flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2654
				2655	while (true) {
				2656	struct wq_flusher next, tmp;
				2657
				2658	/* complete all the flushers sharing the current flush color */
				2659	list_for_each_entry_safe(next, tmp, &wq->flusher_queue, list) {
				2660	if (next->flush_color != wq->flush_color)
				2661	break;
				2662	list_del_init(&next->list);
				2663	complete(&next->done);
				2664	}
				2665
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2666	WARN_ON_ONCE(!list_empty(&wq->flusher_overflow) &&
				2667	wq->flush_color != work_next_color(wq->work_color));
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2668
				2669	/* this flush_color is finished, advance by one */
				2670	wq->flush_color = work_next_color(wq->flush_color);
				2671
				2672	/* one color has been freed, handle overflow queue */
				2673	if (!list_empty(&wq->flusher_overflow)) {
				2674	/*
				2675	* Assign the same color to all overflowed
				2676	* flushers, advance work_color and append to
				2677	* flusher_queue. This is the start-to-wait
				2678	* phase for these overflowed flushers.
				2679	*/
				2680	list_for_each_entry(tmp, &wq->flusher_overflow, list)
				2681	tmp->flush_color = wq->work_color;
				2682
				2683	wq->work_color = work_next_color(wq->work_color);
				2684
				2685	list_splice_tail_init(&wq->flusher_overflow,
				2686	&wq->flusher_queue);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2687	flush_workqueue_prep_pwqs(wq, -1, wq->work_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2688	}
				2689
				2690	if (list_empty(&wq->flusher_queue)) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2691	WARN_ON_ONCE(wq->flush_color != wq->work_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2692	break;
				2693	}
				2694
				2695	/*
				2696	* Need to flush more colors. Make the next flusher
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2697	* the new first flusher and arm pwqs.
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2698	*/
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	2699	WARN_ON_ONCE(wq->flush_color == wq->work_color);
				2700	WARN_ON_ONCE(wq->flush_color != next->flush_color);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2701
				2702	list_del_init(&next->list);
				2703	wq->first_flusher = next;
				2704
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2705	if (flush_workqueue_prep_pwqs(wq, wq->flush_color, -1))
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	2706	break;
				2707
				2708	/*
				2709	* Meh... this color is already done, clear first
				2710	* flusher and repeat cascading.
				2711	*/
				2712	wq->first_flusher = NULL;
				2713	}
				2714
				2715	out_unlock:
				2716	mutex_unlock(&wq->flush_mutex);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2717	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	2718	EXPORT_SYMBOL_GPL(flush_workqueue);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2719
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2720	/**
				2721	* drain_workqueue - drain a workqueue
				2722	* @wq: workqueue to drain
				2723	*
				2724	* Wait until the workqueue becomes empty. While draining is in progress,
				2725	* only chain queueing is allowed. IOW, only currently pending or running
				2726	* work items on @wq can queue further work items on it. @wq is flushed
				2727	* repeatedly until it becomes empty. The number of flushing is detemined
				2728	* by the depth of chaining and should be relatively short. Whine if it
				2729	* takes too long.
				2730	*/
				2731	void drain_workqueue(struct workqueue_struct *wq)
				2732	{
				2733	unsigned int flush_cnt = 0;
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2734	struct pool_workqueue *pwq;
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2735
				2736	/*
				2737	* __queue_work() needs to test whether there are drainers, is much
				2738	* hotter than drain_workqueue() and already looks at @wq->flags.
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	2739	* Use __WQ_DRAINING so that queue doesn't have to check nr_drainers.
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2740	*/
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	2741	mutex_lock(&wq_mutex);
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2742	if (!wq->nr_drainers++)
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	2743	wq->flags \|= __WQ_DRAINING;
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	2744	mutex_unlock(&wq_mutex);
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2745	reflush:
				2746	flush_workqueue(wq);
				2747
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2748	local_irq_disable();
				2749
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	2750	for_each_pwq(pwq, wq) {
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2751	bool drained;
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2752
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2753	spin_lock(&pwq->pool->lock);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2754	drained = !pwq->nr_active && list_empty(&pwq->delayed_works);
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2755	spin_unlock(&pwq->pool->lock);
Thomas Tuttle	fa2563e	2011-09-14 16:22:28 -0700	[diff] [blame]	2756
				2757	if (drained)
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2758	continue;
				2759
				2760	if (++flush_cnt == 10 \|\|
				2761	(flush_cnt % 100 == 0 && flush_cnt <= 1000))
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	2762	pr_warn("workqueue %s: drain_workqueue() isn't complete after %u tries\n",
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	2763	wq->name, flush_cnt);
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	2764
				2765	local_irq_enable();
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2766	goto reflush;
				2767	}
				2768
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	2769	local_irq_enable();
				2770
				2771	mutex_lock(&wq_mutex);
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2772	if (!--wq->nr_drainers)
Tejun Heo	618b01e	2013-03-12 11:30:04 -0700	[diff] [blame]	2773	wq->flags &= ~__WQ_DRAINING;
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	2774	mutex_unlock(&wq_mutex);
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	2775	}
				2776	EXPORT_SYMBOL_GPL(drain_workqueue);
				2777
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2778	static bool start_flush_work(struct work_struct work, struct wq_barrier barr)
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2779	{
				2780	struct worker *worker = NULL;
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2781	struct worker_pool *pool;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2782	struct pool_workqueue *pwq;
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2783
				2784	might_sleep();
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2785
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	2786	local_irq_disable();
				2787	pool = get_work_pool(work);
				2788	if (!pool) {
				2789	local_irq_enable();
				2790	return false;
				2791	}
				2792
				2793	spin_lock(&pool->lock);
Lai Jiangshan	0b3dae6	2013-02-06 18:04:53 -0800	[diff] [blame]	2794	/* see the comment in try_to_grab_pending() with the same code */
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2795	pwq = get_work_pwq(work);
				2796	if (pwq) {
				2797	if (unlikely(pwq->pool != pool))
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2798	goto already_gone;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2799	} else {
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	2800	worker = find_worker_executing_work(pool, work);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2801	if (!worker)
				2802	goto already_gone;
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2803	pwq = worker->current_pwq;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2804	}
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2805
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2806	insert_wq_barrier(pwq, barr, work, worker);
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2807	spin_unlock_irq(&pool->lock);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2808
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2809	/*
				2810	* If @max_active is 1 or rescuer is in use, flushing another work
				2811	* item on the same workqueue may lead to deadlock. Make sure the
				2812	* flusher is not running on the same workqueue by verifying write
				2813	* access.
				2814	*/
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	2815	if (pwq->wq->saved_max_active == 1 \|\| pwq->wq->rescuer)
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2816	lock_map_acquire(&pwq->wq->lockdep_map);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2817	else
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	2818	lock_map_acquire_read(&pwq->wq->lockdep_map);
				2819	lock_map_release(&pwq->wq->lockdep_map);
Tejun Heo	e159489	2011-01-09 23:32:15 +0100	[diff] [blame]	2820
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2821	return true;
				2822	already_gone:
Tejun Heo	d565ed6	2013-01-24 11:01:33 -0800	[diff] [blame]	2823	spin_unlock_irq(&pool->lock);
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2824	return false;
				2825	}
				2826
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2827	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2828	* flush_work - wait for a work to finish executing the last queueing instance
				2829	* @work: the work to flush
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2830	*
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2831	* Wait until @work has finished execution. @work is guaranteed to be idle
				2832	* on return if it hasn't been requeued since flush started.
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2833	*
				2834	* RETURNS:
				2835	* %true if flush_work() waited for the work to finish execution,
				2836	* %false if it was already idle.
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2837	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2838	bool flush_work(struct work_struct *work)
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2839	{
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2840	struct wq_barrier barr;
				2841
Stephen Boyd	0976dfc	2012-04-20 17:28:50 -0700	[diff] [blame]	2842	lock_map_acquire(&work->lockdep_map);
				2843	lock_map_release(&work->lockdep_map);
				2844
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2845	if (start_flush_work(work, &barr)) {
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2846	wait_for_completion(&barr.done);
				2847	destroy_work_on_stack(&barr.work);
				2848	return true;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2849	} else {
Tejun Heo	baf5902	2010-09-16 10:42:16 +0200	[diff] [blame]	2850	return false;
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2851	}
Oleg Nesterov	db70089	2008-07-25 01:47:49 -0700	[diff] [blame]	2852	}
				2853	EXPORT_SYMBOL_GPL(flush_work);
				2854
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	2855	static bool __cancel_work_timer(struct work_struct *work, bool is_dwork)
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2856	{
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	2857	unsigned long flags;
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2858	int ret;
				2859
				2860	do {
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	2861	ret = try_to_grab_pending(work, is_dwork, &flags);
				2862	/*
				2863	* If someone else is canceling, wait for the same event it
				2864	* would be waiting for before retrying.
				2865	*/
				2866	if (unlikely(ret == -ENOENT))
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2867	flush_work(work);
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2868	} while (unlikely(ret < 0));
				2869
Tejun Heo	bbb68df	2012-08-03 10:30:46 -0700	[diff] [blame]	2870	/* tell other tasks trying to grab @work to back off */
				2871	mark_work_canceling(work);
				2872	local_irq_restore(flags);
				2873
Tejun Heo	606a502	2012-08-20 14:51:23 -0700	[diff] [blame]	2874	flush_work(work);
Tejun Heo	7a22ad7	2010-06-29 10:07:13 +0200	[diff] [blame]	2875	clear_work_data(work);
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2876	return ret;
				2877	}
				2878
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2879	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2880	* cancel_work_sync - cancel a work and wait for it to finish
				2881	* @work: the work to cancel
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2882	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2883	* Cancel @work and wait for its execution to finish. This function
				2884	* can be used even if the work re-queues itself or migrates to
				2885	* another workqueue. On return from this function, @work is
				2886	* guaranteed to be not pending or executing on any CPU.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2887	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2888	* cancel_work_sync(&delayed_work->work) must not be used for
				2889	* delayed_work's. Use cancel_delayed_work_sync() instead.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2890	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2891	* The caller must ensure that the workqueue on which @work was last
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2892	* queued can't be destroyed before this function returns.
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2893	*
				2894	* RETURNS:
				2895	* %true if @work was pending, %false otherwise.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2896	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2897	bool cancel_work_sync(struct work_struct *work)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2898	{
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	2899	return __cancel_work_timer(work, false);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2900	}
Oleg Nesterov	28e53bd	2007-05-09 02:34:22 -0700	[diff] [blame]	2901	EXPORT_SYMBOL_GPL(cancel_work_sync);
Oleg Nesterov	b89deed	2007-05-09 02:33:52 -0700	[diff] [blame]	2902
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2903	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2904	* flush_delayed_work - wait for a dwork to finish executing the last queueing
				2905	* @dwork: the delayed work to flush
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2906	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2907	* Delayed timer is cancelled and the pending work is queued for
				2908	* immediate execution. Like flush_work(), this function only
				2909	* considers the last queueing instance of @dwork.
Oleg Nesterov	1f1f642	2007-07-15 23:41:44 -0700	[diff] [blame]	2910	*
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2911	* RETURNS:
				2912	* %true if flush_work() waited for the work to finish execution,
				2913	* %false if it was already idle.
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2914	*/
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2915	bool flush_delayed_work(struct delayed_work *dwork)
				2916	{
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2917	local_irq_disable();
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2918	if (del_timer_sync(&dwork->timer))
Lai Jiangshan	60c057b	2013-02-06 18:04:53 -0800	[diff] [blame]	2919	__queue_work(dwork->cpu, dwork->wq, &dwork->work);
Tejun Heo	8930cab	2012-08-03 10:30:45 -0700	[diff] [blame]	2920	local_irq_enable();
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2921	return flush_work(&dwork->work);
				2922	}
				2923	EXPORT_SYMBOL(flush_delayed_work);
				2924
				2925	/**
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2926	* cancel_delayed_work - cancel a delayed work
				2927	* @dwork: delayed_work to cancel
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2928	*
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2929	* Kill off a pending delayed_work. Returns %true if @dwork was pending
				2930	* and canceled; %false if wasn't pending. Note that the work callback
				2931	* function may still be running on return, unless it returns %true and the
				2932	* work doesn't re-arm itself. Explicitly flush or use
				2933	* cancel_delayed_work_sync() to wait on it.
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2934	*
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2935	* This function is safe to call from any context including IRQ handler.
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2936	*/
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2937	bool cancel_delayed_work(struct delayed_work *dwork)
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2938	{
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2939	unsigned long flags;
				2940	int ret;
				2941
				2942	do {
				2943	ret = try_to_grab_pending(&dwork->work, true, &flags);
				2944	} while (unlikely(ret == -EAGAIN));
				2945
				2946	if (unlikely(ret < 0))
				2947	return false;
				2948
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	2949	set_work_pool_and_clear_pending(&dwork->work,
				2950	get_work_pool_id(&dwork->work));
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2951	local_irq_restore(flags);
Dan Magenheimer	c0158ca	2012-10-18 16:31:37 -0700	[diff] [blame]	2952	return ret;
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2953	}
Tejun Heo	57b30ae	2012-08-21 13:18:24 -0700	[diff] [blame]	2954	EXPORT_SYMBOL(cancel_delayed_work);
Tejun Heo	0938349	2010-09-16 10:48:29 +0200	[diff] [blame]	2955
				2956	/**
Tejun Heo	401a8d0	2010-09-16 10:36:00 +0200	[diff] [blame]	2957	* cancel_delayed_work_sync - cancel a delayed work and wait for it to finish
				2958	* @dwork: the delayed work cancel
				2959	*
				2960	* This is cancel_work_sync() for delayed works.
				2961	*
				2962	* RETURNS:
				2963	* %true if @dwork was pending, %false otherwise.
				2964	*/
				2965	bool cancel_delayed_work_sync(struct delayed_work *dwork)
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2966	{
Tejun Heo	36e227d	2012-08-03 10:30:46 -0700	[diff] [blame]	2967	return __cancel_work_timer(&dwork->work, true);
Oleg Nesterov	6e84d64	2007-05-09 02:34:46 -0700	[diff] [blame]	2968	}
Oleg Nesterov	f5a421a	2007-07-15 23:41:44 -0700	[diff] [blame]	2969	EXPORT_SYMBOL(cancel_delayed_work_sync);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2970
Rolf Eike Beer	0fcb78c	2006-07-30 03:03:42 -0700	[diff] [blame]	2971	/**
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2972	* schedule_on_each_cpu - execute a function synchronously on each online CPU
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2973	* @func: the function to call
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2974	*
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2975	* schedule_on_each_cpu() executes @func on each online CPU using the
				2976	* system workqueue and blocks until all CPUs have completed.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2977	* schedule_on_each_cpu() is very slow.
Tejun Heo	31ddd87	2010-10-19 11:14:49 +0200	[diff] [blame]	2978	*
				2979	* RETURNS:
				2980	* 0 on success, -errno on failure.
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2981	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	2982	int schedule_on_each_cpu(work_func_t func)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2983	{
				2984	int cpu;
Namhyung Kim	38f5156	2010-08-08 14:24:09 +0200	[diff] [blame]	2985	struct work_struct __percpu *works;
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2986
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2987	works = alloc_percpu(struct work_struct);
				2988	if (!works)
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2989	return -ENOMEM;
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	2990
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	2991	get_online_cpus();
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2992
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	2993	for_each_online_cpu(cpu) {
Ingo Molnar	9bfb183	2006-12-18 20:05:09 +0100	[diff] [blame]	2994	struct work_struct *work = per_cpu_ptr(works, cpu);
				2995
				2996	INIT_WORK(work, func);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	2997	schedule_work_on(cpu, work);
Andi Kleen	65a6446	2009-10-14 06:22:47 +0200	[diff] [blame]	2998	}
Tejun Heo	9398180	2009-11-17 14:06:20 -0800	[diff] [blame]	2999
				3000	for_each_online_cpu(cpu)
				3001	flush_work(per_cpu_ptr(works, cpu));
				3002
Gautham R Shenoy	95402b3	2008-01-25 21:08:02 +0100	[diff] [blame]	3003	put_online_cpus();
Andrew Morton	b613677	2006-06-25 05:47:49 -0700	[diff] [blame]	3004	free_percpu(works);
Christoph Lameter	15316ba	2006-01-08 01:00:43 -0800	[diff] [blame]	3005	return 0;
				3006	}
				3007
Alan Stern	eef6a7d	2010-02-12 17:39:21 +0900	[diff] [blame]	3008	/**
				3009	* flush_scheduled_work - ensure that any scheduled work has run to completion.
				3010	*
				3011	* Forces execution of the kernel-global workqueue and blocks until its
				3012	* completion.
				3013	*
				3014	* Think twice before calling this function! It's very easy to get into
				3015	* trouble if you don't take great care. Either of the following situations
				3016	* will lead to deadlock:
				3017	*
				3018	* One of the work items currently on the workqueue needs to acquire
				3019	* a lock held by your code or its caller.
				3020	*
				3021	* Your code is running in the context of a work routine.
				3022	*
				3023	* They will be detected by lockdep when they occur, but the first might not
				3024	* occur very often. It depends on what work items are on the workqueue and
				3025	* what locks they need, which you have no control over.
				3026	*
				3027	* In most situations flushing the entire workqueue is overkill; you merely
				3028	* need to know that a particular work item isn't queued and isn't running.
				3029	* In such cases you should use cancel_delayed_work_sync() or
				3030	* cancel_work_sync() instead.
				3031	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3032	void flush_scheduled_work(void)
				3033	{
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3034	flush_workqueue(system_wq);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3035	}
Dave Jones	ae90dd5	2006-06-30 01:40:45 -0400	[diff] [blame]	3036	EXPORT_SYMBOL(flush_scheduled_work);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3037
				3038	/**
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3039	* execute_in_process_context - reliably execute the routine with user context
				3040	* @fn: the function to execute
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3041	* @ew: guaranteed storage for the execute work structure (must
				3042	* be available when the work executes)
				3043	*
				3044	* Executes the function immediately if process context is available,
				3045	* otherwise schedules the function for delayed execution.
				3046	*
				3047	* Returns: 0 - function was executed
				3048	* 1 - function was scheduled for execution
				3049	*/
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3050	int execute_in_process_context(work_func_t fn, struct execute_work *ew)
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3051	{
				3052	if (!in_interrupt()) {
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3053	fn(&ew->work);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3054	return 0;
				3055	}
				3056
David Howells	65f27f3	2006-11-22 14:55:48 +0000	[diff] [blame]	3057	INIT_WORK(&ew->work, fn);
James Bottomley	1fa44ec	2006-02-23 12:43:43 -0600	[diff] [blame]	3058	schedule_work(&ew->work);
				3059
				3060	return 1;
				3061	}
				3062	EXPORT_SYMBOL_GPL(execute_in_process_context);
				3063
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	3064	#ifdef CONFIG_SYSFS
				3065	/*
				3066	* Workqueues with WQ_SYSFS flag set is visible to userland via
				3067	* /sys/bus/workqueue/devices/WQ_NAME. All visible workqueues have the
				3068	* following attributes.
				3069	*
				3070	* per_cpu RO bool : whether the workqueue is per-cpu or unbound
				3071	* max_active RW int : maximum number of in-flight work items
				3072	*
				3073	* Unbound workqueues have the following extra attributes.
				3074	*
				3075	* id RO int : the associated pool ID
				3076	* nice RW int : nice value of the workers
				3077	* cpumask RW mask : bitmask of allowed CPUs for the workers
				3078	*/
				3079	struct wq_device {
				3080	struct workqueue_struct *wq;
				3081	struct device dev;
				3082	};
				3083
				3084	static struct workqueue_struct dev_to_wq(struct device dev)
				3085	{
				3086	struct wq_device *wq_dev = container_of(dev, struct wq_device, dev);
				3087
				3088	return wq_dev->wq;
				3089	}
				3090
				3091	static ssize_t wq_per_cpu_show(struct device *dev,
				3092	struct device_attribute attr, char buf)
				3093	{
				3094	struct workqueue_struct *wq = dev_to_wq(dev);
				3095
				3096	return scnprintf(buf, PAGE_SIZE, "%d\n", (bool)!(wq->flags & WQ_UNBOUND));
				3097	}
				3098
				3099	static ssize_t wq_max_active_show(struct device *dev,
				3100	struct device_attribute attr, char buf)
				3101	{
				3102	struct workqueue_struct *wq = dev_to_wq(dev);
				3103
				3104	return scnprintf(buf, PAGE_SIZE, "%d\n", wq->saved_max_active);
				3105	}
				3106
				3107	static ssize_t wq_max_active_store(struct device *dev,
				3108	struct device_attribute *attr,
				3109	const char *buf, size_t count)
				3110	{
				3111	struct workqueue_struct *wq = dev_to_wq(dev);
				3112	int val;
				3113
				3114	if (sscanf(buf, "%d", &val) != 1 \|\| val <= 0)
				3115	return -EINVAL;
				3116
				3117	workqueue_set_max_active(wq, val);
				3118	return count;
				3119	}
				3120
				3121	static struct device_attribute wq_sysfs_attrs[] = {
				3122	__ATTR(per_cpu, 0444, wq_per_cpu_show, NULL),
				3123	__ATTR(max_active, 0644, wq_max_active_show, wq_max_active_store),
				3124	__ATTR_NULL,
				3125	};
				3126
				3127	static ssize_t wq_pool_id_show(struct device *dev,
				3128	struct device_attribute attr, char buf)
				3129	{
				3130	struct workqueue_struct *wq = dev_to_wq(dev);
				3131	struct worker_pool *pool;
				3132	int written;
				3133
				3134	rcu_read_lock_sched();
				3135	pool = first_pwq(wq)->pool;
				3136	written = scnprintf(buf, PAGE_SIZE, "%d\n", pool->id);
				3137	rcu_read_unlock_sched();
				3138
				3139	return written;
				3140	}
				3141
				3142	static ssize_t wq_nice_show(struct device dev, struct device_attribute attr,
				3143	char *buf)
				3144	{
				3145	struct workqueue_struct *wq = dev_to_wq(dev);
				3146	int written;
				3147
				3148	rcu_read_lock_sched();
				3149	written = scnprintf(buf, PAGE_SIZE, "%d\n",
				3150	first_pwq(wq)->pool->attrs->nice);
				3151	rcu_read_unlock_sched();
				3152
				3153	return written;
				3154	}
				3155
				3156	/* prepare workqueue_attrs for sysfs store operations */
				3157	static struct workqueue_attrs wq_sysfs_prep_attrs(struct workqueue_struct wq)
				3158	{
				3159	struct workqueue_attrs *attrs;
				3160
				3161	attrs = alloc_workqueue_attrs(GFP_KERNEL);
				3162	if (!attrs)
				3163	return NULL;
				3164
				3165	rcu_read_lock_sched();
				3166	copy_workqueue_attrs(attrs, first_pwq(wq)->pool->attrs);
				3167	rcu_read_unlock_sched();
				3168	return attrs;
				3169	}
				3170
				3171	static ssize_t wq_nice_store(struct device dev, struct device_attribute attr,
				3172	const char *buf, size_t count)
				3173	{
				3174	struct workqueue_struct *wq = dev_to_wq(dev);
				3175	struct workqueue_attrs *attrs;
				3176	int ret;
				3177
				3178	attrs = wq_sysfs_prep_attrs(wq);
				3179	if (!attrs)
				3180	return -ENOMEM;
				3181
				3182	if (sscanf(buf, "%d", &attrs->nice) == 1 &&
				3183	attrs->nice >= -20 && attrs->nice <= 19)
				3184	ret = apply_workqueue_attrs(wq, attrs);
				3185	else
				3186	ret = -EINVAL;
				3187
				3188	free_workqueue_attrs(attrs);
				3189	return ret ?: count;
				3190	}
				3191
				3192	static ssize_t wq_cpumask_show(struct device *dev,
				3193	struct device_attribute attr, char buf)
				3194	{
				3195	struct workqueue_struct *wq = dev_to_wq(dev);
				3196	int written;
				3197
				3198	rcu_read_lock_sched();
				3199	written = cpumask_scnprintf(buf, PAGE_SIZE,
				3200	first_pwq(wq)->pool->attrs->cpumask);
				3201	rcu_read_unlock_sched();
				3202
				3203	written += scnprintf(buf + written, PAGE_SIZE - written, "\n");
				3204	return written;
				3205	}
				3206
				3207	static ssize_t wq_cpumask_store(struct device *dev,
				3208	struct device_attribute *attr,
				3209	const char *buf, size_t count)
				3210	{
				3211	struct workqueue_struct *wq = dev_to_wq(dev);
				3212	struct workqueue_attrs *attrs;
				3213	int ret;
				3214
				3215	attrs = wq_sysfs_prep_attrs(wq);
				3216	if (!attrs)
				3217	return -ENOMEM;
				3218
				3219	ret = cpumask_parse(buf, attrs->cpumask);
				3220	if (!ret)
				3221	ret = apply_workqueue_attrs(wq, attrs);
				3222
				3223	free_workqueue_attrs(attrs);
				3224	return ret ?: count;
				3225	}
				3226
				3227	static struct device_attribute wq_sysfs_unbound_attrs[] = {
				3228	__ATTR(pool_id, 0444, wq_pool_id_show, NULL),
				3229	__ATTR(nice, 0644, wq_nice_show, wq_nice_store),
				3230	__ATTR(cpumask, 0644, wq_cpumask_show, wq_cpumask_store),
				3231	__ATTR_NULL,
				3232	};
				3233
				3234	static struct bus_type wq_subsys = {
				3235	.name = "workqueue",
				3236	.dev_attrs = wq_sysfs_attrs,
				3237	};
				3238
				3239	static int __init wq_sysfs_init(void)
				3240	{
				3241	return subsys_virtual_register(&wq_subsys, NULL);
				3242	}
				3243	core_initcall(wq_sysfs_init);
				3244
				3245	static void wq_device_release(struct device *dev)
				3246	{
				3247	struct wq_device *wq_dev = container_of(dev, struct wq_device, dev);
				3248
				3249	kfree(wq_dev);
				3250	}
				3251
				3252	/**
				3253	* workqueue_sysfs_register - make a workqueue visible in sysfs
				3254	* @wq: the workqueue to register
				3255	*
				3256	* Expose @wq in sysfs under /sys/bus/workqueue/devices.
				3257	* alloc_workqueue*() automatically calls this function if WQ_SYSFS is set
				3258	* which is the preferred method.
				3259	*
				3260	* Workqueue user should use this function directly iff it wants to apply
				3261	* workqueue_attrs before making the workqueue visible in sysfs; otherwise,
				3262	* apply_workqueue_attrs() may race against userland updating the
				3263	* attributes.
				3264	*
				3265	* Returns 0 on success, -errno on failure.
				3266	*/
				3267	int workqueue_sysfs_register(struct workqueue_struct *wq)
				3268	{
				3269	struct wq_device *wq_dev;
				3270	int ret;
				3271
				3272	/*
				3273	* Adjusting max_active or creating new pwqs by applyting
				3274	* attributes breaks ordering guarantee. Disallow exposing ordered
				3275	* workqueues.
				3276	*/
				3277	if (WARN_ON(wq->flags & __WQ_ORDERED))
				3278	return -EINVAL;
				3279
				3280	wq->wq_dev = wq_dev = kzalloc(sizeof(*wq_dev), GFP_KERNEL);
				3281	if (!wq_dev)
				3282	return -ENOMEM;
				3283
				3284	wq_dev->wq = wq;
				3285	wq_dev->dev.bus = &wq_subsys;
				3286	wq_dev->dev.init_name = wq->name;
				3287	wq_dev->dev.release = wq_device_release;
				3288
				3289	/*
				3290	* unbound_attrs are created separately. Suppress uevent until
				3291	* everything is ready.
				3292	*/
				3293	dev_set_uevent_suppress(&wq_dev->dev, true);
				3294
				3295	ret = device_register(&wq_dev->dev);
				3296	if (ret) {
				3297	kfree(wq_dev);
				3298	wq->wq_dev = NULL;
				3299	return ret;
				3300	}
				3301
				3302	if (wq->flags & WQ_UNBOUND) {
				3303	struct device_attribute *attr;
				3304
				3305	for (attr = wq_sysfs_unbound_attrs; attr->attr.name; attr++) {
				3306	ret = device_create_file(&wq_dev->dev, attr);
				3307	if (ret) {
				3308	device_unregister(&wq_dev->dev);
				3309	wq->wq_dev = NULL;
				3310	return ret;
				3311	}
				3312	}
				3313	}
				3314
				3315	kobject_uevent(&wq_dev->dev.kobj, KOBJ_ADD);
				3316	return 0;
				3317	}
				3318
				3319	/**
				3320	* workqueue_sysfs_unregister - undo workqueue_sysfs_register()
				3321	* @wq: the workqueue to unregister
				3322	*
				3323	* If @wq is registered to sysfs by workqueue_sysfs_register(), unregister.
				3324	*/
				3325	static void workqueue_sysfs_unregister(struct workqueue_struct *wq)
				3326	{
				3327	struct wq_device *wq_dev = wq->wq_dev;
				3328
				3329	if (!wq->wq_dev)
				3330	return;
				3331
				3332	wq->wq_dev = NULL;
				3333	device_unregister(&wq_dev->dev);
				3334	}
				3335	#else /* CONFIG_SYSFS */
				3336	static void workqueue_sysfs_unregister(struct workqueue_struct *wq) { }
				3337	#endif /* CONFIG_SYSFS */
				3338
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3339	/**
				3340	* free_workqueue_attrs - free a workqueue_attrs
				3341	* @attrs: workqueue_attrs to free
				3342	*
				3343	* Undo alloc_workqueue_attrs().
				3344	*/
				3345	void free_workqueue_attrs(struct workqueue_attrs *attrs)
				3346	{
				3347	if (attrs) {
				3348	free_cpumask_var(attrs->cpumask);
				3349	kfree(attrs);
				3350	}
				3351	}
				3352
				3353	/**
				3354	* alloc_workqueue_attrs - allocate a workqueue_attrs
				3355	* @gfp_mask: allocation mask to use
				3356	*
				3357	* Allocate a new workqueue_attrs, initialize with default settings and
				3358	* return it. Returns NULL on failure.
				3359	*/
				3360	struct workqueue_attrs *alloc_workqueue_attrs(gfp_t gfp_mask)
				3361	{
				3362	struct workqueue_attrs *attrs;
				3363
				3364	attrs = kzalloc(sizeof(*attrs), gfp_mask);
				3365	if (!attrs)
				3366	goto fail;
				3367	if (!alloc_cpumask_var(&attrs->cpumask, gfp_mask))
				3368	goto fail;
				3369
				3370	cpumask_setall(attrs->cpumask);
				3371	return attrs;
				3372	fail:
				3373	free_workqueue_attrs(attrs);
				3374	return NULL;
				3375	}
				3376
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3377	static void copy_workqueue_attrs(struct workqueue_attrs *to,
				3378	const struct workqueue_attrs *from)
				3379	{
				3380	to->nice = from->nice;
				3381	cpumask_copy(to->cpumask, from->cpumask);
				3382	}
				3383
				3384	/*
				3385	* Hacky implementation of jhash of bitmaps which only considers the
				3386	* specified number of bits. We probably want a proper implementation in
				3387	* include/linux/jhash.h.
				3388	*/
				3389	static u32 jhash_bitmap(const unsigned long *bitmap, int bits, u32 hash)
				3390	{
				3391	int nr_longs = bits / BITS_PER_LONG;
				3392	int nr_leftover = bits % BITS_PER_LONG;
				3393	unsigned long leftover = 0;
				3394
				3395	if (nr_longs)
				3396	hash = jhash(bitmap, nr_longs * sizeof(long), hash);
				3397	if (nr_leftover) {
				3398	bitmap_copy(&leftover, bitmap + nr_longs, nr_leftover);
				3399	hash = jhash(&leftover, sizeof(long), hash);
				3400	}
				3401	return hash;
				3402	}
				3403
				3404	/* hash value of the content of @attr */
				3405	static u32 wqattrs_hash(const struct workqueue_attrs *attrs)
				3406	{
				3407	u32 hash = 0;
				3408
				3409	hash = jhash_1word(attrs->nice, hash);
				3410	hash = jhash_bitmap(cpumask_bits(attrs->cpumask), nr_cpu_ids, hash);
				3411	return hash;
				3412	}
				3413
				3414	/* content equality test */
				3415	static bool wqattrs_equal(const struct workqueue_attrs *a,
				3416	const struct workqueue_attrs *b)
				3417	{
				3418	if (a->nice != b->nice)
				3419	return false;
				3420	if (!cpumask_equal(a->cpumask, b->cpumask))
				3421	return false;
				3422	return true;
				3423	}
				3424
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3425	/**
				3426	* init_worker_pool - initialize a newly zalloc'd worker_pool
				3427	* @pool: worker_pool to initialize
				3428	*
				3429	* Initiailize a newly zalloc'd @pool. It also allocates @pool->attrs.
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3430	* Returns 0 on success, -errno on failure. Even on failure, all fields
				3431	* inside @pool proper are initialized and put_unbound_pool() can be called
				3432	* on @pool safely to release it.
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3433	*/
				3434	static int init_worker_pool(struct worker_pool *pool)
Tejun Heo	4e1a1f9	2013-03-12 11:30:00 -0700	[diff] [blame]	3435	{
				3436	spin_lock_init(&pool->lock);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3437	pool->id = -1;
				3438	pool->cpu = -1;
Tejun Heo	4e1a1f9	2013-03-12 11:30:00 -0700	[diff] [blame]	3439	pool->flags \|= POOL_DISASSOCIATED;
				3440	INIT_LIST_HEAD(&pool->worklist);
				3441	INIT_LIST_HEAD(&pool->idle_list);
				3442	hash_init(pool->busy_hash);
				3443
				3444	init_timer_deferrable(&pool->idle_timer);
				3445	pool->idle_timer.function = idle_worker_timeout;
				3446	pool->idle_timer.data = (unsigned long)pool;
				3447
				3448	setup_timer(&pool->mayday_timer, pool_mayday_timeout,
				3449	(unsigned long)pool);
				3450
				3451	mutex_init(&pool->manager_arb);
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	3452	mutex_init(&pool->manager_mutex);
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	3453	idr_init(&pool->worker_idr);
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3454
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3455	INIT_HLIST_NODE(&pool->hash_node);
				3456	pool->refcnt = 1;
				3457
				3458	/* shouldn't fail above this point */
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	3459	pool->attrs = alloc_workqueue_attrs(GFP_KERNEL);
				3460	if (!pool->attrs)
				3461	return -ENOMEM;
				3462	return 0;
Tejun Heo	4e1a1f9	2013-03-12 11:30:00 -0700	[diff] [blame]	3463	}
				3464
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3465	static void rcu_free_pool(struct rcu_head *rcu)
				3466	{
				3467	struct worker_pool *pool = container_of(rcu, struct worker_pool, rcu);
				3468
Tejun Heo	822d840	2013-03-19 13:45:21 -0700	[diff] [blame]	3469	idr_destroy(&pool->worker_idr);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3470	free_workqueue_attrs(pool->attrs);
				3471	kfree(pool);
				3472	}
				3473
				3474	/**
				3475	* put_unbound_pool - put a worker_pool
				3476	* @pool: worker_pool to put
				3477	*
				3478	* Put @pool. If its refcnt reaches zero, it gets destroyed in sched-RCU
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	3479	* safe manner. get_unbound_pool() calls this function on its failure path
				3480	* and this function should be able to release pools which went through,
				3481	* successfully or not, init_worker_pool().
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3482	*/
				3483	static void put_unbound_pool(struct worker_pool *pool)
				3484	{
				3485	struct worker *worker;
				3486
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3487	mutex_lock(&wq_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3488	if (--pool->refcnt) {
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3489	mutex_unlock(&wq_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3490	return;
				3491	}
				3492
				3493	/* sanity checks */
				3494	if (WARN_ON(!(pool->flags & POOL_DISASSOCIATED)) \|\|
				3495	WARN_ON(!list_empty(&pool->worklist))) {
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3496	mutex_unlock(&wq_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3497	return;
				3498	}
				3499
				3500	/* release id and unhash */
				3501	if (pool->id >= 0)
				3502	idr_remove(&worker_pool_idr, pool->id);
				3503	hash_del(&pool->hash_node);
				3504
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3505	mutex_unlock(&wq_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3506
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	3507	/*
				3508	* Become the manager and destroy all workers. Grabbing
				3509	* manager_arb prevents @pool's workers from blocking on
				3510	* manager_mutex.
				3511	*/
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3512	mutex_lock(&pool->manager_arb);
Tejun Heo	cd54968	2013-03-13 19:47:39 -0700	[diff] [blame]	3513	mutex_lock(&pool->manager_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3514	spin_lock_irq(&pool->lock);
				3515
				3516	while ((worker = first_worker(pool)))
				3517	destroy_worker(worker);
				3518	WARN_ON(pool->nr_workers \|\| pool->nr_idle);
				3519
				3520	spin_unlock_irq(&pool->lock);
Tejun Heo	cd54968	2013-03-13 19:47:39 -0700	[diff] [blame]	3521	mutex_unlock(&pool->manager_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3522	mutex_unlock(&pool->manager_arb);
				3523
				3524	/* shut down the timers */
				3525	del_timer_sync(&pool->idle_timer);
				3526	del_timer_sync(&pool->mayday_timer);
				3527
				3528	/* sched-RCU protected to allow dereferences from get_work_pool() */
				3529	call_rcu_sched(&pool->rcu, rcu_free_pool);
				3530	}
				3531
				3532	/**
				3533	* get_unbound_pool - get a worker_pool with the specified attributes
				3534	* @attrs: the attributes of the worker_pool to get
				3535	*
				3536	* Obtain a worker_pool which has the same attributes as @attrs, bump the
				3537	* reference count and return it. If there already is a matching
				3538	* worker_pool, it will be used; otherwise, this function attempts to
				3539	* create a new one. On failure, returns NULL.
				3540	*/
				3541	static struct worker_pool get_unbound_pool(const struct workqueue_attrs attrs)
				3542	{
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3543	u32 hash = wqattrs_hash(attrs);
				3544	struct worker_pool *pool;
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3545
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3546	mutex_lock(&wq_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3547
				3548	/* do we already have a matching pool? */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3549	hash_for_each_possible(unbound_pool_hash, pool, hash_node, hash) {
				3550	if (wqattrs_equal(pool->attrs, attrs)) {
				3551	pool->refcnt++;
				3552	goto out_unlock;
				3553	}
				3554	}
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3555
				3556	/* nope, create a new one */
				3557	pool = kzalloc(sizeof(*pool), GFP_KERNEL);
				3558	if (!pool \|\| init_worker_pool(pool) < 0)
				3559	goto fail;
				3560
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3561	lockdep_set_subclass(&pool->lock, 1); /* see put_pwq() */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3562	copy_workqueue_attrs(pool->attrs, attrs);
				3563
				3564	if (worker_pool_assign_id(pool) < 0)
				3565	goto fail;
				3566
				3567	/* create and start the initial worker */
Tejun Heo	ebf44d1	2013-03-13 19:47:39 -0700	[diff] [blame]	3568	if (create_and_start_worker(pool) < 0)
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3569	goto fail;
				3570
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3571	/* install */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3572	hash_add(unbound_pool_hash, &pool->hash_node, hash);
				3573	out_unlock:
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3574	mutex_unlock(&wq_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3575	return pool;
				3576	fail:
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3577	mutex_unlock(&wq_mutex);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3578	if (pool)
				3579	put_unbound_pool(pool);
				3580	return NULL;
				3581	}
				3582
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3583	static void rcu_free_pwq(struct rcu_head *rcu)
				3584	{
				3585	kmem_cache_free(pwq_cache,
				3586	container_of(rcu, struct pool_workqueue, rcu));
				3587	}
				3588
				3589	/*
				3590	* Scheduled on system_wq by put_pwq() when an unbound pwq hits zero refcnt
				3591	* and needs to be destroyed.
				3592	*/
				3593	static void pwq_unbound_release_workfn(struct work_struct *work)
				3594	{
				3595	struct pool_workqueue *pwq = container_of(work, struct pool_workqueue,
				3596	unbound_release_work);
				3597	struct workqueue_struct *wq = pwq->wq;
				3598	struct worker_pool *pool = pwq->pool;
				3599
				3600	if (WARN_ON_ONCE(!(wq->flags & WQ_UNBOUND)))
				3601	return;
				3602
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3603	/*
				3604	* Unlink @pwq. Synchronization against flush_mutex isn't strictly
				3605	* necessary on release but do it anyway. It's easier to verify
				3606	* and consistent with the linking path.
				3607	*/
				3608	mutex_lock(&wq->flush_mutex);
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3609	spin_lock_irq(&pwq_lock);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3610	list_del_rcu(&pwq->pwqs_node);
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3611	spin_unlock_irq(&pwq_lock);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3612	mutex_unlock(&wq->flush_mutex);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3613
				3614	put_unbound_pool(pool);
				3615	call_rcu_sched(&pwq->rcu, rcu_free_pwq);
				3616
				3617	/*
				3618	* If we're the last pwq going away, @wq is already dead and no one
				3619	* is gonna access it anymore. Free it.
				3620	*/
				3621	if (list_empty(&wq->pwqs))
				3622	kfree(wq);
				3623	}
				3624
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3625	/**
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3626	* pwq_adjust_max_active - update a pwq's max_active to the current setting
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3627	* @pwq: target pool_workqueue
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3628	*
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3629	* If @pwq isn't freezing, set @pwq->max_active to the associated
				3630	* workqueue's saved_max_active and activate delayed work items
				3631	* accordingly. If @pwq is freezing, clear @pwq->max_active to zero.
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3632	*/
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3633	static void pwq_adjust_max_active(struct pool_workqueue *pwq)
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3634	{
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3635	struct workqueue_struct *wq = pwq->wq;
				3636	bool freezable = wq->flags & WQ_FREEZABLE;
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3637
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3638	/* for @wq->saved_max_active */
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3639	lockdep_assert_held(&pwq_lock);
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3640
				3641	/* fast exit for non-freezable wqs */
				3642	if (!freezable && pwq->max_active == wq->saved_max_active)
				3643	return;
				3644
				3645	spin_lock(&pwq->pool->lock);
				3646
				3647	if (!freezable \|\| !(pwq->pool->flags & POOL_FREEZING)) {
				3648	pwq->max_active = wq->saved_max_active;
				3649
				3650	while (!list_empty(&pwq->delayed_works) &&
				3651	pwq->nr_active < pwq->max_active)
				3652	pwq_activate_first_delayed(pwq);
				3653	} else {
				3654	pwq->max_active = 0;
				3655	}
				3656
				3657	spin_unlock(&pwq->pool->lock);
Tejun Heo	0fbd95a	2013-03-13 16:51:35 -0700	[diff] [blame]	3658	}
				3659
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3660	static void init_and_link_pwq(struct pool_workqueue *pwq,
				3661	struct workqueue_struct *wq,
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3662	struct worker_pool *pool,
				3663	struct pool_workqueue **p_last_pwq)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3664	{
				3665	BUG_ON((unsigned long)pwq & WORK_STRUCT_FLAG_MASK);
				3666
				3667	pwq->pool = pool;
				3668	pwq->wq = wq;
				3669	pwq->flush_color = -1;
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3670	pwq->refcnt = 1;
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3671	INIT_LIST_HEAD(&pwq->delayed_works);
				3672	INIT_LIST_HEAD(&pwq->mayday_node);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3673	INIT_WORK(&pwq->unbound_release_work, pwq_unbound_release_workfn);
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3674
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3675	mutex_lock(&wq->flush_mutex);
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3676	spin_lock_irq(&pwq_lock);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3677
Tejun Heo	983ca25	2013-03-13 16:51:35 -0700	[diff] [blame]	3678	/*
				3679	* Set the matching work_color. This is synchronized with
				3680	* flush_mutex to avoid confusing flush_workqueue().
				3681	*/
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3682	if (p_last_pwq)
				3683	*p_last_pwq = first_pwq(wq);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3684	pwq->work_color = wq->work_color;
Tejun Heo	983ca25	2013-03-13 16:51:35 -0700	[diff] [blame]	3685
				3686	/* sync max_active to the current setting */
				3687	pwq_adjust_max_active(pwq);
				3688
				3689	/* link in @pwq */
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3690	list_add_rcu(&pwq->pwqs_node, &wq->pwqs);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3691
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3692	spin_unlock_irq(&pwq_lock);
Tejun Heo	75ccf59	2013-03-12 11:30:04 -0700	[diff] [blame]	3693	mutex_unlock(&wq->flush_mutex);
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3694	}
				3695
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3696	/**
				3697	* apply_workqueue_attrs - apply new workqueue_attrs to an unbound workqueue
				3698	* @wq: the target workqueue
				3699	* @attrs: the workqueue_attrs to apply, allocated with alloc_workqueue_attrs()
				3700	*
				3701	* Apply @attrs to an unbound workqueue @wq. If @attrs doesn't match the
				3702	* current attributes, a new pwq is created and made the first pwq which
				3703	* will serve all new work items. Older pwqs are released as in-flight
				3704	* work items finish. Note that a work item which repeatedly requeues
				3705	* itself back-to-back will stay on its current pwq.
				3706	*
				3707	* Performs GFP_KERNEL allocations. Returns 0 on success and -errno on
				3708	* failure.
				3709	*/
				3710	int apply_workqueue_attrs(struct workqueue_struct *wq,
				3711	const struct workqueue_attrs *attrs)
				3712	{
				3713	struct pool_workqueue pwq, last_pwq;
				3714	struct worker_pool *pool;
				3715
Tejun Heo	8719dce	2013-03-12 11:30:04 -0700	[diff] [blame]	3716	/* only unbound workqueues can change attributes */
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3717	if (WARN_ON(!(wq->flags & WQ_UNBOUND)))
				3718	return -EINVAL;
				3719
Tejun Heo	8719dce	2013-03-12 11:30:04 -0700	[diff] [blame]	3720	/* creating multiple pwqs breaks ordering guarantee */
				3721	if (WARN_ON((wq->flags & __WQ_ORDERED) && !list_empty(&wq->pwqs)))
				3722	return -EINVAL;
				3723
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3724	pwq = kmem_cache_zalloc(pwq_cache, GFP_KERNEL);
				3725	if (!pwq)
				3726	return -ENOMEM;
				3727
				3728	pool = get_unbound_pool(attrs);
				3729	if (!pool) {
				3730	kmem_cache_free(pwq_cache, pwq);
				3731	return -ENOMEM;
				3732	}
				3733
				3734	init_and_link_pwq(pwq, wq, pool, &last_pwq);
				3735	if (last_pwq) {
				3736	spin_lock_irq(&last_pwq->pool->lock);
				3737	put_pwq(last_pwq);
				3738	spin_unlock_irq(&last_pwq->pool->lock);
				3739	}
				3740
				3741	return 0;
				3742	}
				3743
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3744	static int alloc_and_link_pwqs(struct workqueue_struct *wq)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	3745	{
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3746	bool highpri = wq->flags & WQ_HIGHPRI;
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3747	int cpu;
Frederic Weisbecker	e1d8aa9	2009-01-12 23:15:46 +0100	[diff] [blame]	3748
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3749	if (!(wq->flags & WQ_UNBOUND)) {
Tejun Heo	420c0dd	2013-03-12 11:29:59 -0700	[diff] [blame]	3750	wq->cpu_pwqs = alloc_percpu(struct pool_workqueue);
				3751	if (!wq->cpu_pwqs)
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3752	return -ENOMEM;
				3753
				3754	for_each_possible_cpu(cpu) {
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	3755	struct pool_workqueue *pwq =
				3756	per_cpu_ptr(wq->cpu_pwqs, cpu);
Tejun Heo	7a62c2c	2013-03-12 11:30:03 -0700	[diff] [blame]	3757	struct worker_pool *cpu_pools =
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	3758	per_cpu(cpu_worker_pools, cpu);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3759
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3760	init_and_link_pwq(pwq, wq, &cpu_pools[highpri], NULL);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3761	}
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3762	return 0;
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3763	} else {
Tejun Heo	9e8cd2f	2013-03-12 11:30:04 -0700	[diff] [blame]	3764	return apply_workqueue_attrs(wq, unbound_std_wq_attrs[highpri]);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3765	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3766	}
				3767
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3768	static int wq_clamp_max_active(int max_active, unsigned int flags,
				3769	const char *name)
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3770	{
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3771	int lim = flags & WQ_UNBOUND ? WQ_UNBOUND_MAX_ACTIVE : WQ_MAX_ACTIVE;
				3772
				3773	if (max_active < 1 \|\| max_active > lim)
Valentin Ilie	044c782	2012-08-19 00:52:42 +0300	[diff] [blame]	3774	pr_warn("workqueue: max_active %d requested for %s is out of range, clamping between %d and %d\n",
				3775	max_active, name, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3776
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3777	return clamp_val(max_active, 1, lim);
Tejun Heo	b71ab8c	2010-06-29 10:07:14 +0200	[diff] [blame]	3778	}
				3779
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3780	struct workqueue_struct __alloc_workqueue_key(const char fmt,
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3781	unsigned int flags,
				3782	int max_active,
				3783	struct lock_class_key *key,
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3784	const char *lock_name, ...)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3785	{
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3786	va_list args, args1;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3787	struct workqueue_struct *wq;
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3788	struct pool_workqueue *pwq;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3789	size_t namelen;
				3790
				3791	/* determine namelen, allocate wq and format name */
				3792	va_start(args, lock_name);
				3793	va_copy(args1, args);
				3794	namelen = vsnprintf(NULL, 0, fmt, args) + 1;
				3795
				3796	wq = kzalloc(sizeof(*wq) + namelen, GFP_KERNEL);
				3797	if (!wq)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3798	return NULL;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3799
				3800	vsnprintf(wq->name, namelen, fmt, args1);
				3801	va_end(args);
				3802	va_end(args1);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3803
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3804	max_active = max_active ?: WQ_DFL_ACTIVE;
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3805	max_active = wq_clamp_max_active(max_active, flags, wq->name);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3806
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3807	/* init wq */
Tejun Heo	97e37d7	2010-06-29 10:07:10 +0200	[diff] [blame]	3808	wq->flags = flags;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3809	wq->saved_max_active = max_active;
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3810	mutex_init(&wq->flush_mutex);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	3811	atomic_set(&wq->nr_pwqs_to_flush, 0);
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3812	INIT_LIST_HEAD(&wq->pwqs);
Tejun Heo	73f53c4	2010-06-29 10:07:11 +0200	[diff] [blame]	3813	INIT_LIST_HEAD(&wq->flusher_queue);
				3814	INIT_LIST_HEAD(&wq->flusher_overflow);
Tejun Heo	493a172	2013-03-12 11:29:59 -0700	[diff] [blame]	3815	INIT_LIST_HEAD(&wq->maydays);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3816
Johannes Berg	eb13ba8	2008-01-16 09:51:58 +0100	[diff] [blame]	3817	lockdep_init_map(&wq->lockdep_map, lock_name, key, 0);
Oleg Nesterov	cce1a16	2007-05-09 02:34:13 -0700	[diff] [blame]	3818	INIT_LIST_HEAD(&wq->list);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3819
Tejun Heo	30cdf24	2013-03-12 11:29:57 -0700	[diff] [blame]	3820	if (alloc_and_link_pwqs(wq) < 0)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3821	goto err_free_wq;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3822
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	3823	/*
				3824	* Workqueues which may be used during memory reclaim should
				3825	* have a rescuer to guarantee forward progress.
				3826	*/
				3827	if (flags & WQ_MEM_RECLAIM) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3828	struct worker *rescuer;
				3829
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3830	rescuer = alloc_worker();
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3831	if (!rescuer)
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3832	goto err_destroy;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3833
Tejun Heo	111c225	2013-01-17 17:16:24 -0800	[diff] [blame]	3834	rescuer->rescue_wq = wq;
				3835	rescuer->task = kthread_create(rescuer_thread, rescuer, "%s",
Tejun Heo	b196be8	2012-01-10 15:11:35 -0800	[diff] [blame]	3836	wq->name);
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3837	if (IS_ERR(rescuer->task)) {
				3838	kfree(rescuer);
				3839	goto err_destroy;
				3840	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3841
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3842	wq->rescuer = rescuer;
Tejun Heo	14a40ff	2013-03-19 13:45:20 -0700	[diff] [blame]	3843	rescuer->task->flags \|= PF_NO_SETAFFINITY;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3844	wake_up_process(rescuer->task);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3845	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3846
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	3847	if ((wq->flags & WQ_SYSFS) && workqueue_sysfs_register(wq))
				3848	goto err_destroy;
				3849
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3850	/*
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3851	* wq_mutex protects global freeze state and workqueues list. Grab
				3852	* it, adjust max_active and add the new @wq to workqueues list.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3853	*/
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3854	mutex_lock(&wq_mutex);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3855
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3856	spin_lock_irq(&pwq_lock);
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3857	for_each_pwq(pwq, wq)
				3858	pwq_adjust_max_active(pwq);
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3859	spin_unlock_irq(&pwq_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3860
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3861	list_add(&wq->list, &workqueues);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3862
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3863	mutex_unlock(&wq_mutex);
Tejun Heo	1537663	2010-06-29 10:07:11 +0200	[diff] [blame]	3864
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3865	return wq;
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3866
				3867	err_free_wq:
				3868	kfree(wq);
				3869	return NULL;
				3870	err_destroy:
				3871	destroy_workqueue(wq);
Tejun Heo	4690c4a	2010-06-29 10:07:10 +0200	[diff] [blame]	3872	return NULL;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3873	}
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	3874	EXPORT_SYMBOL_GPL(__alloc_workqueue_key);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3875
				3876	/**
				3877	* destroy_workqueue - safely terminate a workqueue
				3878	* @wq: target workqueue
				3879	*
				3880	* Safely destroy a workqueue. All work currently pending will be done first.
				3881	*/
				3882	void destroy_workqueue(struct workqueue_struct *wq)
				3883	{
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3884	struct pool_workqueue *pwq;
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3885
Tejun Heo	9c5a2ba	2011-04-05 18:01:44 +0200	[diff] [blame]	3886	/* drain it before proceeding with destruction */
				3887	drain_workqueue(wq);
Tejun Heo	c8efcc2	2010-12-20 19:32:04 +0100	[diff] [blame]	3888
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3889	/* sanity checks */
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3890	spin_lock_irq(&pwq_lock);
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3891	for_each_pwq(pwq, wq) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3892	int i;
				3893
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	3894	for (i = 0; i < WORK_NR_COLORS; i++) {
				3895	if (WARN_ON(pwq->nr_in_flight[i])) {
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3896	spin_unlock_irq(&pwq_lock);
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3897	return;
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	3898	}
				3899	}
				3900
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3901	if (WARN_ON(pwq->refcnt > 1) \|\|
				3902	WARN_ON(pwq->nr_active) \|\|
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	3903	WARN_ON(!list_empty(&pwq->delayed_works))) {
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3904	spin_unlock_irq(&pwq_lock);
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3905	return;
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	3906	}
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3907	}
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3908	spin_unlock_irq(&pwq_lock);
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	3909
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	3910	/*
				3911	* wq list is used to freeze wq, remove from list after
				3912	* flushing is complete in case freeze races us.
				3913	*/
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3914	mutex_lock(&wq_mutex);
Tejun Heo	d2c1d40	2013-03-12 11:30:04 -0700	[diff] [blame]	3915	list_del_init(&wq->list);
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	3916	mutex_unlock(&wq_mutex);
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3917
Tejun Heo	226223a	2013-03-12 11:30:05 -0700	[diff] [blame]	3918	workqueue_sysfs_unregister(wq);
				3919
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	3920	if (wq->rescuer) {
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3921	kthread_stop(wq->rescuer->task);
Xiaotian Feng	8d9df9f	2010-08-16 09:54:28 +0200	[diff] [blame]	3922	kfree(wq->rescuer);
Tejun Heo	493008a	2013-03-12 11:30:03 -0700	[diff] [blame]	3923	wq->rescuer = NULL;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	3924	}
				3925
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3926	if (!(wq->flags & WQ_UNBOUND)) {
				3927	/*
				3928	* The base ref is never dropped on per-cpu pwqs. Directly
				3929	* free the pwqs and wq.
				3930	*/
				3931	free_percpu(wq->cpu_pwqs);
				3932	kfree(wq);
				3933	} else {
				3934	/*
				3935	* We're the sole accessor of @wq at this point. Directly
				3936	* access the first pwq and put the base ref. As both pwqs
				3937	* and pools are sched-RCU protected, the lock operations
				3938	* are safe. @wq will be freed when the last pwq is
				3939	* released.
				3940	*/
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3941	pwq = list_first_entry(&wq->pwqs, struct pool_workqueue,
				3942	pwqs_node);
Tejun Heo	8864b4e	2013-03-12 11:30:04 -0700	[diff] [blame]	3943	spin_lock_irq(&pwq->pool->lock);
				3944	put_pwq(pwq);
				3945	spin_unlock_irq(&pwq->pool->lock);
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	3946	}
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	3947	}
				3948	EXPORT_SYMBOL_GPL(destroy_workqueue);
				3949
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3950	/**
				3951	* workqueue_set_max_active - adjust max_active of a workqueue
				3952	* @wq: target workqueue
				3953	* @max_active: new max_active value.
				3954	*
				3955	* Set max_active of @wq to @max_active.
				3956	*
				3957	* CONTEXT:
				3958	* Don't call from IRQ context.
				3959	*/
				3960	void workqueue_set_max_active(struct workqueue_struct *wq, int max_active)
				3961	{
Tejun Heo	49e3cf4	2013-03-12 11:29:58 -0700	[diff] [blame]	3962	struct pool_workqueue *pwq;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3963
Tejun Heo	8719dce	2013-03-12 11:30:04 -0700	[diff] [blame]	3964	/* disallow meddling with max_active for ordered workqueues */
				3965	if (WARN_ON(wq->flags & __WQ_ORDERED))
				3966	return;
				3967
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	3968	max_active = wq_clamp_max_active(max_active, wq->flags, wq->name);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3969
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3970	spin_lock_irq(&pwq_lock);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3971
				3972	wq->saved_max_active = max_active;
				3973
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	3974	for_each_pwq(pwq, wq)
				3975	pwq_adjust_max_active(pwq);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3976
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	3977	spin_unlock_irq(&pwq_lock);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3978	}
				3979	EXPORT_SYMBOL_GPL(workqueue_set_max_active);
				3980
				3981	/**
Tejun Heo	e626761	2013-03-12 17:41:37 -0700	[diff] [blame]	3982	* current_is_workqueue_rescuer - is %current workqueue rescuer?
				3983	*
				3984	* Determine whether %current is a workqueue rescuer. Can be used from
				3985	* work functions to determine whether it's being run off the rescuer task.
				3986	*/
				3987	bool current_is_workqueue_rescuer(void)
				3988	{
				3989	struct worker *worker = current_wq_worker();
				3990
				3991	return worker && worker == worker->current_pwq->wq->rescuer;
				3992	}
				3993
				3994	/**
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	3995	* workqueue_congested - test whether a workqueue is congested
				3996	* @cpu: CPU in question
				3997	* @wq: target workqueue
				3998	*
				3999	* Test whether @wq's cpu workqueue for @cpu is congested. There is
				4000	* no synchronization around this function and the test result is
				4001	* unreliable and only useful as advisory hints or for debugging.
				4002	*
				4003	* RETURNS:
				4004	* %true if congested, %false otherwise.
				4005	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4006	bool workqueue_congested(int cpu, struct workqueue_struct *wq)
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4007	{
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	4008	struct pool_workqueue *pwq;
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4009	bool ret;
				4010
				4011	preempt_disable();
Tejun Heo	7fb98ea	2013-03-12 11:30:00 -0700	[diff] [blame]	4012
				4013	if (!(wq->flags & WQ_UNBOUND))
				4014	pwq = per_cpu_ptr(wq->cpu_pwqs, cpu);
				4015	else
				4016	pwq = first_pwq(wq);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4017
Tejun Heo	76af4d9	2013-03-12 11:30:00 -0700	[diff] [blame]	4018	ret = !list_empty(&pwq->delayed_works);
				4019	preempt_enable();
				4020
				4021	return ret;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4022	}
				4023	EXPORT_SYMBOL_GPL(workqueue_congested);
				4024
				4025	/**
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4026	* work_busy - test whether a work is currently pending or running
				4027	* @work: the work to be tested
				4028	*
				4029	* Test whether @work is currently pending or running. There is no
				4030	* synchronization around this function and the test result is
				4031	* unreliable and only useful as advisory hints or for debugging.
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4032	*
				4033	* RETURNS:
				4034	* OR'd bitmask of WORK_BUSY_* bits.
				4035	*/
				4036	unsigned int work_busy(struct work_struct *work)
				4037	{
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4038	struct worker_pool *pool;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4039	unsigned long flags;
				4040	unsigned int ret = 0;
				4041
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4042	if (work_pending(work))
				4043	ret \|= WORK_BUSY_PENDING;
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4044
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4045	local_irq_save(flags);
				4046	pool = get_work_pool(work);
Lai Jiangshan	038366c	2013-02-06 18:04:53 -0800	[diff] [blame]	4047	if (pool) {
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4048	spin_lock(&pool->lock);
Lai Jiangshan	038366c	2013-02-06 18:04:53 -0800	[diff] [blame]	4049	if (find_worker_executing_work(pool, work))
				4050	ret \|= WORK_BUSY_RUNNING;
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4051	spin_unlock(&pool->lock);
Lai Jiangshan	038366c	2013-02-06 18:04:53 -0800	[diff] [blame]	4052	}
Tejun Heo	fa1b54e	2013-03-12 11:30:00 -0700	[diff] [blame]	4053	local_irq_restore(flags);
Tejun Heo	dcd989c	2010-06-29 10:07:14 +0200	[diff] [blame]	4054
				4055	return ret;
				4056	}
				4057	EXPORT_SYMBOL_GPL(work_busy);
				4058
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4059	/*
				4060	* CPU hotplug.
				4061	*
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4062	* There are two challenges in supporting CPU hotplug. Firstly, there
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	4063	* are a lot of assumptions on strong associations among work, pwq and
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4064	* pool which make migrating pending and scheduled works very
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4065	* difficult to implement without impacting hot paths. Secondly,
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4066	* worker pools serve mix of short, long and very long running works making
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4067	* blocked draining impractical.
				4068	*
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	4069	* This is solved by allowing the pools to be disassociated from the CPU
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	4070	* running as an unbound one and allowing it to be reattached later if the
				4071	* cpu comes back online.
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4072	*/
				4073
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4074	static void wq_unbind_fn(struct work_struct *work)
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4075	{
Tejun Heo	38db41d	2013-01-24 11:01:34 -0800	[diff] [blame]	4076	int cpu = smp_processor_id();
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4077	struct worker_pool *pool;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4078	struct worker *worker;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4079	int i;
				4080
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4081	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4082	WARN_ON_ONCE(cpu != smp_processor_id());
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4083
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	4084	mutex_lock(&pool->manager_mutex);
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4085	spin_lock_irq(&pool->lock);
				4086
				4087	/*
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	4088	* We've blocked all manager operations. Make all workers
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4089	* unbound and set DISASSOCIATED. Before this, all workers
				4090	* except for the ones which are still executing works from
				4091	* before the last CPU down must be on the cpu. After
				4092	* this, they may become diasporas.
				4093	*/
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4094	list_for_each_entry(worker, &pool->idle_list, entry)
Tejun Heo	403c821	2012-07-17 12:39:27 -0700	[diff] [blame]	4095	worker->flags \|= WORKER_UNBOUND;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4096
Sasha Levin	b67bfe0	2013-02-27 17:06:00 -0800	[diff] [blame]	4097	for_each_busy_worker(worker, i, pool)
Tejun Heo	c9e7cf2	2013-01-24 11:01:33 -0800	[diff] [blame]	4098	worker->flags \|= WORKER_UNBOUND;
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4099
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	4100	pool->flags \|= POOL_DISASSOCIATED;
Tejun Heo	f2d5a0e	2012-07-17 12:39:26 -0700	[diff] [blame]	4101
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4102	spin_unlock_irq(&pool->lock);
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	4103	mutex_unlock(&pool->manager_mutex);
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4104	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4105
				4106	/*
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	4107	* Call schedule() so that we cross rq->lock and thus can guarantee
				4108	* sched callbacks see the %WORKER_UNBOUND flag. This is necessary
				4109	* as scheduler callbacks may be invoked from other cpus.
				4110	*/
				4111	schedule();
				4112
				4113	/*
				4114	* Sched callbacks are disabled now. Zap nr_running. After this,
				4115	* nr_running stays zero and need_more_worker() and keep_working()
Tejun Heo	38db41d	2013-01-24 11:01:34 -0800	[diff] [blame]	4116	* are always true as long as the worklist is not empty. Pools on
				4117	* @cpu now behave as unbound (in terms of concurrency management)
				4118	* pools which are served by workers tied to the CPU.
Tejun Heo	628c78e	2012-07-17 12:39:27 -0700	[diff] [blame]	4119	*
				4120	* On return from this function, the current worker would trigger
				4121	* unbound chain execution of pending work items if other workers
				4122	* didn't already.
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4123	*/
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4124	for_each_cpu_worker_pool(pool, cpu)
Tejun Heo	e19e397	2013-01-24 11:39:44 -0800	[diff] [blame]	4125	atomic_set(&pool->nr_running, 0);
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4126	}
				4127
Tejun Heo	bd7c089	2013-03-19 13:45:21 -0700	[diff] [blame^]	4128	/**
				4129	* rebind_workers - rebind all workers of a pool to the associated CPU
				4130	* @pool: pool of interest
				4131	*
				4132	* @pool->cpu is coming online. Rebind all workers to the CPU. Rebinding
				4133	* is different for idle and busy ones.
				4134	*
				4135	* Idle ones will be removed from the idle_list and woken up. They will
				4136	* add themselves back after completing rebind. This ensures that the
				4137	* idle_list doesn't contain any unbound workers when re-bound busy workers
				4138	* try to perform local wake-ups for concurrency management.
				4139	*
				4140	* Busy workers can rebind after they finish their current work items.
				4141	* Queueing the rebind work item at the head of the scheduled list is
				4142	* enough. Note that nr_running will be properly bumped as busy workers
				4143	* rebind.
				4144	*
				4145	* On return, all non-manager workers are scheduled for rebind - see
				4146	* manage_workers() for the manager special case. Any idle worker
				4147	* including the manager will not appear on @idle_list until rebind is
				4148	* complete, making local wake-ups safe.
				4149	*/
				4150	static void rebind_workers(struct worker_pool *pool)
				4151	{
				4152	struct worker worker, n;
				4153	int i;
				4154
				4155	lockdep_assert_held(&pool->manager_mutex);
				4156	lockdep_assert_held(&pool->lock);
				4157
				4158	/* dequeue and kick idle ones */
				4159	list_for_each_entry_safe(worker, n, &pool->idle_list, entry) {
				4160	/*
				4161	* idle workers should be off @pool->idle_list until rebind
				4162	* is complete to avoid receiving premature local wake-ups.
				4163	*/
				4164	list_del_init(&worker->entry);
				4165
				4166	/*
				4167	* worker_thread() will see the above dequeuing and call
				4168	* idle_worker_rebind().
				4169	*/
				4170	wake_up_process(worker->task);
				4171	}
				4172
				4173	/* rebind busy workers */
				4174	for_each_busy_worker(worker, i, pool) {
				4175	struct work_struct *rebind_work = &worker->rebind_work;
				4176	struct workqueue_struct *wq;
				4177
				4178	if (test_and_set_bit(WORK_STRUCT_PENDING_BIT,
				4179	work_data_bits(rebind_work)))
				4180	continue;
				4181
				4182	debug_work_activate(rebind_work);
				4183
				4184	/*
				4185	* wq doesn't really matter but let's keep @worker->pool
				4186	* and @pwq->pool consistent for sanity.
				4187	*/
				4188	if (worker->pool->attrs->nice < 0)
				4189	wq = system_highpri_wq;
				4190	else
				4191	wq = system_wq;
				4192
				4193	insert_work(per_cpu_ptr(wq->cpu_pwqs, pool->cpu), rebind_work,
				4194	worker->scheduled.next,
				4195	work_color_to_flags(WORK_NO_COLOR));
				4196	}
				4197	}
				4198
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4199	/*
				4200	* Workqueues should be brought up before normal priority CPU notifiers.
				4201	* This will be registered high priority CPU notifier.
				4202	*/
Lai Jiangshan	9fdf9b7	2012-09-18 09:59:23 -0700	[diff] [blame]	4203	static int __cpuinit workqueue_cpu_up_callback(struct notifier_block *nfb,
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4204	unsigned long action,
				4205	void *hcpu)
Oleg Nesterov	3af24433	2007-05-09 02:34:09 -0700	[diff] [blame]	4206	{
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4207	int cpu = (unsigned long)hcpu;
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4208	struct worker_pool *pool;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4209
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4210	switch (action & ~CPU_TASKS_FROZEN) {
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4211	case CPU_UP_PREPARE:
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4212	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	3ce6337	2012-07-17 12:39:27 -0700	[diff] [blame]	4213	if (pool->nr_workers)
				4214	continue;
Tejun Heo	ebf44d1	2013-03-13 19:47:39 -0700	[diff] [blame]	4215	if (create_and_start_worker(pool) < 0)
Tejun Heo	3ce6337	2012-07-17 12:39:27 -0700	[diff] [blame]	4216	return NOTIFY_BAD;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4217	}
Tejun Heo	db7bccf	2010-06-29 10:07:12 +0200	[diff] [blame]	4218	break;
Oleg Nesterov	00dfcaf	2008-04-29 01:00:27 -0700	[diff] [blame]	4219
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4220	case CPU_DOWN_FAILED:
				4221	case CPU_ONLINE:
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4222	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	4223	mutex_lock(&pool->manager_mutex);
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4224	spin_lock_irq(&pool->lock);
				4225
Tejun Heo	2464757	2013-01-24 11:01:33 -0800	[diff] [blame]	4226	pool->flags &= ~POOL_DISASSOCIATED;
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4227	rebind_workers(pool);
				4228
				4229	spin_unlock_irq(&pool->lock);
Tejun Heo	bc3a1af	2013-03-13 19:47:39 -0700	[diff] [blame]	4230	mutex_unlock(&pool->manager_mutex);
Tejun Heo	94cf58b	2013-01-24 11:01:33 -0800	[diff] [blame]	4231	}
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4232	break;
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4233	}
				4234	return NOTIFY_OK;
				4235	}
				4236
				4237	/*
				4238	* Workqueues should be brought down after normal priority CPU notifiers.
				4239	* This will be registered as low priority CPU notifier.
				4240	*/
Lai Jiangshan	9fdf9b7	2012-09-18 09:59:23 -0700	[diff] [blame]	4241	static int __cpuinit workqueue_cpu_down_callback(struct notifier_block *nfb,
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4242	unsigned long action,
				4243	void *hcpu)
				4244	{
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4245	int cpu = (unsigned long)hcpu;
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4246	struct work_struct unbind_work;
				4247
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4248	switch (action & ~CPU_TASKS_FROZEN) {
				4249	case CPU_DOWN_PREPARE:
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4250	/* unbinding should happen on the local CPU */
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4251	INIT_WORK_ONSTACK(&unbind_work, wq_unbind_fn);
Joonsoo Kim	7635d2f	2012-08-15 23:25:41 +0900	[diff] [blame]	4252	queue_work_on(cpu, system_highpri_wq, &unbind_work);
Tejun Heo	8db25e7	2012-07-17 12:39:28 -0700	[diff] [blame]	4253	flush_work(&unbind_work);
				4254	break;
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4255	}
				4256	return NOTIFY_OK;
				4257	}
				4258
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4259	#ifdef CONFIG_SMP
Rusty Russell	8ccad40	2009-01-16 15:31:15 -0800	[diff] [blame]	4260
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4261	struct work_for_cpu {
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4262	struct work_struct work;
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4263	long (fn)(void );
				4264	void *arg;
				4265	long ret;
				4266	};
				4267
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4268	static void work_for_cpu_fn(struct work_struct *work)
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4269	{
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4270	struct work_for_cpu *wfc = container_of(work, struct work_for_cpu, work);
				4271
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4272	wfc->ret = wfc->fn(wfc->arg);
				4273	}
				4274
				4275	/**
				4276	* work_on_cpu - run a function in user context on a particular cpu
				4277	* @cpu: the cpu to run on
				4278	* @fn: the function to run
				4279	* @arg: the function arg
				4280	*
Rusty Russell	31ad908	2009-01-16 15:31:15 -0800	[diff] [blame]	4281	* This will return the value @fn returns.
				4282	* It is up to the caller to ensure that the cpu doesn't go offline.
Andrew Morton	6b44003	2009-04-09 09:50:37 -0600	[diff] [blame]	4283	* The caller must not hold any locks which would prevent @fn from completing.
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4284	*/
Tejun Heo	d84ff05	2013-03-12 11:29:59 -0700	[diff] [blame]	4285	long work_on_cpu(int cpu, long (fn)(void ), void *arg)
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4286	{
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4287	struct work_for_cpu wfc = { .fn = fn, .arg = arg };
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4288
Tejun Heo	ed48ece	2012-09-18 12:48:43 -0700	[diff] [blame]	4289	INIT_WORK_ONSTACK(&wfc.work, work_for_cpu_fn);
				4290	schedule_work_on(cpu, &wfc.work);
				4291	flush_work(&wfc.work);
Rusty Russell	2d3854a	2008-11-05 13:39:10 +1100	[diff] [blame]	4292	return wfc.ret;
				4293	}
				4294	EXPORT_SYMBOL_GPL(work_on_cpu);
				4295	#endif /* CONFIG_SMP */
				4296
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4297	#ifdef CONFIG_FREEZER
Rusty Russell	e7577c5	2009-01-01 10:12:25 +1030	[diff] [blame]	4298
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4299	/**
				4300	* freeze_workqueues_begin - begin freezing workqueues
				4301	*
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	4302	* Start freezing workqueues. After this function returns, all freezable
Tejun Heo	c5aa87b	2013-03-13 16:51:36 -0700	[diff] [blame]	4303	* workqueues will queue new works to their delayed_works list instead of
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4304	* pool->worklist.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4305	*
				4306	* CONTEXT:
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	4307	* Grabs and releases wq_mutex, pwq_lock and pool->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4308	*/
				4309	void freeze_workqueues_begin(void)
				4310	{
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	4311	struct worker_pool *pool;
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4312	struct workqueue_struct *wq;
				4313	struct pool_workqueue *pwq;
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame]	4314	int pi;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4315
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4316	mutex_lock(&wq_mutex);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4317
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4318	WARN_ON_ONCE(workqueue_freezing);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4319	workqueue_freezing = true;
				4320
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4321	/* set FREEZING */
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame]	4322	for_each_pool(pool, pi) {
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4323	spin_lock_irq(&pool->lock);
Tejun Heo	1711696	2013-03-12 11:29:58 -0700	[diff] [blame]	4324	WARN_ON_ONCE(pool->flags & POOL_FREEZING);
				4325	pool->flags \|= POOL_FREEZING;
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4326	spin_unlock_irq(&pool->lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4327	}
				4328
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4329	/* suppress further executions by setting max_active to zero */
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	4330	spin_lock_irq(&pwq_lock);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4331	list_for_each_entry(wq, &workqueues, list) {
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	4332	for_each_pwq(pwq, wq)
				4333	pwq_adjust_max_active(pwq);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4334	}
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	4335	spin_unlock_irq(&pwq_lock);
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4336
				4337	mutex_unlock(&wq_mutex);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4338	}
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4339
				4340	/**
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	4341	* freeze_workqueues_busy - are freezable workqueues still busy?
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4342	*
				4343	* Check whether freezing is complete. This function must be called
				4344	* between freeze_workqueues_begin() and thaw_workqueues().
				4345	*
				4346	* CONTEXT:
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4347	* Grabs and releases wq_mutex.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4348	*
				4349	* RETURNS:
Tejun Heo	58a69cb	2011-02-16 09:25:31 +0100	[diff] [blame]	4350	* %true if some freezable workqueues are still busy. %false if freezing
				4351	* is complete.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4352	*/
				4353	bool freeze_workqueues_busy(void)
				4354	{
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4355	bool busy = false;
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4356	struct workqueue_struct *wq;
				4357	struct pool_workqueue *pwq;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4358
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4359	mutex_lock(&wq_mutex);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4360
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4361	WARN_ON_ONCE(!workqueue_freezing);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4362
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4363	list_for_each_entry(wq, &workqueues, list) {
				4364	if (!(wq->flags & WQ_FREEZABLE))
				4365	continue;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4366	/*
				4367	* nr_active is monotonically decreasing. It's safe
				4368	* to peek without lock.
				4369	*/
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4370	preempt_disable();
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4371	for_each_pwq(pwq, wq) {
Tejun Heo	6183c00	2013-03-12 11:29:57 -0700	[diff] [blame]	4372	WARN_ON_ONCE(pwq->nr_active < 0);
Tejun Heo	112202d	2013-02-13 19:29:12 -0800	[diff] [blame]	4373	if (pwq->nr_active) {
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4374	busy = true;
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4375	preempt_enable();
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4376	goto out_unlock;
				4377	}
				4378	}
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4379	preempt_enable();
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4380	}
				4381	out_unlock:
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4382	mutex_unlock(&wq_mutex);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4383	return busy;
				4384	}
				4385
				4386	/**
				4387	* thaw_workqueues - thaw workqueues
				4388	*
				4389	* Thaw workqueues. Normal queueing is restored and all collected
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4390	* frozen works are transferred to their respective pool worklists.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4391	*
				4392	* CONTEXT:
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	4393	* Grabs and releases wq_mutex, pwq_lock and pool->lock's.
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4394	*/
				4395	void thaw_workqueues(void)
				4396	{
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4397	struct workqueue_struct *wq;
				4398	struct pool_workqueue *pwq;
				4399	struct worker_pool *pool;
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame]	4400	int pi;
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4401
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4402	mutex_lock(&wq_mutex);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4403
				4404	if (!workqueue_freezing)
				4405	goto out_unlock;
				4406
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4407	/* clear FREEZING */
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame]	4408	for_each_pool(pool, pi) {
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4409	spin_lock_irq(&pool->lock);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4410	WARN_ON_ONCE(!(pool->flags & POOL_FREEZING));
				4411	pool->flags &= ~POOL_FREEZING;
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4412	spin_unlock_irq(&pool->lock);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4413	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4414
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4415	/* restore max_active and repopulate worklist */
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	4416	spin_lock_irq(&pwq_lock);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4417	list_for_each_entry(wq, &workqueues, list) {
Tejun Heo	699ce09	2013-03-13 16:51:35 -0700	[diff] [blame]	4418	for_each_pwq(pwq, wq)
				4419	pwq_adjust_max_active(pwq);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4420	}
Tejun Heo	794b18b	2013-03-13 19:47:40 -0700	[diff] [blame]	4421	spin_unlock_irq(&pwq_lock);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4422
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4423	/* kick workers */
Tejun Heo	611c92a	2013-03-13 16:51:36 -0700	[diff] [blame]	4424	for_each_pool(pool, pi) {
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4425	spin_lock_irq(&pool->lock);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4426	wake_up_worker(pool);
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4427	spin_unlock_irq(&pool->lock);
Tejun Heo	24b8a84	2013-03-12 11:29:58 -0700	[diff] [blame]	4428	}
				4429
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4430	workqueue_freezing = false;
				4431	out_unlock:
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4432	mutex_unlock(&wq_mutex);
Tejun Heo	a0a1a5f	2010-06-29 10:07:12 +0200	[diff] [blame]	4433	}
				4434	#endif /* CONFIG_FREEZER */
				4435
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	4436	static int __init init_workqueues(void)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4437	{
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4438	int std_nice[NR_STD_WORKER_POOLS] = { 0, HIGHPRI_NICE_LEVEL };
				4439	int i, cpu;
Tejun Heo	c34056a	2010-06-29 10:07:11 +0200	[diff] [blame]	4440
Tejun Heo	7c3eed5	2013-01-24 11:01:33 -0800	[diff] [blame]	4441	/* make sure we have enough bits for OFFQ pool ID */
				4442	BUILD_BUG_ON((1LU << (BITS_PER_LONG - WORK_OFFQ_POOL_SHIFT)) <
Lai Jiangshan	6be1958	2013-02-06 18:04:53 -0800	[diff] [blame]	4443	WORK_CPU_END * NR_STD_WORKER_POOLS);
Tejun Heo	b549007	2012-08-03 10:30:46 -0700	[diff] [blame]	4444
Tejun Heo	e904e6c	2013-03-12 11:29:57 -0700	[diff] [blame]	4445	WARN_ON(__alignof__(struct pool_workqueue) < __alignof__(long long));
				4446
				4447	pwq_cache = KMEM_CACHE(pool_workqueue, SLAB_PANIC);
				4448
Tejun Heo	6575820	2012-07-17 12:39:26 -0700	[diff] [blame]	4449	cpu_notifier(workqueue_cpu_up_callback, CPU_PRI_WORKQUEUE_UP);
Lai Jiangshan	a5b4e57	2012-09-18 09:59:23 -0700	[diff] [blame]	4450	hotcpu_notifier(workqueue_cpu_down_callback, CPU_PRI_WORKQUEUE_DOWN);
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4451
Tejun Heo	706026c	2013-01-24 11:01:34 -0800	[diff] [blame]	4452	/* initialize CPU pools */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4453	for_each_possible_cpu(cpu) {
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4454	struct worker_pool *pool;
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4455
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4456	i = 0;
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4457	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4458	BUG_ON(init_worker_pool(pool));
Tejun Heo	ec22ca5	2013-01-24 11:01:33 -0800	[diff] [blame]	4459	pool->cpu = cpu;
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4460	cpumask_copy(pool->attrs->cpumask, cpumask_of(cpu));
Tejun Heo	7a4e344	2013-03-12 11:30:00 -0700	[diff] [blame]	4461	pool->attrs->nice = std_nice[i++];
				4462
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	4463	/* alloc pool ID */
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4464	mutex_lock(&wq_mutex);
Tejun Heo	9daf9e6	2013-01-24 11:01:33 -0800	[diff] [blame]	4465	BUG_ON(worker_pool_assign_id(pool));
Tejun Heo	5bcab33	2013-03-13 19:47:40 -0700	[diff] [blame]	4466	mutex_unlock(&wq_mutex);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4467	}
Tejun Heo	8b03ae3	2010-06-29 10:07:12 +0200	[diff] [blame]	4468	}
				4469
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4470	/* create the initial worker */
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4471	for_each_online_cpu(cpu) {
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4472	struct worker_pool *pool;
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4473
Tejun Heo	f02ae73	2013-03-12 11:30:03 -0700	[diff] [blame]	4474	for_each_cpu_worker_pool(pool, cpu) {
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4475	pool->flags &= ~POOL_DISASSOCIATED;
Tejun Heo	ebf44d1	2013-03-13 19:47:39 -0700	[diff] [blame]	4476	BUG_ON(create_and_start_worker(pool) < 0);
Tejun Heo	4ce62e9	2012-07-13 22:16:44 -0700	[diff] [blame]	4477	}
Tejun Heo	e22bee7	2010-06-29 10:07:14 +0200	[diff] [blame]	4478	}
				4479
Tejun Heo	29c91e9	2013-03-12 11:30:03 -0700	[diff] [blame]	4480	/* create default unbound wq attrs */
				4481	for (i = 0; i < NR_STD_WORKER_POOLS; i++) {
				4482	struct workqueue_attrs *attrs;
				4483
				4484	BUG_ON(!(attrs = alloc_workqueue_attrs(GFP_KERNEL)));
				4485
				4486	attrs->nice = std_nice[i];
				4487	cpumask_setall(attrs->cpumask);
				4488
				4489	unbound_std_wq_attrs[i] = attrs;
				4490	}
				4491
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	4492	system_wq = alloc_workqueue("events", 0, 0);
Joonsoo Kim	1aabe90	2012-08-15 23:25:39 +0900	[diff] [blame]	4493	system_highpri_wq = alloc_workqueue("events_highpri", WQ_HIGHPRI, 0);
Tejun Heo	d320c03	2010-06-29 10:07:14 +0200	[diff] [blame]	4494	system_long_wq = alloc_workqueue("events_long", 0, 0);
Tejun Heo	f342179	2010-07-02 10:03:51 +0200	[diff] [blame]	4495	system_unbound_wq = alloc_workqueue("events_unbound", WQ_UNBOUND,
				4496	WQ_UNBOUND_MAX_ACTIVE);
Tejun Heo	24d51ad	2011-02-21 09:52:50 +0100	[diff] [blame]	4497	system_freezable_wq = alloc_workqueue("events_freezable",
				4498	WQ_FREEZABLE, 0);
Joonsoo Kim	1aabe90	2012-08-15 23:25:39 +0900	[diff] [blame]	4499	BUG_ON(!system_wq \|\| !system_highpri_wq \|\| !system_long_wq \|\|
Tejun Heo	ae930e0	2012-08-20 14:51:23 -0700	[diff] [blame]	4500	!system_unbound_wq \|\| !system_freezable_wq);
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	4501	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	4502	}
Suresh Siddha	6ee0578	2010-07-30 14:57:37 -0700	[diff] [blame]	4503	early_initcall(init_workqueues);