2024-01-03 2f7c68cb55ecb7331f2381deb497c27155f32faf
kernel/kernel/workqueue.c
@@ -1,3 +1,4 @@
+// SPDX-License-Identifier: GPL-2.0-only
 /*
 * kernel/workqueue.c - generic async execution with shared worker pool
 *
@@ -50,8 +51,13 @@
 #include <linux/sched/isolation.h>
 #include <linux/nmi.h>
 #include <linux/kvm_para.h>
+#include <uapi/linux/sched/types.h>

 #include "workqueue_internal.h"
+
+#include <trace/hooks/wqlockup.h>
+/* events/workqueue.h uses default TRACE_INCLUDE_PATH */
+#undef TRACE_INCLUDE_PATH

 enum {
 /*
@@ -133,7 +139,7 @@
 * PW: wq_pool_mutex and wq->mutex protected for writes. Either for reads.
 *
 * PWR: wq_pool_mutex and wq->mutex protected for writes. Either or
- * sched-RCU for reads.
+ * RCU for reads.
 *
 * WQ: wq->mutex protected.
 *
@@ -248,7 +254,7 @@
 struct list_head flusher_overflow; /* WQ: flush overflow list */

 struct list_head maydays; /* MD: pwqs requesting rescue */
- struct worker *rescuer; /* I: rescue worker */
+ struct worker *rescuer; /* MD: rescue worker */

 int nr_drainers; /* WQ: drain in progress */
 int saved_max_active; /* WQ: saved pwq max_active */
@@ -260,13 +266,15 @@
 struct wq_device *wq_dev; /* I: for sysfs interface */
 #endif
 #ifdef CONFIG_LOCKDEP
+ char *lock_name;
+ struct lock_class_key key;
 struct lockdep_map lockdep_map;
 #endif
 char name[WQ_NAME_LEN]; /* I: workqueue name */

 /*
- * Destruction of workqueue_struct is sched-RCU protected to allow
- * walking the workqueues list without grabbing wq_pool_mutex.
+ * Destruction of workqueue_struct is RCU protected to allow walking
+ * the workqueues list without grabbing wq_pool_mutex.
 * This is used to dump all workqueues from sysrq.
 */
 struct rcu_head rcu;
@@ -299,7 +307,8 @@
 static DEFINE_MUTEX(wq_pool_mutex); /* protects pools and workqueues list */
 static DEFINE_MUTEX(wq_pool_attach_mutex); /* protects worker attach/detach */
 static DEFINE_RAW_SPINLOCK(wq_mayday_lock); /* protects wq->maydays list */
-static DECLARE_SWAIT_QUEUE_HEAD(wq_manager_wait); /* wait for manager to go away */
+/* wait for manager to go away */
+static struct rcuwait manager_wait = __RCUWAIT_INITIALIZER(manager_wait);

 static LIST_HEAD(workqueues); /* PR: list of all workqueues */
 static bool workqueue_freezing; /* PL: have wqs started freezing? */
@@ -353,19 +362,18 @@

 static int worker_thread(void *__worker);
 static void workqueue_sysfs_unregister(struct workqueue_struct *wq);
+static void show_pwq(struct pool_workqueue *pwq);

 #define CREATE_TRACE_POINTS
 #include <trace/events/workqueue.h>
+
+EXPORT_TRACEPOINT_SYMBOL_GPL(workqueue_execute_start);
+EXPORT_TRACEPOINT_SYMBOL_GPL(workqueue_execute_end);

 #define assert_rcu_or_pool_mutex() \
 RCU_LOCKDEP_WARN(!rcu_read_lock_held() && \
 !lockdep_is_held(&wq_pool_mutex), \
 "RCU or wq_pool_mutex should be held")
-
-#define assert_rcu_or_wq_mutex(wq) \
- RCU_LOCKDEP_WARN(!rcu_read_lock_held() && \
- !lockdep_is_held(&wq->mutex), \
- "RCU or wq->mutex should be held")

 #define assert_rcu_or_wq_mutex_or_pool_mutex(wq) \
 RCU_LOCKDEP_WARN(!rcu_read_lock_held() && \
@@ -423,13 +431,12 @@
 * ignored.
 */
 #define for_each_pwq(pwq, wq) \
- list_for_each_entry_rcu((pwq), &(wq)->pwqs, pwqs_node) \
- if (({ assert_rcu_or_wq_mutex(wq); false; })) { } \
- else
+ list_for_each_entry_rcu((pwq), &(wq)->pwqs, pwqs_node, \
+ lockdep_is_held(&(wq->mutex)))

 #ifdef CONFIG_DEBUG_OBJECTS_WORK

-static struct debug_obj_descr work_debug_descr;
+static const struct debug_obj_descr work_debug_descr;

 static void *work_debug_hint(void *addr)
 {
@@ -479,7 +486,7 @@
 }
 }

-static struct debug_obj_descr work_debug_descr = {
+static const struct debug_obj_descr work_debug_descr = {
 .name = "work_struct",
 .debug_hint = work_debug_hint,
 .is_static_object = work_is_static_object,
@@ -647,7 +654,7 @@
 * The following mb guarantees that previous clear of a PENDING bit
 * will not be reordered with any speculative LOADS or STORES from
 * work->current_func, which is executed afterwards. This possible
- * reordering can lead to a missed execution on attempt to qeueue
+ * reordering can lead to a missed execution on attempt to queue
 * the same @work. E.g. consider this case:
 *
 * CPU#0 CPU#1
@@ -680,12 +687,17 @@
 set_work_data(work, WORK_STRUCT_NO_POOL, 0);
 }

+static inline struct pool_workqueue *work_struct_pwq(unsigned long data)
+{
+ return (struct pool_workqueue *)(data & WORK_STRUCT_WQ_DATA_MASK);
+}
+
 static struct pool_workqueue *get_work_pwq(struct work_struct *work)
 {
 unsigned long data = atomic_long_read(&work->data);

 if (data & WORK_STRUCT_PWQ)
- return (void *)(data & WORK_STRUCT_WQ_DATA_MASK);
+ return work_struct_pwq(data);
 else
 return NULL;
 }
@@ -713,8 +725,7 @@
 assert_rcu_or_pool_mutex();

 if (data & WORK_STRUCT_PWQ)
- return ((struct pool_workqueue *)
- (data & WORK_STRUCT_WQ_DATA_MASK))->pool;
+ return work_struct_pwq(data)->pool;

 pool_id = data >> WORK_OFFQ_POOL_SHIFT;
 if (pool_id == WORK_OFFQ_POOL_NONE)
@@ -735,8 +746,7 @@
 unsigned long data = atomic_long_read(&work->data);

 if (data & WORK_STRUCT_PWQ)
- return ((struct pool_workqueue *)
- (data & WORK_STRUCT_WQ_DATA_MASK))->pool->id;
+ return work_struct_pwq(data)->pool->id;

 return data >> WORK_OFFQ_POOL_SHIFT;
 }
@@ -851,8 +861,17 @@

 if (!worker->sleeping)
 return;
+
+ /*
+ * If preempted by unbind_workers() between the WORKER_NOT_RUNNING check
+ * and the nr_running increment below, we may ruin the nr_running reset
+ * and leave with an unexpected pool->nr_running == 1 on the newly unbound
+ * pool. Protect against such race.
+ */
+ preempt_disable();
 if (!(worker->flags & WORKER_NOT_RUNNING))
 atomic_inc(&worker->pool->nr_running);
+ preempt_enable();
 worker->sleeping = 0;
 }

@@ -861,7 +880,8 @@
 * @task: task going to sleep
 *
 * This function is called from schedule() when a busy worker is
- * going to sleep.
+ * going to sleep. Preemption needs to be disabled to protect ->sleeping
+ * assignment.
 */
 void wq_worker_sleeping(struct task_struct *task)
 {
@@ -878,7 +898,8 @@

 pool = worker->pool;

- if (WARN_ON_ONCE(worker->sleeping))
+ /* Return if preempted before wq_worker_running() was reached */
+ if (worker->sleeping)
 return;

 worker->sleeping = 1;
@@ -906,12 +927,23 @@

 /**
 * wq_worker_last_func - retrieve worker's last work function
+ * @task: Task to retrieve last work function of.
 *
 * Determine the last function a worker executed. This is called from
 * the scheduler to get a worker's last known identity.
 *
 * CONTEXT:
- * spin_lock_irq(rq->lock)
+ * raw_spin_lock_irq(rq->lock)
+ *
+ * This function is called during schedule() when a kworker is going
+ * to sleep. It's used by psi to identify aggregation workers during
+ * dequeuing, to allow periodic aggregation to shut-off when that
+ * worker is the last task in the system or cgroup to go to sleep.
+ *
+ * As this function doesn't involve any workqueue-related locking, it
+ * only returns stable values when called from inside the scheduler's
+ * queuing and dequeuing paths, when @task, which must be a kworker,
+ * is guaranteed to not be processing any works.
 *
 * Return:
 * The last work function %current executed as a worker, NULL if it
@@ -1201,11 +1233,14 @@
 * stable state - idle, on timer or on worklist.
 *
 * Return:
+ *
+ * ======== ================================================================
 * 1 if @work was pending and we successfully stole PENDING
 * 0 if @work was idle and we claimed PENDING
 * -EAGAIN if PENDING couldn't be grabbed at the moment, safe to busy-retry
 * -ENOENT if someone else is canceling @work, this state may persist
 * for arbitrarily long
+ * ======== ================================================================
 *
 * Note:
 * On >= 0 return, the caller owns @work's PENDING bit. To avoid getting
@@ -1313,6 +1348,9 @@
 {
 struct worker_pool *pool = pwq->pool;

+ /* record the work call stack in order to print it in KASAN reports */
+ kasan_record_aux_stack(work);
+
 /* we own @work, set data and link */
 set_work_pwq(work, pwq, extra_flags);
 list_add_tail(&work->entry, head);
@@ -1339,7 +1377,7 @@

 worker = current_wq_worker();
 /*
- * Return %true iff I'm a worker execuing a work item on @wq. If
+ * Return %true iff I'm a worker executing a work item on @wq. If
 * I'm @worker, it's safe to dereference it without locking.
 */
 return worker && worker->current_pwq->wq == wq;
@@ -1513,14 +1551,96 @@
 }
 EXPORT_SYMBOL(queue_work_on);

+/**
+ * workqueue_select_cpu_near - Select a CPU based on NUMA node
+ * @node: NUMA node ID that we want to select a CPU from
+ *
+ * This function will attempt to find a "random" cpu available on a given
+ * node. If there are no CPUs available on the given node it will return
+ * WORK_CPU_UNBOUND indicating that we should just schedule to any
+ * available CPU if we need to schedule this work.
+ */
+static int workqueue_select_cpu_near(int node)
+{
+ int cpu;
+
+ /* No point in doing this if NUMA isn't enabled for workqueues */
+ if (!wq_numa_enabled)
+ return WORK_CPU_UNBOUND;
+
+ /* Delay binding to CPU if node is not valid or online */
+ if (node < 0 || node >= MAX_NUMNODES || !node_online(node))
+ return WORK_CPU_UNBOUND;
+
+ /* Use local node/cpu if we are already there */
+ cpu = raw_smp_processor_id();
+ if (node == cpu_to_node(cpu))
+ return cpu;
+
+ /* Use "random" otherwise know as "first" online CPU of node */
+ cpu = cpumask_any_and(cpumask_of_node(node), cpu_online_mask);
+
+ /* If CPU is valid return that, otherwise just defer */
+ return cpu < nr_cpu_ids ? cpu : WORK_CPU_UNBOUND;
+}
+
+/**
+ * queue_work_node - queue work on a "random" cpu for a given NUMA node
+ * @node: NUMA node that we are targeting the work for
+ * @wq: workqueue to use
+ * @work: work to queue
+ *
+ * We queue the work to a "random" CPU within a given NUMA node. The basic
+ * idea here is to provide a way to somehow associate work with a given
+ * NUMA node.
+ *
+ * This function will only make a best effort attempt at getting this onto
+ * the right NUMA node. If no node is requested or the requested node is
+ * offline then we just fall back to standard queue_work behavior.
+ *
+ * Currently the "random" CPU ends up being the first available CPU in the
+ * intersection of cpu_online_mask and the cpumask of the node, unless we
+ * are running on the node. In that case we just use the current CPU.
+ *
+ * Return: %false if @work was already on a queue, %true otherwise.
+ */
+bool queue_work_node(int node, struct workqueue_struct *wq,
+ struct work_struct *work)
+{
+ unsigned long flags;
+ bool ret = false;
+
+ /*
+ * This current implementation is specific to unbound workqueues.
+ * Specifically we only return the first available CPU for a given
+ * node instead of cycling through individual CPUs within the node.
+ *
+ * If this is used with a per-cpu workqueue then the logic in
+ * workqueue_select_cpu_near would need to be updated to allow for
+ * some round robin type logic.
+ */
+ WARN_ON_ONCE(!(wq->flags & WQ_UNBOUND));
+
+ local_irq_save(flags);
+
+ if (!test_and_set_bit(WORK_STRUCT_PENDING_BIT, work_data_bits(work))) {
+ int cpu = workqueue_select_cpu_near(node);
+
+ __queue_work(cpu, wq, work);
+ ret = true;
+ }
+
+ local_irq_restore(flags);
+ return ret;
+}
+EXPORT_SYMBOL_GPL(queue_work_node);
+
 void delayed_work_timer_fn(struct timer_list *t)
 {
 struct delayed_work *dwork = from_timer(dwork, t, timer);
- unsigned long flags;

- local_irq_save(flags);
+ /* should have been called from irqsafe timer with irq already off */
 __queue_work(dwork->cpu, dwork->wq, &dwork->work);
- local_irq_restore(flags);
 }
 EXPORT_SYMBOL(delayed_work_timer_fn);

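For illustration, queue_work_node() added above queues a work item, best effort, on a CPU of a given NUMA node and falls back to WORK_CPU_UNBOUND when the node has no online CPU. A minimal usage sketch, assuming an unbound workqueue; stats_wq, stats_work and stats_fn are hypothetical names, not taken from this patch:

    #include <linux/workqueue.h>

    /* hypothetical caller of queue_work_node(); names are illustrative */
    static struct workqueue_struct *stats_wq;
    static struct work_struct stats_work;

    static void stats_fn(struct work_struct *work)
    {
            /* runs on a CPU of the requested node when one is online */
    }

    static int stats_init(int node)
    {
            /* queue_work_node() warns unless the workqueue is WQ_UNBOUND */
            stats_wq = alloc_workqueue("stats_wq", WQ_UNBOUND, 0);
            if (!stats_wq)
                    return -ENOMEM;

            INIT_WORK(&stats_work, stats_fn);
            /* best effort: falls back to any CPU if @node has no online CPU */
            queue_work_node(node, stats_wq, &stats_work);
            return 0;
    }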
@@ -1531,9 +1651,14 @@
 struct work_struct *work = &dwork->work;

 WARN_ON_ONCE(!wq);
-#ifndef CONFIG_CFI_CLANG
- WARN_ON_ONCE(timer->function != delayed_work_timer_fn);
-#endif
+ /*
+ * With CFI, timer->function can point to a jump table entry in a module,
+ * which fails the comparison. Disable the warning if CFI and modules are
+ * both enabled.
+ */
+ if (!IS_ENABLED(CONFIG_CFI_CLANG) || !IS_ENABLED(CONFIG_MODULES))
+ WARN_ON_ONCE(timer->function != delayed_work_timer_fn);
+
 WARN_ON_ONCE(timer_pending(timer));
 WARN_ON_ONCE(!list_empty(&work->entry));

@@ -1644,7 +1769,7 @@
 *
 * Return: %false if @rwork was already pending, %true otherwise. Note
 * that a full RCU grace period is guaranteed only after a %true return.
- * While @rwork is guarnateed to be executed after a %false return, the
+ * While @rwork is guaranteed to be executed after a %false return, the
 * execution may happen before a full RCU grace period has passed.
 */
 bool queue_rcu_work(struct workqueue_struct *wq, struct rcu_work *rwork)
@@ -1838,6 +1963,15 @@
 goto fail;

 set_user_nice(worker->task, pool->attrs->nice);
+ if (IS_ENABLED(CONFIG_ROCKCHIP_OPTIMIZE_RT_PRIO)) {
+ struct sched_param param;
+
+ if (pool->attrs->nice == 0)
+ param.sched_priority = MAX_RT_PRIO / 2 - 4;
+ else
+ param.sched_priority = MAX_RT_PRIO / 2 - 2;
+ sched_setscheduler_nocheck(worker->task, SCHED_RR, &param);
+ }
 kthread_bind_mask(worker->task, pool->attrs->cpumask);

 /* successful, attach the worker to the pool */
@@ -2047,7 +2181,7 @@

 pool->manager = NULL;
 pool->flags &= ~POOL_MANAGER_ACTIVE;
- swake_up_one(&wq_manager_wait);
+ rcuwait_wake_up(&manager_wait);
 return true;
 }

@@ -2177,13 +2311,13 @@
 * While we must be careful to not use "work" after this, the trace
 * point will only record its address.
 */
- trace_workqueue_execute_end(work);
+ trace_workqueue_execute_end(work, worker->current_func);
 lock_map_release(&lockdep_map);
 lock_map_release(&pwq->wq->lockdep_map);

 if (unlikely(in_atomic() || lockdep_depth(current) > 0)) {
 pr_err("BUG: workqueue leaked lock or atomic: %s/0x%08x/%d\n"
- " last function: %pf\n",
+ " last function: %ps\n",
 current->comm, preempt_count(), task_pid_nr(current),
 worker->current_func);
 debug_show_held_locks(current);
@@ -2191,7 +2325,7 @@
 }

 /*
- * The following prevents a kworker from hogging CPU on !PREEMPT
+ * The following prevents a kworker from hogging CPU on !PREEMPTION
 * kernels, where a requeueing work item waiting for something to
 * happen could deadlock with stop_machine as such work item could
 * indefinitely requeue itself while all other CPUs are trapped in
@@ -2436,7 +2570,7 @@
 * being used to relieve memory pressure, don't
 * incur MAYDAY_INTERVAL delay inbetween.
 */
- if (need_to_create_worker(pool)) {
+ if (pwq->nr_active && need_to_create_worker(pool)) {
 raw_spin_lock(&wq_mayday_lock);
 /*
 * Queue iff we aren't racing destruction
@@ -2508,11 +2642,11 @@
 worker = current_wq_worker();

 WARN_ONCE(current->flags & PF_MEMALLOC,
- "workqueue: PF_MEMALLOC task %d(%s) is flushing !WQ_MEM_RECLAIM %s:%pf",
+ "workqueue: PF_MEMALLOC task %d(%s) is flushing !WQ_MEM_RECLAIM %s:%ps",
 current->pid, current->comm, target_wq->name, target_func);
 WARN_ONCE(worker && ((worker->current_pwq->wq->flags &
 (WQ_MEM_RECLAIM | __WQ_LEGACY)) == WQ_MEM_RECLAIM),
- "workqueue: WQ_MEM_RECLAIM %s:%pf is flushing !WQ_MEM_RECLAIM %s:%pf",
+ "workqueue: WQ_MEM_RECLAIM %s:%ps is flushing !WQ_MEM_RECLAIM %s:%ps",
 worker->current_pwq->wq->name, worker->current_func,
 target_wq->name, target_func);
 }
@@ -2743,7 +2877,7 @@
 * First flushers are responsible for cascading flushes and
 * handling overflow. Non-first flushers can simply return.
 */
- if (wq->first_flusher != &this_flusher)
+ if (READ_ONCE(wq->first_flusher) != &this_flusher)
 return;

 mutex_lock(&wq->mutex);
@@ -2752,7 +2886,7 @@
 if (wq->first_flusher != &this_flusher)
 goto out_unlock;

- wq->first_flusher = NULL;
+ WRITE_ONCE(wq->first_flusher, NULL);

 WARN_ON_ONCE(!list_empty(&this_flusher.list));
 WARN_ON_ONCE(wq->flush_color != this_flusher.flush_color);
@@ -2943,10 +3077,8 @@
 if (WARN_ON(!work->func))
 return false;

- if (!from_cancel) {
- lock_map_acquire(&work->lockdep_map);
- lock_map_release(&work->lockdep_map);
- }
+ lock_map_acquire(&work->lockdep_map);
+ lock_map_release(&work->lockdep_map);

 if (start_flush_work(work, &barr, from_cancel)) {
 wait_for_completion(&barr.done);
@@ -3241,7 +3373,7 @@
 *
 * Undo alloc_workqueue_attrs().
 */
-static void free_workqueue_attrs(struct workqueue_attrs *attrs)
+void free_workqueue_attrs(struct workqueue_attrs *attrs)
 {
 if (attrs) {
 free_cpumask_var(attrs->cpumask);
@@ -3257,7 +3389,7 @@
 *
 * Return: The allocated new workqueue_attr on success. %NULL on failure.
 */
-static struct workqueue_attrs *alloc_workqueue_attrs(void)
+struct workqueue_attrs *alloc_workqueue_attrs(void)
 {
 struct workqueue_attrs *attrs;

@@ -3348,17 +3480,56 @@
 return 0;
 }

+#ifdef CONFIG_LOCKDEP
+static void wq_init_lockdep(struct workqueue_struct *wq)
+{
+ char *lock_name;
+
+ lockdep_register_key(&wq->key);
+ lock_name = kasprintf(GFP_KERNEL, "%s%s", "(wq_completion)", wq->name);
+ if (!lock_name)
+ lock_name = wq->name;
+
+ wq->lock_name = lock_name;
+ lockdep_init_map(&wq->lockdep_map, lock_name, &wq->key, 0);
+}
+
+static void wq_unregister_lockdep(struct workqueue_struct *wq)
+{
+ lockdep_unregister_key(&wq->key);
+}
+
+static void wq_free_lockdep(struct workqueue_struct *wq)
+{
+ if (wq->lock_name != wq->name)
+ kfree(wq->lock_name);
+}
+#else
+static void wq_init_lockdep(struct workqueue_struct *wq)
+{
+}
+
+static void wq_unregister_lockdep(struct workqueue_struct *wq)
+{
+}
+
+static void wq_free_lockdep(struct workqueue_struct *wq)
+{
+}
+#endif
+
 static void rcu_free_wq(struct rcu_head *rcu)
 {
 struct workqueue_struct *wq =
 container_of(rcu, struct workqueue_struct, rcu);
+
+ wq_free_lockdep(wq);

 if (!(wq->flags & WQ_UNBOUND))
 free_percpu(wq->cpu_pwqs);
 else
 free_workqueue_attrs(wq->unbound_attrs);

- kfree(wq->rescuer);
 kfree(wq);
 }

@@ -3369,6 +3540,18 @@
 ida_destroy(&pool->worker_ida);
 free_workqueue_attrs(pool->attrs);
 kfree(pool);
+}
+
+/* This returns with the lock held on success (pool manager is inactive). */
+static bool wq_manager_inactive(struct worker_pool *pool)
+{
+ raw_spin_lock_irq(&pool->lock);
+
+ if (pool->flags & POOL_MANAGER_ACTIVE) {
+ raw_spin_unlock_irq(&pool->lock);
+ return false;
+ }
+ return true;
 }

 /**
@@ -3406,10 +3589,11 @@
 * Become the manager and destroy all workers. This prevents
 * @pool's workers from blocking on attach_mutex. We're the last
 * manager and @pool gets freed with the flag set.
+ * Because of how wq_manager_inactive() works, we will hold the
+ * spinlock after a successful wait.
 */
- raw_spin_lock_irq(&pool->lock);
- swait_event_lock_irq(wq_manager_wait,
- !(pool->flags & POOL_MANAGER_ACTIVE), pool->lock);
+ rcuwait_wait_event(&manager_wait, wq_manager_inactive(pool),
+ TASK_UNINTERRUPTIBLE);
 pool->flags |= POOL_MANAGER_ACTIVE;

 while ((worker = first_idle_worker(pool)))
@@ -3549,8 +3733,10 @@
 * If we're the last pwq going away, @wq is already dead and no one
 * is gonna access it anymore. Schedule RCU free.
 */
- if (is_last)
+ if (is_last) {
+ wq_unregister_lockdep(wq);
 call_rcu(&wq->rcu, rcu_free_wq);
+ }
 }

 /**
@@ -3913,16 +4099,20 @@
 *
 * Performs GFP_KERNEL allocations.
 *
+ * Assumes caller has CPU hotplug read exclusion, i.e. get_online_cpus().
+ *
 * Return: 0 on success and -errno on failure.
 */
-static int apply_workqueue_attrs(struct workqueue_struct *wq,
+int apply_workqueue_attrs(struct workqueue_struct *wq,
 const struct workqueue_attrs *attrs)
 {
 int ret;

- apply_wqattrs_lock();
+ lockdep_assert_cpus_held();
+
+ mutex_lock(&wq_pool_mutex);
 ret = apply_workqueue_attrs_locked(wq, attrs);
- apply_wqattrs_unlock();
+ mutex_unlock(&wq_pool_mutex);

 return ret;
 }
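For illustration, apply_workqueue_attrs() as exported above no longer takes the CPU hotplug lock itself; as the new kernel-doc line says, the caller must hold CPU hotplug read exclusion. A sketch of a possible caller; mydrv_set_attrs and the nice value are hypothetical, and the target must be an unbound workqueue:

    #include <linux/cpu.h>          /* get_online_cpus()/put_online_cpus() */
    #include <linux/workqueue.h>

    /* hypothetical helper: retune an unbound workqueue's attributes */
    static int mydrv_set_attrs(struct workqueue_struct *unbound_wq)
    {
            struct workqueue_attrs *attrs;
            int ret;

            attrs = alloc_workqueue_attrs();
            if (!attrs)
                    return -ENOMEM;
            attrs->nice = -10;      /* arbitrary example value */

            get_online_cpus();      /* CPU hotplug read exclusion */
            ret = apply_workqueue_attrs(unbound_wq, attrs);
            put_online_cpus();

            free_workqueue_attrs(attrs);
            return ret;
    }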
@@ -4035,16 +4225,21 @@
 mutex_unlock(&wq->mutex);
 }
 return 0;
- } else if (wq->flags & __WQ_ORDERED) {
+ }
+
+ get_online_cpus();
+ if (wq->flags & __WQ_ORDERED) {
 ret = apply_workqueue_attrs(wq, ordered_wq_attrs[highpri]);
 /* there should only be single pwq for ordering guarantee */
 WARN(!ret && (wq->pwqs.next != &wq->dfl_pwq->pwqs_node ||
 wq->pwqs.prev != &wq->dfl_pwq->pwqs_node),
 "ordering guarantee broken for workqueue %s\n", wq->name);
- return ret;
 } else {
- return apply_workqueue_attrs(wq, unbound_std_wq_attrs[highpri]);
+ ret = apply_workqueue_attrs(wq, unbound_std_wq_attrs[highpri]);
 }
+ put_online_cpus();
+
+ return ret;
 }

 static int wq_clamp_max_active(int max_active, unsigned int flags,
@@ -4077,8 +4272,8 @@

 rescuer->rescue_wq = wq;
 rescuer->task = kthread_create(rescuer_thread, rescuer, "%s", wq->name);
- ret = PTR_ERR_OR_ZERO(rescuer->task);
- if (ret) {
+ if (IS_ERR(rescuer->task)) {
+ ret = PTR_ERR(rescuer->task);
 kfree(rescuer);
 return ret;
 }
@@ -4090,11 +4285,10 @@
 return 0;
 }

-struct workqueue_struct *__alloc_workqueue_key(const char *fmt,
- unsigned int flags,
- int max_active,
- struct lock_class_key *key,
- const char *lock_name, ...)
+__printf(1, 4)
+struct workqueue_struct *alloc_workqueue(const char *fmt,
+ unsigned int flags,
+ int max_active, ...)
 {
 size_t tbl_size = 0;
 va_list args;
@@ -4129,7 +4323,7 @@
 goto err_free_wq;
 }

- va_start(args, lock_name);
+ va_start(args, max_active);
 vsnprintf(wq->name, sizeof(wq->name), fmt, args);
 va_end(args);

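For illustration, alloc_workqueue() is now a real __printf(1, 4) function (the __alloc_workqueue_key()/lock_name pair is gone), and the lockdep key and name are set up internally by wq_init_lockdep(). A usage sketch under those assumptions; mydrv_wq, the format string and the flags are hypothetical:

    #include <linux/workqueue.h>

    /* hypothetical driver setup/teardown; name, flags and id are illustrative */
    static struct workqueue_struct *mydrv_wq;

    static int mydrv_init(int id)
    {
            mydrv_wq = alloc_workqueue("mydrv_wq%d",
                                       WQ_UNBOUND | WQ_MEM_RECLAIM, 0, id);
            if (!mydrv_wq)
                    return -ENOMEM;
            return 0;
    }

    static void mydrv_exit(void)
    {
            destroy_workqueue(mydrv_wq);
    }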
@@ -4146,11 +4340,11 @@
 INIT_LIST_HEAD(&wq->flusher_overflow);
 INIT_LIST_HEAD(&wq->maydays);

- lockdep_init_map(&wq->lockdep_map, lock_name, key, 0);
+ wq_init_lockdep(wq);
 INIT_LIST_HEAD(&wq->list);

 if (alloc_and_link_pwqs(wq) < 0)
- goto err_free_wq;
+ goto err_unreg_lockdep;

 if (wq_online && init_rescuer(wq) < 0)
 goto err_destroy;
@@ -4176,6 +4370,9 @@

 return wq;

+err_unreg_lockdep:
+ wq_unregister_lockdep(wq);
+ wq_free_lockdep(wq);
 err_free_wq:
 free_workqueue_attrs(wq->unbound_attrs);
 kfree(wq);
@@ -4184,7 +4381,23 @@
 destroy_workqueue(wq);
 return NULL;
 }
-EXPORT_SYMBOL_GPL(__alloc_workqueue_key);
+EXPORT_SYMBOL_GPL(alloc_workqueue);
+
+static bool pwq_busy(struct pool_workqueue *pwq)
+{
+ int i;
+
+ for (i = 0; i < WORK_NR_COLORS; i++)
+ if (pwq->nr_in_flight[i])
+ return true;
+
+ if ((pwq != pwq->wq->dfl_pwq) && (pwq->refcnt > 1))
+ return true;
+ if (pwq->nr_active || !list_empty(&pwq->delayed_works))
+ return true;
+
+ return false;
+}

 /**
 * destroy_workqueue - safely terminate a workqueue
@@ -4220,26 +4433,25 @@
 kfree(rescuer);
 }

- /* sanity checks */
+ /*
+ * Sanity checks - grab all the locks so that we wait for all
+ * in-flight operations which may do put_pwq().
+ */
+ mutex_lock(&wq_pool_mutex);
 mutex_lock(&wq->mutex);
 for_each_pwq(pwq, wq) {
- int i;
-
- for (i = 0; i < WORK_NR_COLORS; i++) {
- if (WARN_ON(pwq->nr_in_flight[i])) {
- mutex_unlock(&wq->mutex);
- show_workqueue_state();
- return;
- }
- }
-
- if (WARN_ON((pwq != wq->dfl_pwq) && (pwq->refcnt > 1)) ||
- WARN_ON(pwq->nr_active) ||
- WARN_ON(!list_empty(&pwq->delayed_works))) {
+ raw_spin_lock_irq(&pwq->pool->lock);
+ if (WARN_ON(pwq_busy(pwq))) {
+ pr_warn("%s: %s has the following busy pwq\n",
+ __func__, wq->name);
+ show_pwq(pwq);
+ raw_spin_unlock_irq(&pwq->pool->lock);
 mutex_unlock(&wq->mutex);
+ mutex_unlock(&wq_pool_mutex);
 show_workqueue_state();
 return;
 }
+ raw_spin_unlock_irq(&pwq->pool->lock);
 }
 mutex_unlock(&wq->mutex);

@@ -4247,11 +4459,11 @@
 * wq list is used to freeze wq, remove from list after
 * flushing is complete in case freeze races us.
 */
- mutex_lock(&wq_pool_mutex);
 list_del_rcu(&wq->list);
 mutex_unlock(&wq_pool_mutex);

 if (!(wq->flags & WQ_UNBOUND)) {
+ wq_unregister_lockdep(wq);
 /*
 * The base ref is never dropped on per-cpu pwqs. Directly
 * schedule RCU free.
44774689 * Carefully copy the associated workqueue's workfn, name and desc.
44784690 * Keep the original last '\0' in case the original is garbage.
44794691 */
4480
- probe_kernel_read(&fn, &worker->current_func, sizeof(fn));
4481
- probe_kernel_read(&pwq, &worker->current_pwq, sizeof(pwq));
4482
- probe_kernel_read(&wq, &pwq->wq, sizeof(wq));
4483
- probe_kernel_read(name, wq->name, sizeof(name) - 1);
4484
- probe_kernel_read(desc, worker->desc, sizeof(desc) - 1);
4692
+ copy_from_kernel_nofault(&fn, &worker->current_func, sizeof(fn));
4693
+ copy_from_kernel_nofault(&pwq, &worker->current_pwq, sizeof(pwq));
4694
+ copy_from_kernel_nofault(&wq, &pwq->wq, sizeof(wq));
4695
+ copy_from_kernel_nofault(name, wq->name, sizeof(name) - 1);
4696
+ copy_from_kernel_nofault(desc, worker->desc, sizeof(desc) - 1);
44854697
44864698 if (fn || name[0] || desc[0]) {
4487
- printk("%sWorkqueue: %s %pf", log_lvl, name, fn);
4699
+ printk("%sWorkqueue: %s %ps", log_lvl, name, fn);
44884700 if (strcmp(name, desc))
44894701 pr_cont(" (%s)", desc);
44904702 pr_cont("\n");
....@@ -4509,7 +4721,7 @@
45094721 pr_cont("%s BAR(%d)", comma ? "," : "",
45104722 task_pid_nr(barr->task));
45114723 } else {
4512
- pr_cont("%s %pf", comma ? "," : "", work->func);
4724
+ pr_cont("%s %ps", comma ? "," : "", work->func);
45134725 }
45144726 }
45154727
....@@ -4542,9 +4754,9 @@
45424754 if (worker->current_pwq != pwq)
45434755 continue;
45444756
4545
- pr_cont("%s %d%s:%pf", comma ? "," : "",
4757
+ pr_cont("%s %d%s:%ps", comma ? "," : "",
45464758 task_pid_nr(worker->task),
4547
- worker == pwq->wq->rescuer ? "(RESCUER)" : "",
4759
+ worker->rescue_wq ? "(RESCUER)" : "",
45484760 worker->current_func);
45494761 list_for_each_entry(work, &worker->scheduled, entry)
45504762 pr_cont_work(false, work);
....@@ -4704,6 +4916,7 @@
47044916
47054917 mutex_unlock(&wq_pool_attach_mutex);
47064918 }
4919
+EXPORT_SYMBOL_GPL(wq_worker_comm);
47074920
47084921 #ifdef CONFIG_SMP
47094922
....@@ -4827,7 +5040,7 @@
48275040 *
48285041 * WRITE_ONCE() is necessary because @worker->flags may be
48295042 * tested without holding any lock in
4830
- * wq_worker_waking_up(). Without it, NOT_RUNNING test may
5043
+ * wq_worker_running(). Without it, NOT_RUNNING test may
48315044 * fail incorrectly leading to premature concurrency
48325045 * management operations.
48335046 */
....@@ -5642,6 +5855,7 @@
56425855 pr_cont_pool_info(pool);
56435856 pr_cont(" stuck for %us!\n",
56445857 jiffies_to_msecs(now - pool_ts) / 1000);
5858
+ trace_android_vh_wq_lockup_pool(pool->cpu, pool_ts);
56455859 }
56465860 }
56475861
....@@ -5725,6 +5939,13 @@
57255939 return;
57265940 }
57275941
5942
+ for_each_possible_cpu(cpu) {
5943
+ if (WARN_ON(cpu_to_node(cpu) == NUMA_NO_NODE)) {
5944
+ pr_warn("workqueue: NUMA node mapping not available for cpu%d, disabling NUMA support\n", cpu);
5945
+ return;
5946
+ }
5947
+ }
5948
+
57285949 wq_update_unbound_numa_attrs_buf = alloc_workqueue_attrs();
57295950 BUG_ON(!wq_update_unbound_numa_attrs_buf);
57305951
....@@ -5742,11 +5963,6 @@
57425963
57435964 for_each_possible_cpu(cpu) {
57445965 node = cpu_to_node(cpu);
5745
- if (WARN_ON(node == NUMA_NO_NODE)) {
5746
- pr_warn("workqueue: NUMA node mapping not available for cpu%d, disabling NUMA support\n", cpu);
5747
- /* happens iff arch is bonkers, let's just proceed */
5748
- return;
5749
- }
57505966 cpumask_set_cpu(cpu, tbl[node]);
57515967 }
57525968
....@@ -5764,13 +5980,13 @@
57645980 * items. Actual work item execution starts only after kthreads can be
57655981 * created and scheduled right before early initcalls.
57665982 */
5767
-int __init workqueue_init_early(void)
5983
+void __init workqueue_init_early(void)
57685984 {
57695985 int std_nice[NR_STD_WORKER_POOLS] = { 0, HIGHPRI_NICE_LEVEL };
57705986 int hk_flags = HK_FLAG_DOMAIN | HK_FLAG_WQ;
57715987 int i, cpu;
57725988
5773
- WARN_ON(__alignof__(struct pool_workqueue) < __alignof__(long long));
5989
+ BUILD_BUG_ON(__alignof__(struct pool_workqueue) < __alignof__(long long));
57745990
57755991 BUG_ON(!alloc_cpumask_var(&wq_unbound_cpumask, GFP_KERNEL));
57765992 cpumask_copy(wq_unbound_cpumask, housekeeping_cpumask(hk_flags));
....@@ -5831,8 +6047,6 @@
58316047 !system_unbound_wq || !system_freezable_wq ||
58326048 !system_power_efficient_wq ||
58336049 !system_freezable_power_efficient_wq);
5834
-
5835
- return 0;
58366050 }
58376051
58386052 /**
....@@ -5844,7 +6058,7 @@
58446058 * are no kworkers executing the work items yet. Populate the worker pools
58456059 * with the initial workers and enable future kworker creations.
58466060 */
5847
-int __init workqueue_init(void)
6061
+void __init workqueue_init(void)
58486062 {
58496063 struct workqueue_struct *wq;
58506064 struct worker_pool *pool;
....@@ -5891,6 +6105,4 @@
58916105
58926106 wq_online = true;
58936107 wq_watchdog_init();
5894
-
5895
- return 0;
58966108 }