xref: /xnu-11215.41.3/bsd/pthread/pthread_workqueue.c (revision 33de042d024d46de5ff4e89f2471de6608e37fa4)
1*33de042dSApple OSS Distributions /*
2*33de042dSApple OSS Distributions  * Copyright (c) 2000-2020 Apple Inc. All rights reserved.
3*33de042dSApple OSS Distributions  *
4*33de042dSApple OSS Distributions  * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5*33de042dSApple OSS Distributions  *
6*33de042dSApple OSS Distributions  * This file contains Original Code and/or Modifications of Original Code
7*33de042dSApple OSS Distributions  * as defined in and that are subject to the Apple Public Source License
8*33de042dSApple OSS Distributions  * Version 2.0 (the 'License'). You may not use this file except in
9*33de042dSApple OSS Distributions  * compliance with the License. The rights granted to you under the License
10*33de042dSApple OSS Distributions  * may not be used to create, or enable the creation or redistribution of,
11*33de042dSApple OSS Distributions  * unlawful or unlicensed copies of an Apple operating system, or to
12*33de042dSApple OSS Distributions  * circumvent, violate, or enable the circumvention or violation of, any
13*33de042dSApple OSS Distributions  * terms of an Apple operating system software license agreement.
14*33de042dSApple OSS Distributions  *
15*33de042dSApple OSS Distributions  * Please obtain a copy of the License at
16*33de042dSApple OSS Distributions  * http://www.opensource.apple.com/apsl/ and read it before using this file.
17*33de042dSApple OSS Distributions  *
18*33de042dSApple OSS Distributions  * The Original Code and all software distributed under the License are
19*33de042dSApple OSS Distributions  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20*33de042dSApple OSS Distributions  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21*33de042dSApple OSS Distributions  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22*33de042dSApple OSS Distributions  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23*33de042dSApple OSS Distributions  * Please see the License for the specific language governing rights and
24*33de042dSApple OSS Distributions  * limitations under the License.
25*33de042dSApple OSS Distributions  *
26*33de042dSApple OSS Distributions  * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27*33de042dSApple OSS Distributions  */
28*33de042dSApple OSS Distributions /* Copyright (c) 1995-2018 Apple, Inc. All Rights Reserved */
29*33de042dSApple OSS Distributions 
30*33de042dSApple OSS Distributions #include <sys/cdefs.h>
31*33de042dSApple OSS Distributions 
32*33de042dSApple OSS Distributions #include <kern/assert.h>
33*33de042dSApple OSS Distributions #include <kern/ast.h>
34*33de042dSApple OSS Distributions #include <kern/clock.h>
35*33de042dSApple OSS Distributions #include <kern/cpu_data.h>
36*33de042dSApple OSS Distributions #include <kern/kern_types.h>
37*33de042dSApple OSS Distributions #include <kern/policy_internal.h>
38*33de042dSApple OSS Distributions #include <kern/processor.h>
39*33de042dSApple OSS Distributions #include <kern/sched_prim.h>    /* for thread_exception_return */
40*33de042dSApple OSS Distributions #include <kern/task.h>
41*33de042dSApple OSS Distributions #include <kern/thread.h>
42*33de042dSApple OSS Distributions #include <kern/thread_group.h>
43*33de042dSApple OSS Distributions #include <kern/zalloc.h>
44*33de042dSApple OSS Distributions #include <kern/work_interval.h>
45*33de042dSApple OSS Distributions #include <mach/kern_return.h>
46*33de042dSApple OSS Distributions #include <mach/mach_param.h>
47*33de042dSApple OSS Distributions #include <mach/mach_port.h>
48*33de042dSApple OSS Distributions #include <mach/mach_types.h>
49*33de042dSApple OSS Distributions #include <mach/mach_vm.h>
50*33de042dSApple OSS Distributions #include <mach/sync_policy.h>
51*33de042dSApple OSS Distributions #include <mach/task.h>
52*33de042dSApple OSS Distributions #include <mach/thread_act.h> /* for thread_resume */
53*33de042dSApple OSS Distributions #include <mach/thread_policy.h>
54*33de042dSApple OSS Distributions #include <mach/thread_status.h>
55*33de042dSApple OSS Distributions #include <mach/vm_prot.h>
56*33de042dSApple OSS Distributions #include <mach/vm_statistics.h>
57*33de042dSApple OSS Distributions #include <machine/atomic.h>
58*33de042dSApple OSS Distributions #include <machine/machine_routines.h>
59*33de042dSApple OSS Distributions #include <machine/smp.h>
60*33de042dSApple OSS Distributions #include <vm/vm_map.h>
61*33de042dSApple OSS Distributions #include <vm/vm_protos.h>
62*33de042dSApple OSS Distributions 
63*33de042dSApple OSS Distributions #include <sys/eventvar.h>
64*33de042dSApple OSS Distributions #include <sys/kdebug.h>
65*33de042dSApple OSS Distributions #include <sys/kernel.h>
66*33de042dSApple OSS Distributions #include <sys/lock.h>
67*33de042dSApple OSS Distributions #include <sys/param.h>
68*33de042dSApple OSS Distributions #include <sys/proc_info.h>      /* for fill_procworkqueue */
69*33de042dSApple OSS Distributions #include <sys/proc_internal.h>
70*33de042dSApple OSS Distributions #include <sys/pthread_shims.h>
71*33de042dSApple OSS Distributions #include <sys/resourcevar.h>
72*33de042dSApple OSS Distributions #include <sys/signalvar.h>
73*33de042dSApple OSS Distributions #include <sys/sysctl.h>
74*33de042dSApple OSS Distributions #include <sys/sysproto.h>
75*33de042dSApple OSS Distributions #include <sys/systm.h>
76*33de042dSApple OSS Distributions #include <sys/ulock.h> /* for ulock_owner_value_to_port_name */
77*33de042dSApple OSS Distributions 
78*33de042dSApple OSS Distributions #include <pthread/bsdthread_private.h>
79*33de042dSApple OSS Distributions #include <pthread/workqueue_syscalls.h>
80*33de042dSApple OSS Distributions #include <pthread/workqueue_internal.h>
81*33de042dSApple OSS Distributions #include <pthread/workqueue_trace.h>
82*33de042dSApple OSS Distributions 
83*33de042dSApple OSS Distributions #include <os/log.h>
84*33de042dSApple OSS Distributions 
85*33de042dSApple OSS Distributions static void workq_unpark_continue(void *uth, wait_result_t wr) __dead2;
86*33de042dSApple OSS Distributions 
87*33de042dSApple OSS Distributions static void workq_bound_thread_unpark_continue(void *uth, wait_result_t wr) __dead2;
88*33de042dSApple OSS Distributions 
89*33de042dSApple OSS Distributions static void workq_bound_thread_initialize_and_unpark_continue(void *uth, wait_result_t wr) __dead2;
90*33de042dSApple OSS Distributions 
91*33de042dSApple OSS Distributions static void workq_bound_thread_setup_and_run(struct uthread *uth, int setup_flags) __dead2;
92*33de042dSApple OSS Distributions 
93*33de042dSApple OSS Distributions static void workq_schedule_creator(proc_t p, struct workqueue *wq,
94*33de042dSApple OSS Distributions     workq_kern_threadreq_flags_t flags);
95*33de042dSApple OSS Distributions 
96*33de042dSApple OSS Distributions static bool workq_threadreq_admissible(struct workqueue *wq, struct uthread *uth,
97*33de042dSApple OSS Distributions     workq_threadreq_t req);
98*33de042dSApple OSS Distributions 
99*33de042dSApple OSS Distributions static uint32_t workq_constrained_allowance(struct workqueue *wq,
100*33de042dSApple OSS Distributions     thread_qos_t at_qos, struct uthread *uth,
101*33de042dSApple OSS Distributions     bool may_start_timer, bool record_failed_allowance);
102*33de042dSApple OSS Distributions 
103*33de042dSApple OSS Distributions static bool _wq_cooperative_queue_refresh_best_req_qos(struct workqueue *wq);
104*33de042dSApple OSS Distributions 
105*33de042dSApple OSS Distributions static bool workq_thread_is_busy(uint64_t cur_ts,
106*33de042dSApple OSS Distributions     _Atomic uint64_t *lastblocked_tsp);
107*33de042dSApple OSS Distributions 
108*33de042dSApple OSS Distributions static int workq_sysctl_handle_usecs SYSCTL_HANDLER_ARGS;
109*33de042dSApple OSS Distributions 
110*33de042dSApple OSS Distributions static bool
111*33de042dSApple OSS Distributions workq_schedule_delayed_thread_creation(struct workqueue *wq, int flags);
112*33de042dSApple OSS Distributions 
113*33de042dSApple OSS Distributions static inline void
114*33de042dSApple OSS Distributions workq_lock_spin(struct workqueue *wq);
115*33de042dSApple OSS Distributions 
116*33de042dSApple OSS Distributions static inline void
117*33de042dSApple OSS Distributions workq_unlock(struct workqueue *wq);
118*33de042dSApple OSS Distributions 
119*33de042dSApple OSS Distributions #pragma mark globals
120*33de042dSApple OSS Distributions 
/*
 * A tunable interval kept in two representations: the microsecond count
 * and the absolute-time interval that workq_sysctl_handle_usecs() derives
 * from it whenever a new value is written.
 */
struct workq_usec_var {
	uint32_t usecs;         /* interval, in microseconds */
	uint64_t abstime;       /* same interval, in absolute-time units */
};

/*
 * Define a static workq_usec_var named `var`, seeded with `init`
 * microseconds, and register it as the sysctl kern.<var>_usecs, serviced
 * by workq_sysctl_handle_usecs().
 */
#define WORKQ_SYSCTL_USECS(var, init) \
	static struct workq_usec_var var = { .usecs = (init) }; \
	SYSCTL_OID(_kern, OID_AUTO, var##_usecs, \
	    CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED, &var, 0, \
	    workq_sysctl_handle_usecs, "I", "")
131*33de042dSApple OSS Distributions 
132*33de042dSApple OSS Distributions static LCK_GRP_DECLARE(workq_lck_grp, "workq");
133*33de042dSApple OSS Distributions os_refgrp_decl(static, workq_refgrp, "workq", NULL);
134*33de042dSApple OSS Distributions 
135*33de042dSApple OSS Distributions static ZONE_DEFINE(workq_zone_workqueue, "workq.wq",
136*33de042dSApple OSS Distributions     sizeof(struct workqueue), ZC_NONE);
137*33de042dSApple OSS Distributions static ZONE_DEFINE(workq_zone_threadreq, "workq.threadreq",
138*33de042dSApple OSS Distributions     sizeof(struct workq_threadreq_s), ZC_CACHING);
139*33de042dSApple OSS Distributions 
140*33de042dSApple OSS Distributions static struct mpsc_daemon_queue workq_deallocate_queue;
141*33de042dSApple OSS Distributions 
142*33de042dSApple OSS Distributions WORKQ_SYSCTL_USECS(wq_stalled_window, WQ_STALLED_WINDOW_USECS);
143*33de042dSApple OSS Distributions WORKQ_SYSCTL_USECS(wq_reduce_pool_window, WQ_REDUCE_POOL_WINDOW_USECS);
144*33de042dSApple OSS Distributions WORKQ_SYSCTL_USECS(wq_max_timer_interval, WQ_MAX_TIMER_INTERVAL_USECS);
145*33de042dSApple OSS Distributions static uint32_t wq_max_threads              = WORKQUEUE_MAXTHREADS;
146*33de042dSApple OSS Distributions static uint32_t wq_max_constrained_threads  = WORKQUEUE_MAXTHREADS / 8;
147*33de042dSApple OSS Distributions static uint32_t wq_init_constrained_limit   = 1;
148*33de042dSApple OSS Distributions static uint16_t wq_death_max_load;
149*33de042dSApple OSS Distributions static uint32_t wq_max_parallelism[WORKQ_NUM_QOS_BUCKETS];
150*33de042dSApple OSS Distributions 
151*33de042dSApple OSS Distributions /*
152*33de042dSApple OSS Distributions  * This is not a hard limit but the max size we want to aim to hit across the
153*33de042dSApple OSS Distributions  * entire cooperative pool. We can oversubscribe the pool due to non-cooperative
154*33de042dSApple OSS Distributions  * workers and the max we will oversubscribe the pool by, is a total of
155*33de042dSApple OSS Distributions  * wq_max_cooperative_threads * WORKQ_NUM_QOS_BUCKETS.
156*33de042dSApple OSS Distributions  */
157*33de042dSApple OSS Distributions static uint32_t wq_max_cooperative_threads;
158*33de042dSApple OSS Distributions 
159*33de042dSApple OSS Distributions static inline uint32_t
wq_cooperative_queue_max_size(struct workqueue * wq)160*33de042dSApple OSS Distributions wq_cooperative_queue_max_size(struct workqueue *wq)
161*33de042dSApple OSS Distributions {
162*33de042dSApple OSS Distributions 	return wq->wq_cooperative_queue_has_limited_max_size ? 1 : wq_max_cooperative_threads;
163*33de042dSApple OSS Distributions }
164*33de042dSApple OSS Distributions 
165*33de042dSApple OSS Distributions #pragma mark sysctls
166*33de042dSApple OSS Distributions 
167*33de042dSApple OSS Distributions static int
168*33de042dSApple OSS Distributions workq_sysctl_handle_usecs SYSCTL_HANDLER_ARGS
169*33de042dSApple OSS Distributions {
170*33de042dSApple OSS Distributions #pragma unused(arg2)
171*33de042dSApple OSS Distributions 	struct workq_usec_var *v = arg1;
172*33de042dSApple OSS Distributions 	int error = sysctl_handle_int(oidp, &v->usecs, 0, req);
173*33de042dSApple OSS Distributions 	if (error || !req->newptr) {
174*33de042dSApple OSS Distributions 		return error;
175*33de042dSApple OSS Distributions 	}
176*33de042dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(v->usecs, NSEC_PER_USEC,
177*33de042dSApple OSS Distributions 	    &v->abstime);
178*33de042dSApple OSS Distributions 	return 0;
179*33de042dSApple OSS Distributions }
180*33de042dSApple OSS Distributions 
181*33de042dSApple OSS Distributions SYSCTL_INT(_kern, OID_AUTO, wq_max_threads, CTLFLAG_RW | CTLFLAG_LOCKED,
182*33de042dSApple OSS Distributions     &wq_max_threads, 0, "");
183*33de042dSApple OSS Distributions 
184*33de042dSApple OSS Distributions SYSCTL_INT(_kern, OID_AUTO, wq_max_constrained_threads, CTLFLAG_RW | CTLFLAG_LOCKED,
185*33de042dSApple OSS Distributions     &wq_max_constrained_threads, 0, "");
186*33de042dSApple OSS Distributions 
187*33de042dSApple OSS Distributions static int
188*33de042dSApple OSS Distributions wq_limit_cooperative_threads_for_proc SYSCTL_HANDLER_ARGS
189*33de042dSApple OSS Distributions {
190*33de042dSApple OSS Distributions #pragma unused(arg1, arg2, oidp)
191*33de042dSApple OSS Distributions 	int input_pool_size = 0;
192*33de042dSApple OSS Distributions 	int changed;
193*33de042dSApple OSS Distributions 	int error = 0;
194*33de042dSApple OSS Distributions 
195*33de042dSApple OSS Distributions 	error = sysctl_io_number(req, 0, sizeof(int), &input_pool_size, &changed);
196*33de042dSApple OSS Distributions 	if (error || !changed) {
197*33de042dSApple OSS Distributions 		return error;
198*33de042dSApple OSS Distributions 	}
199*33de042dSApple OSS Distributions 
200*33de042dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_SIZE_DEFAULT 0
201*33de042dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_SIZE_STRICT_PER_QOS -1
202*33de042dSApple OSS Distributions /* Not available currently, but sysctl interface is designed to allow these
203*33de042dSApple OSS Distributions  * extra parameters:
204*33de042dSApple OSS Distributions  *		WQ_COOPERATIVE_POOL_SIZE_STRICT : -2 (across all bucket)
205*33de042dSApple OSS Distributions  *		WQ_COOPERATIVE_POOL_SIZE_CUSTOM : [1, 512]
206*33de042dSApple OSS Distributions  */
207*33de042dSApple OSS Distributions 
208*33de042dSApple OSS Distributions 	if (input_pool_size != WQ_COOPERATIVE_POOL_SIZE_DEFAULT
209*33de042dSApple OSS Distributions 	    && input_pool_size != WQ_COOPERATIVE_POOL_SIZE_STRICT_PER_QOS) {
210*33de042dSApple OSS Distributions 		error = EINVAL;
211*33de042dSApple OSS Distributions 		goto out;
212*33de042dSApple OSS Distributions 	}
213*33de042dSApple OSS Distributions 
214*33de042dSApple OSS Distributions 	proc_t p = req->p;
215*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
216*33de042dSApple OSS Distributions 
217*33de042dSApple OSS Distributions 	if (wq != NULL) {
218*33de042dSApple OSS Distributions 		workq_lock_spin(wq);
219*33de042dSApple OSS Distributions 		if (wq->wq_reqcount > 0 || wq->wq_nthreads > 0) {
220*33de042dSApple OSS Distributions 			// Hackily enforce that the workqueue is still new (no requests or
221*33de042dSApple OSS Distributions 			// threads)
222*33de042dSApple OSS Distributions 			error = ENOTSUP;
223*33de042dSApple OSS Distributions 		} else {
224*33de042dSApple OSS Distributions 			wq->wq_cooperative_queue_has_limited_max_size = (input_pool_size == WQ_COOPERATIVE_POOL_SIZE_STRICT_PER_QOS);
225*33de042dSApple OSS Distributions 		}
226*33de042dSApple OSS Distributions 		workq_unlock(wq);
227*33de042dSApple OSS Distributions 	} else {
228*33de042dSApple OSS Distributions 		/* This process has no workqueue, calling this syctl makes no sense */
229*33de042dSApple OSS Distributions 		return ENOTSUP;
230*33de042dSApple OSS Distributions 	}
231*33de042dSApple OSS Distributions 
232*33de042dSApple OSS Distributions out:
233*33de042dSApple OSS Distributions 	return error;
234*33de042dSApple OSS Distributions }
235*33de042dSApple OSS Distributions 
236*33de042dSApple OSS Distributions SYSCTL_PROC(_kern, OID_AUTO, wq_limit_cooperative_threads,
237*33de042dSApple OSS Distributions     CTLFLAG_ANYBODY | CTLFLAG_MASKED | CTLFLAG_WR | CTLFLAG_LOCKED | CTLTYPE_INT, 0, 0,
238*33de042dSApple OSS Distributions     wq_limit_cooperative_threads_for_proc,
239*33de042dSApple OSS Distributions     "I", "Modify the max pool size of the cooperative pool");
240*33de042dSApple OSS Distributions 
241*33de042dSApple OSS Distributions #pragma mark p_wqptr
242*33de042dSApple OSS Distributions 
243*33de042dSApple OSS Distributions #define WQPTR_IS_INITING_VALUE ((struct workqueue *)~(uintptr_t)0)
244*33de042dSApple OSS Distributions 
245*33de042dSApple OSS Distributions static struct workqueue *
proc_get_wqptr_fast(struct proc * p)246*33de042dSApple OSS Distributions proc_get_wqptr_fast(struct proc *p)
247*33de042dSApple OSS Distributions {
248*33de042dSApple OSS Distributions 	return os_atomic_load(&p->p_wqptr, relaxed);
249*33de042dSApple OSS Distributions }
250*33de042dSApple OSS Distributions 
251*33de042dSApple OSS Distributions struct workqueue *
proc_get_wqptr(struct proc * p)252*33de042dSApple OSS Distributions proc_get_wqptr(struct proc *p)
253*33de042dSApple OSS Distributions {
254*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
255*33de042dSApple OSS Distributions 	return wq == WQPTR_IS_INITING_VALUE ? NULL : wq;
256*33de042dSApple OSS Distributions }
257*33de042dSApple OSS Distributions 
258*33de042dSApple OSS Distributions static void
proc_set_wqptr(struct proc * p,struct workqueue * wq)259*33de042dSApple OSS Distributions proc_set_wqptr(struct proc *p, struct workqueue *wq)
260*33de042dSApple OSS Distributions {
261*33de042dSApple OSS Distributions 	wq = os_atomic_xchg(&p->p_wqptr, wq, release);
262*33de042dSApple OSS Distributions 	if (wq == WQPTR_IS_INITING_VALUE) {
263*33de042dSApple OSS Distributions 		proc_lock(p);
264*33de042dSApple OSS Distributions 		thread_wakeup(&p->p_wqptr);
265*33de042dSApple OSS Distributions 		proc_unlock(p);
266*33de042dSApple OSS Distributions 	}
267*33de042dSApple OSS Distributions }
268*33de042dSApple OSS Distributions 
269*33de042dSApple OSS Distributions static bool
proc_init_wqptr_or_wait(struct proc * p)270*33de042dSApple OSS Distributions proc_init_wqptr_or_wait(struct proc *p)
271*33de042dSApple OSS Distributions {
272*33de042dSApple OSS Distributions 	struct workqueue *wq;
273*33de042dSApple OSS Distributions 
274*33de042dSApple OSS Distributions 	proc_lock(p);
275*33de042dSApple OSS Distributions 	wq = os_atomic_load(&p->p_wqptr, relaxed);
276*33de042dSApple OSS Distributions 
277*33de042dSApple OSS Distributions 	if (wq == NULL) {
278*33de042dSApple OSS Distributions 		os_atomic_store(&p->p_wqptr, WQPTR_IS_INITING_VALUE, relaxed);
279*33de042dSApple OSS Distributions 		proc_unlock(p);
280*33de042dSApple OSS Distributions 		return true;
281*33de042dSApple OSS Distributions 	}
282*33de042dSApple OSS Distributions 
283*33de042dSApple OSS Distributions 	if (wq == WQPTR_IS_INITING_VALUE) {
284*33de042dSApple OSS Distributions 		assert_wait(&p->p_wqptr, THREAD_UNINT);
285*33de042dSApple OSS Distributions 		proc_unlock(p);
286*33de042dSApple OSS Distributions 		thread_block(THREAD_CONTINUE_NULL);
287*33de042dSApple OSS Distributions 	} else {
288*33de042dSApple OSS Distributions 		proc_unlock(p);
289*33de042dSApple OSS Distributions 	}
290*33de042dSApple OSS Distributions 	return false;
291*33de042dSApple OSS Distributions }
292*33de042dSApple OSS Distributions 
293*33de042dSApple OSS Distributions static inline event_t
workq_parked_wait_event(struct uthread * uth)294*33de042dSApple OSS Distributions workq_parked_wait_event(struct uthread *uth)
295*33de042dSApple OSS Distributions {
296*33de042dSApple OSS Distributions 	return (event_t)&uth->uu_workq_stackaddr;
297*33de042dSApple OSS Distributions }
298*33de042dSApple OSS Distributions 
299*33de042dSApple OSS Distributions static inline void
workq_thread_wakeup(struct uthread * uth)300*33de042dSApple OSS Distributions workq_thread_wakeup(struct uthread *uth)
301*33de042dSApple OSS Distributions {
302*33de042dSApple OSS Distributions 	thread_wakeup_thread(workq_parked_wait_event(uth), get_machthread(uth));
303*33de042dSApple OSS Distributions }
304*33de042dSApple OSS Distributions 
305*33de042dSApple OSS Distributions #pragma mark wq_thactive
306*33de042dSApple OSS Distributions 
307*33de042dSApple OSS Distributions #if defined(__LP64__)
308*33de042dSApple OSS Distributions // Layout is:
309*33de042dSApple OSS Distributions //   127 - 115 : 13 bits of zeroes
310*33de042dSApple OSS Distributions //   114 - 112 : best QoS among all pending constrained requests
311*33de042dSApple OSS Distributions //   111 -   0 : MGR, AUI, UI, IN, DF, UT, BG+MT buckets every 16 bits
312*33de042dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_WIDTH 16
313*33de042dSApple OSS Distributions #define WQ_THACTIVE_QOS_SHIFT    (7 * WQ_THACTIVE_BUCKET_WIDTH)
314*33de042dSApple OSS Distributions #else
315*33de042dSApple OSS Distributions // Layout is:
316*33de042dSApple OSS Distributions //   63 - 61 : best QoS among all pending constrained requests
317*33de042dSApple OSS Distributions //   60      : Manager bucket (0 or 1)
318*33de042dSApple OSS Distributions //   59 -  0 : AUI, UI, IN, DF, UT, BG+MT buckets every 10 bits
319*33de042dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_WIDTH 10
320*33de042dSApple OSS Distributions #define WQ_THACTIVE_QOS_SHIFT    (6 * WQ_THACTIVE_BUCKET_WIDTH + 1)
321*33de042dSApple OSS Distributions #endif
322*33de042dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_MASK  ((1U << WQ_THACTIVE_BUCKET_WIDTH) - 1)
323*33de042dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_HALF  (1U << (WQ_THACTIVE_BUCKET_WIDTH - 1))
324*33de042dSApple OSS Distributions 
325*33de042dSApple OSS Distributions static_assert(sizeof(wq_thactive_t) * CHAR_BIT - WQ_THACTIVE_QOS_SHIFT >= 3,
326*33de042dSApple OSS Distributions     "Make sure we have space to encode a QoS");
327*33de042dSApple OSS Distributions 
328*33de042dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive(struct workqueue * wq)329*33de042dSApple OSS Distributions _wq_thactive(struct workqueue *wq)
330*33de042dSApple OSS Distributions {
331*33de042dSApple OSS Distributions 	return os_atomic_load_wide(&wq->wq_thactive, relaxed);
332*33de042dSApple OSS Distributions }
333*33de042dSApple OSS Distributions 
334*33de042dSApple OSS Distributions static inline uint8_t
_wq_bucket(thread_qos_t qos)335*33de042dSApple OSS Distributions _wq_bucket(thread_qos_t qos)
336*33de042dSApple OSS Distributions {
337*33de042dSApple OSS Distributions 	// Map both BG and MT to the same bucket by over-shifting down and
338*33de042dSApple OSS Distributions 	// clamping MT and BG together.
339*33de042dSApple OSS Distributions 	switch (qos) {
340*33de042dSApple OSS Distributions 	case THREAD_QOS_MAINTENANCE:
341*33de042dSApple OSS Distributions 		return 0;
342*33de042dSApple OSS Distributions 	default:
343*33de042dSApple OSS Distributions 		return qos - 2;
344*33de042dSApple OSS Distributions 	}
345*33de042dSApple OSS Distributions }
346*33de042dSApple OSS Distributions 
347*33de042dSApple OSS Distributions #define WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(tha) \
348*33de042dSApple OSS Distributions 	        ((thread_qos_t)((tha) >> WQ_THACTIVE_QOS_SHIFT))
349*33de042dSApple OSS Distributions 
350*33de042dSApple OSS Distributions static inline thread_qos_t
_wq_thactive_best_constrained_req_qos(struct workqueue * wq)351*33de042dSApple OSS Distributions _wq_thactive_best_constrained_req_qos(struct workqueue *wq)
352*33de042dSApple OSS Distributions {
353*33de042dSApple OSS Distributions 	// Avoid expensive atomic operations: the three bits we're loading are in
354*33de042dSApple OSS Distributions 	// a single byte, and always updated under the workqueue lock
355*33de042dSApple OSS Distributions 	wq_thactive_t v = *(wq_thactive_t *)&wq->wq_thactive;
356*33de042dSApple OSS Distributions 	return WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(v);
357*33de042dSApple OSS Distributions }
358*33de042dSApple OSS Distributions 
359*33de042dSApple OSS Distributions static void
_wq_thactive_refresh_best_constrained_req_qos(struct workqueue * wq)360*33de042dSApple OSS Distributions _wq_thactive_refresh_best_constrained_req_qos(struct workqueue *wq)
361*33de042dSApple OSS Distributions {
362*33de042dSApple OSS Distributions 	thread_qos_t old_qos, new_qos;
363*33de042dSApple OSS Distributions 	workq_threadreq_t req;
364*33de042dSApple OSS Distributions 
365*33de042dSApple OSS Distributions 	req = priority_queue_max(&wq->wq_constrained_queue,
366*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
367*33de042dSApple OSS Distributions 	new_qos = req ? req->tr_qos : THREAD_QOS_UNSPECIFIED;
368*33de042dSApple OSS Distributions 	old_qos = _wq_thactive_best_constrained_req_qos(wq);
369*33de042dSApple OSS Distributions 	if (old_qos != new_qos) {
370*33de042dSApple OSS Distributions 		long delta = (long)new_qos - (long)old_qos;
371*33de042dSApple OSS Distributions 		wq_thactive_t v = (wq_thactive_t)delta << WQ_THACTIVE_QOS_SHIFT;
372*33de042dSApple OSS Distributions 		/*
373*33de042dSApple OSS Distributions 		 * We can do an atomic add relative to the initial load because updates
374*33de042dSApple OSS Distributions 		 * to this qos are always serialized under the workqueue lock.
375*33de042dSApple OSS Distributions 		 */
376*33de042dSApple OSS Distributions 		v = os_atomic_add(&wq->wq_thactive, v, relaxed);
377*33de042dSApple OSS Distributions #ifdef __LP64__
378*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thactive_update, wq, (uint64_t)v,
379*33de042dSApple OSS Distributions 		    (uint64_t)(v >> 64), 0);
380*33de042dSApple OSS Distributions #else
381*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thactive_update, wq, v, 0, 0);
382*33de042dSApple OSS Distributions #endif
383*33de042dSApple OSS Distributions 	}
384*33de042dSApple OSS Distributions }
385*33de042dSApple OSS Distributions 
386*33de042dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive_offset_for_qos(thread_qos_t qos)387*33de042dSApple OSS Distributions _wq_thactive_offset_for_qos(thread_qos_t qos)
388*33de042dSApple OSS Distributions {
389*33de042dSApple OSS Distributions 	uint8_t bucket = _wq_bucket(qos);
390*33de042dSApple OSS Distributions 	__builtin_assume(bucket < WORKQ_NUM_BUCKETS);
391*33de042dSApple OSS Distributions 	return (wq_thactive_t)1 << (bucket * WQ_THACTIVE_BUCKET_WIDTH);
392*33de042dSApple OSS Distributions }
393*33de042dSApple OSS Distributions 
394*33de042dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive_inc(struct workqueue * wq,thread_qos_t qos)395*33de042dSApple OSS Distributions _wq_thactive_inc(struct workqueue *wq, thread_qos_t qos)
396*33de042dSApple OSS Distributions {
397*33de042dSApple OSS Distributions 	wq_thactive_t v = _wq_thactive_offset_for_qos(qos);
398*33de042dSApple OSS Distributions 	return os_atomic_add_orig(&wq->wq_thactive, v, relaxed);
399*33de042dSApple OSS Distributions }
400*33de042dSApple OSS Distributions 
401*33de042dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive_dec(struct workqueue * wq,thread_qos_t qos)402*33de042dSApple OSS Distributions _wq_thactive_dec(struct workqueue *wq, thread_qos_t qos)
403*33de042dSApple OSS Distributions {
404*33de042dSApple OSS Distributions 	wq_thactive_t v = _wq_thactive_offset_for_qos(qos);
405*33de042dSApple OSS Distributions 	return os_atomic_sub_orig(&wq->wq_thactive, v, relaxed);
406*33de042dSApple OSS Distributions }
407*33de042dSApple OSS Distributions 
408*33de042dSApple OSS Distributions static inline void
_wq_thactive_move(struct workqueue * wq,thread_qos_t old_qos,thread_qos_t new_qos)409*33de042dSApple OSS Distributions _wq_thactive_move(struct workqueue *wq,
410*33de042dSApple OSS Distributions     thread_qos_t old_qos, thread_qos_t new_qos)
411*33de042dSApple OSS Distributions {
412*33de042dSApple OSS Distributions 	wq_thactive_t v = _wq_thactive_offset_for_qos(new_qos) -
413*33de042dSApple OSS Distributions 	    _wq_thactive_offset_for_qos(old_qos);
414*33de042dSApple OSS Distributions 	os_atomic_add(&wq->wq_thactive, v, relaxed);
415*33de042dSApple OSS Distributions 	wq->wq_thscheduled_count[_wq_bucket(old_qos)]--;
416*33de042dSApple OSS Distributions 	wq->wq_thscheduled_count[_wq_bucket(new_qos)]++;
417*33de042dSApple OSS Distributions }
418*33de042dSApple OSS Distributions 
419*33de042dSApple OSS Distributions static inline uint32_t
_wq_thactive_aggregate_downto_qos(struct workqueue * wq,wq_thactive_t v,thread_qos_t qos,uint32_t * busycount,uint32_t * max_busycount)420*33de042dSApple OSS Distributions _wq_thactive_aggregate_downto_qos(struct workqueue *wq, wq_thactive_t v,
421*33de042dSApple OSS Distributions     thread_qos_t qos, uint32_t *busycount, uint32_t *max_busycount)
422*33de042dSApple OSS Distributions {
423*33de042dSApple OSS Distributions 	uint32_t count = 0, active;
424*33de042dSApple OSS Distributions 	uint64_t curtime;
425*33de042dSApple OSS Distributions 
426*33de042dSApple OSS Distributions 	assert(WORKQ_THREAD_QOS_MIN <= qos && qos <= WORKQ_THREAD_QOS_MAX);
427*33de042dSApple OSS Distributions 
428*33de042dSApple OSS Distributions 	if (busycount) {
429*33de042dSApple OSS Distributions 		curtime = mach_absolute_time();
430*33de042dSApple OSS Distributions 		*busycount = 0;
431*33de042dSApple OSS Distributions 	}
432*33de042dSApple OSS Distributions 	if (max_busycount) {
433*33de042dSApple OSS Distributions 		*max_busycount = THREAD_QOS_LAST - qos;
434*33de042dSApple OSS Distributions 	}
435*33de042dSApple OSS Distributions 
436*33de042dSApple OSS Distributions 	uint8_t i = _wq_bucket(qos);
437*33de042dSApple OSS Distributions 	v >>= i * WQ_THACTIVE_BUCKET_WIDTH;
438*33de042dSApple OSS Distributions 	for (; i < WORKQ_NUM_QOS_BUCKETS; i++, v >>= WQ_THACTIVE_BUCKET_WIDTH) {
439*33de042dSApple OSS Distributions 		active = v & WQ_THACTIVE_BUCKET_MASK;
440*33de042dSApple OSS Distributions 		count += active;
441*33de042dSApple OSS Distributions 
442*33de042dSApple OSS Distributions 		if (busycount && wq->wq_thscheduled_count[i] > active) {
443*33de042dSApple OSS Distributions 			if (workq_thread_is_busy(curtime, &wq->wq_lastblocked_ts[i])) {
444*33de042dSApple OSS Distributions 				/*
445*33de042dSApple OSS Distributions 				 * We only consider the last blocked thread for a given bucket
446*33de042dSApple OSS Distributions 				 * as busy because we don't want to take the list lock in each
447*33de042dSApple OSS Distributions 				 * sched callback. However this is an approximation that could
448*33de042dSApple OSS Distributions 				 * contribute to thread creation storms.
449*33de042dSApple OSS Distributions 				 */
450*33de042dSApple OSS Distributions 				(*busycount)++;
451*33de042dSApple OSS Distributions 			}
452*33de042dSApple OSS Distributions 		}
453*33de042dSApple OSS Distributions 	}
454*33de042dSApple OSS Distributions 
455*33de042dSApple OSS Distributions 	return count;
456*33de042dSApple OSS Distributions }
457*33de042dSApple OSS Distributions 
458*33de042dSApple OSS Distributions /* The input qos here should be the requested QoS of the thread, not accounting
459*33de042dSApple OSS Distributions  * for any overrides */
460*33de042dSApple OSS Distributions static inline void
_wq_cooperative_queue_scheduled_count_dec(struct workqueue * wq,thread_qos_t qos)461*33de042dSApple OSS Distributions _wq_cooperative_queue_scheduled_count_dec(struct workqueue *wq, thread_qos_t qos)
462*33de042dSApple OSS Distributions {
463*33de042dSApple OSS Distributions 	__assert_only uint8_t old_scheduled_count = wq->wq_cooperative_queue_scheduled_count[_wq_bucket(qos)]--;
464*33de042dSApple OSS Distributions 	assert(old_scheduled_count > 0);
465*33de042dSApple OSS Distributions }
466*33de042dSApple OSS Distributions 
467*33de042dSApple OSS Distributions /* The input qos here should be the requested QoS of the thread, not accounting
468*33de042dSApple OSS Distributions  * for any overrides */
469*33de042dSApple OSS Distributions static inline void
_wq_cooperative_queue_scheduled_count_inc(struct workqueue * wq,thread_qos_t qos)470*33de042dSApple OSS Distributions _wq_cooperative_queue_scheduled_count_inc(struct workqueue *wq, thread_qos_t qos)
471*33de042dSApple OSS Distributions {
472*33de042dSApple OSS Distributions 	__assert_only uint8_t old_scheduled_count = wq->wq_cooperative_queue_scheduled_count[_wq_bucket(qos)]++;
473*33de042dSApple OSS Distributions 	assert(old_scheduled_count < UINT8_MAX);
474*33de042dSApple OSS Distributions }
475*33de042dSApple OSS Distributions 
476*33de042dSApple OSS Distributions #pragma mark wq_flags
477*33de042dSApple OSS Distributions 
478*33de042dSApple OSS Distributions static inline uint32_t
_wq_flags(struct workqueue * wq)479*33de042dSApple OSS Distributions _wq_flags(struct workqueue *wq)
480*33de042dSApple OSS Distributions {
481*33de042dSApple OSS Distributions 	return os_atomic_load(&wq->wq_flags, relaxed);
482*33de042dSApple OSS Distributions }
483*33de042dSApple OSS Distributions 
484*33de042dSApple OSS Distributions static inline bool
_wq_exiting(struct workqueue * wq)485*33de042dSApple OSS Distributions _wq_exiting(struct workqueue *wq)
486*33de042dSApple OSS Distributions {
487*33de042dSApple OSS Distributions 	return _wq_flags(wq) & WQ_EXITING;
488*33de042dSApple OSS Distributions }
489*33de042dSApple OSS Distributions 
/*
 * Returns true when process `p` has no workqueue, or when its workqueue has
 * WQ_EXITING set.
 */
bool
workq_is_exiting(struct proc *p)
{
	struct workqueue *wq = proc_get_wqptr(p);

	if (wq == NULL) {
		return true;
	}
	return _wq_exiting(wq);
}
496*33de042dSApple OSS Distributions 
497*33de042dSApple OSS Distributions 
498*33de042dSApple OSS Distributions #pragma mark workqueue lock
499*33de042dSApple OSS Distributions 
500*33de042dSApple OSS Distributions static bool
workq_lock_is_acquired_kdp(struct workqueue * wq)501*33de042dSApple OSS Distributions workq_lock_is_acquired_kdp(struct workqueue *wq)
502*33de042dSApple OSS Distributions {
503*33de042dSApple OSS Distributions 	return kdp_lck_ticket_is_acquired(&wq->wq_lock);
504*33de042dSApple OSS Distributions }
505*33de042dSApple OSS Distributions 
506*33de042dSApple OSS Distributions static inline void
workq_lock_spin(struct workqueue * wq)507*33de042dSApple OSS Distributions workq_lock_spin(struct workqueue *wq)
508*33de042dSApple OSS Distributions {
509*33de042dSApple OSS Distributions 	lck_ticket_lock(&wq->wq_lock, &workq_lck_grp);
510*33de042dSApple OSS Distributions }
511*33de042dSApple OSS Distributions 
512*33de042dSApple OSS Distributions static inline void
workq_lock_held(struct workqueue * wq)513*33de042dSApple OSS Distributions workq_lock_held(struct workqueue *wq)
514*33de042dSApple OSS Distributions {
515*33de042dSApple OSS Distributions 	LCK_TICKET_ASSERT_OWNED(&wq->wq_lock);
516*33de042dSApple OSS Distributions }
517*33de042dSApple OSS Distributions 
518*33de042dSApple OSS Distributions static inline bool
workq_lock_try(struct workqueue * wq)519*33de042dSApple OSS Distributions workq_lock_try(struct workqueue *wq)
520*33de042dSApple OSS Distributions {
521*33de042dSApple OSS Distributions 	return lck_ticket_lock_try(&wq->wq_lock, &workq_lck_grp);
522*33de042dSApple OSS Distributions }
523*33de042dSApple OSS Distributions 
524*33de042dSApple OSS Distributions static inline void
workq_unlock(struct workqueue * wq)525*33de042dSApple OSS Distributions workq_unlock(struct workqueue *wq)
526*33de042dSApple OSS Distributions {
527*33de042dSApple OSS Distributions 	lck_ticket_unlock(&wq->wq_lock);
528*33de042dSApple OSS Distributions }
529*33de042dSApple OSS Distributions 
530*33de042dSApple OSS Distributions #pragma mark idle thread lists
531*33de042dSApple OSS Distributions 
/*
 * Builds a struct uu_workq_policy compound literal whose requested QoS and
 * bucket are both `qos`; members not named here are zero-initialized.
 */
#define WORKQ_POLICY_INIT(qos) \
	        (struct uu_workq_policy){ .qos_req = (qos), .qos_bucket = (qos) }
534*33de042dSApple OSS Distributions 
535*33de042dSApple OSS Distributions static inline thread_qos_t
workq_pri_bucket(struct uu_workq_policy req)536*33de042dSApple OSS Distributions workq_pri_bucket(struct uu_workq_policy req)
537*33de042dSApple OSS Distributions {
538*33de042dSApple OSS Distributions 	return MAX(MAX(req.qos_req, req.qos_max), req.qos_override);
539*33de042dSApple OSS Distributions }
540*33de042dSApple OSS Distributions 
541*33de042dSApple OSS Distributions static inline thread_qos_t
workq_pri_override(struct uu_workq_policy req)542*33de042dSApple OSS Distributions workq_pri_override(struct uu_workq_policy req)
543*33de042dSApple OSS Distributions {
544*33de042dSApple OSS Distributions 	return MAX(workq_pri_bucket(req), req.qos_bucket);
545*33de042dSApple OSS Distributions }
546*33de042dSApple OSS Distributions 
547*33de042dSApple OSS Distributions static inline bool
workq_thread_needs_params_change(workq_threadreq_t req,struct uthread * uth)548*33de042dSApple OSS Distributions workq_thread_needs_params_change(workq_threadreq_t req, struct uthread *uth)
549*33de042dSApple OSS Distributions {
550*33de042dSApple OSS Distributions 	workq_threadreq_param_t cur_trp, req_trp = { };
551*33de042dSApple OSS Distributions 
552*33de042dSApple OSS Distributions 	cur_trp.trp_value = uth->uu_save.uus_workq_park_data.workloop_params;
553*33de042dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS) {
554*33de042dSApple OSS Distributions 		req_trp = kqueue_threadreq_workloop_param(req);
555*33de042dSApple OSS Distributions 	}
556*33de042dSApple OSS Distributions 
557*33de042dSApple OSS Distributions 	/*
558*33de042dSApple OSS Distributions 	 * CPU percent flags are handled separately to policy changes, so ignore
559*33de042dSApple OSS Distributions 	 * them for all of these checks.
560*33de042dSApple OSS Distributions 	 */
561*33de042dSApple OSS Distributions 	uint16_t cur_flags = (cur_trp.trp_flags & ~TRP_CPUPERCENT);
562*33de042dSApple OSS Distributions 	uint16_t req_flags = (req_trp.trp_flags & ~TRP_CPUPERCENT);
563*33de042dSApple OSS Distributions 
564*33de042dSApple OSS Distributions 	if (!req_flags && !cur_flags) {
565*33de042dSApple OSS Distributions 		return false;
566*33de042dSApple OSS Distributions 	}
567*33de042dSApple OSS Distributions 
568*33de042dSApple OSS Distributions 	if (req_flags != cur_flags) {
569*33de042dSApple OSS Distributions 		return true;
570*33de042dSApple OSS Distributions 	}
571*33de042dSApple OSS Distributions 
572*33de042dSApple OSS Distributions 	if ((req_flags & TRP_PRIORITY) && req_trp.trp_pri != cur_trp.trp_pri) {
573*33de042dSApple OSS Distributions 		return true;
574*33de042dSApple OSS Distributions 	}
575*33de042dSApple OSS Distributions 
576*33de042dSApple OSS Distributions 	if ((req_flags & TRP_POLICY) && req_trp.trp_pol != cur_trp.trp_pol) {
577*33de042dSApple OSS Distributions 		return true;
578*33de042dSApple OSS Distributions 	}
579*33de042dSApple OSS Distributions 
580*33de042dSApple OSS Distributions 	return false;
581*33de042dSApple OSS Distributions }
582*33de042dSApple OSS Distributions 
583*33de042dSApple OSS Distributions static inline bool
workq_thread_needs_priority_change(workq_threadreq_t req,struct uthread * uth)584*33de042dSApple OSS Distributions workq_thread_needs_priority_change(workq_threadreq_t req, struct uthread *uth)
585*33de042dSApple OSS Distributions {
586*33de042dSApple OSS Distributions 	if (workq_thread_needs_params_change(req, uth)) {
587*33de042dSApple OSS Distributions 		return true;
588*33de042dSApple OSS Distributions 	}
589*33de042dSApple OSS Distributions 
590*33de042dSApple OSS Distributions 	if (req->tr_qos != workq_pri_override(uth->uu_workq_pri)) {
591*33de042dSApple OSS Distributions 		return true;
592*33de042dSApple OSS Distributions 	}
593*33de042dSApple OSS Distributions 
594*33de042dSApple OSS Distributions #if CONFIG_PREADOPT_TG
595*33de042dSApple OSS Distributions 	thread_group_qos_t tg = kqr_preadopt_thread_group(req);
596*33de042dSApple OSS Distributions 	if (KQWL_HAS_VALID_PREADOPTED_TG(tg)) {
597*33de042dSApple OSS Distributions 		/*
598*33de042dSApple OSS Distributions 		 * Ideally, we'd add check here to see if thread's preadopt TG is same
599*33de042dSApple OSS Distributions 		 * as the thread requests's thread group and short circuit if that is
600*33de042dSApple OSS Distributions 		 * the case. But in the interest of keeping the code clean and not
601*33de042dSApple OSS Distributions 		 * taking the thread lock here, we're going to skip this. We will
602*33de042dSApple OSS Distributions 		 * eventually shortcircuit once we try to set the preadoption thread
603*33de042dSApple OSS Distributions 		 * group on the thread.
604*33de042dSApple OSS Distributions 		 */
605*33de042dSApple OSS Distributions 		return true;
606*33de042dSApple OSS Distributions 	}
607*33de042dSApple OSS Distributions #endif
608*33de042dSApple OSS Distributions 
609*33de042dSApple OSS Distributions 	return false;
610*33de042dSApple OSS Distributions }
611*33de042dSApple OSS Distributions 
612*33de042dSApple OSS Distributions /* Input thread must be self. Called during self override, resetting overrides
613*33de042dSApple OSS Distributions  * or while processing kevents
614*33de042dSApple OSS Distributions  *
615*33de042dSApple OSS Distributions  * Called with workq lock held. Sometimes also the thread mutex
616*33de042dSApple OSS Distributions  */
617*33de042dSApple OSS Distributions static void
workq_thread_update_bucket(proc_t p,struct workqueue * wq,struct uthread * uth,struct uu_workq_policy old_pri,struct uu_workq_policy new_pri,bool force_run)618*33de042dSApple OSS Distributions workq_thread_update_bucket(proc_t p, struct workqueue *wq, struct uthread *uth,
619*33de042dSApple OSS Distributions     struct uu_workq_policy old_pri, struct uu_workq_policy new_pri,
620*33de042dSApple OSS Distributions     bool force_run)
621*33de042dSApple OSS Distributions {
622*33de042dSApple OSS Distributions 	assert(uth == current_uthread());
623*33de042dSApple OSS Distributions 
624*33de042dSApple OSS Distributions 	thread_qos_t old_bucket = old_pri.qos_bucket;
625*33de042dSApple OSS Distributions 	thread_qos_t new_bucket = workq_pri_bucket(new_pri);
626*33de042dSApple OSS Distributions 
627*33de042dSApple OSS Distributions 	if ((old_bucket != new_bucket) &&
628*33de042dSApple OSS Distributions 	    !workq_thread_is_permanently_bound(uth)) {
629*33de042dSApple OSS Distributions 		_wq_thactive_move(wq, old_bucket, new_bucket);
630*33de042dSApple OSS Distributions 	}
631*33de042dSApple OSS Distributions 
632*33de042dSApple OSS Distributions 	new_pri.qos_bucket = new_bucket;
633*33de042dSApple OSS Distributions 	uth->uu_workq_pri = new_pri;
634*33de042dSApple OSS Distributions 
635*33de042dSApple OSS Distributions 	if (old_pri.qos_override != new_pri.qos_override) {
636*33de042dSApple OSS Distributions 		thread_set_workq_override(get_machthread(uth), new_pri.qos_override);
637*33de042dSApple OSS Distributions 	}
638*33de042dSApple OSS Distributions 
639*33de042dSApple OSS Distributions 	if (wq->wq_reqcount &&
640*33de042dSApple OSS Distributions 	    !workq_thread_is_permanently_bound(uth) &&
641*33de042dSApple OSS Distributions 	    (old_bucket > new_bucket || force_run)) {
642*33de042dSApple OSS Distributions 		int flags = WORKQ_THREADREQ_CAN_CREATE_THREADS;
643*33de042dSApple OSS Distributions 		if (old_bucket > new_bucket) {
644*33de042dSApple OSS Distributions 			/*
645*33de042dSApple OSS Distributions 			 * When lowering our bucket, we may unblock a thread request,
646*33de042dSApple OSS Distributions 			 * but we can't drop our priority before we have evaluated
647*33de042dSApple OSS Distributions 			 * whether this is the case, and if we ever drop the workqueue lock
648*33de042dSApple OSS Distributions 			 * that would cause a priority inversion.
649*33de042dSApple OSS Distributions 			 *
650*33de042dSApple OSS Distributions 			 * We hence have to disallow thread creation in that case.
651*33de042dSApple OSS Distributions 			 */
652*33de042dSApple OSS Distributions 			flags = 0;
653*33de042dSApple OSS Distributions 		}
654*33de042dSApple OSS Distributions 		workq_schedule_creator(p, wq, flags);
655*33de042dSApple OSS Distributions 	}
656*33de042dSApple OSS Distributions }
657*33de042dSApple OSS Distributions 
658*33de042dSApple OSS Distributions /*
659*33de042dSApple OSS Distributions  * Sets/resets the cpu percent limits on the current thread. We can't set
660*33de042dSApple OSS Distributions  * these limits from outside of the current thread, so this function needs
661*33de042dSApple OSS Distributions  * to be called when we're executing on the intended
662*33de042dSApple OSS Distributions  */
663*33de042dSApple OSS Distributions static void
workq_thread_reset_cpupercent(workq_threadreq_t req,struct uthread * uth)664*33de042dSApple OSS Distributions workq_thread_reset_cpupercent(workq_threadreq_t req, struct uthread *uth)
665*33de042dSApple OSS Distributions {
666*33de042dSApple OSS Distributions 	assert(uth == current_uthread());
667*33de042dSApple OSS Distributions 	workq_threadreq_param_t trp = { };
668*33de042dSApple OSS Distributions 
669*33de042dSApple OSS Distributions 	if (req && (req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS)) {
670*33de042dSApple OSS Distributions 		trp = kqueue_threadreq_workloop_param(req);
671*33de042dSApple OSS Distributions 	}
672*33de042dSApple OSS Distributions 
673*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_CPUPERCENT) {
674*33de042dSApple OSS Distributions 		/*
675*33de042dSApple OSS Distributions 		 * Going through disable when we have an existing CPU percent limit
676*33de042dSApple OSS Distributions 		 * set will force the ledger to refill the token bucket of the current
677*33de042dSApple OSS Distributions 		 * thread. Removing any penalty applied by previous thread use.
678*33de042dSApple OSS Distributions 		 */
679*33de042dSApple OSS Distributions 		thread_set_cpulimit(THREAD_CPULIMIT_DISABLE, 0, 0);
680*33de042dSApple OSS Distributions 		uth->uu_workq_flags &= ~UT_WORKQ_CPUPERCENT;
681*33de042dSApple OSS Distributions 	}
682*33de042dSApple OSS Distributions 
683*33de042dSApple OSS Distributions 	if (trp.trp_flags & TRP_CPUPERCENT) {
684*33de042dSApple OSS Distributions 		thread_set_cpulimit(THREAD_CPULIMIT_BLOCK, trp.trp_cpupercent,
685*33de042dSApple OSS Distributions 		    (uint64_t)trp.trp_refillms * NSEC_PER_SEC);
686*33de042dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_CPUPERCENT;
687*33de042dSApple OSS Distributions 	}
688*33de042dSApple OSS Distributions }
689*33de042dSApple OSS Distributions 
690*33de042dSApple OSS Distributions /*
691*33de042dSApple OSS Distributions  * This function is always called with the workq lock, except for the
692*33de042dSApple OSS Distributions  * permanently bound workqueue thread, which instead requires the kqlock.
693*33de042dSApple OSS Distributions  * See locking model for bound thread's uu_workq_flags.
694*33de042dSApple OSS Distributions  */
695*33de042dSApple OSS Distributions static void
workq_thread_reset_pri(struct workqueue * wq,struct uthread * uth,workq_threadreq_t req,bool unpark)696*33de042dSApple OSS Distributions workq_thread_reset_pri(struct workqueue *wq, struct uthread *uth,
697*33de042dSApple OSS Distributions     workq_threadreq_t req, bool unpark)
698*33de042dSApple OSS Distributions {
699*33de042dSApple OSS Distributions 	thread_t th = get_machthread(uth);
700*33de042dSApple OSS Distributions 	thread_qos_t qos = req ? req->tr_qos : WORKQ_THREAD_QOS_CLEANUP;
701*33de042dSApple OSS Distributions 	workq_threadreq_param_t trp = { };
702*33de042dSApple OSS Distributions 	int priority = 31;
703*33de042dSApple OSS Distributions 	int policy = POLICY_TIMESHARE;
704*33de042dSApple OSS Distributions 
705*33de042dSApple OSS Distributions 	if (req && (req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS)) {
706*33de042dSApple OSS Distributions 		trp = kqueue_threadreq_workloop_param(req);
707*33de042dSApple OSS Distributions 	}
708*33de042dSApple OSS Distributions 
709*33de042dSApple OSS Distributions 	uth->uu_workq_pri = WORKQ_POLICY_INIT(qos);
710*33de042dSApple OSS Distributions 	uth->uu_workq_flags &= ~UT_WORKQ_OUTSIDE_QOS;
711*33de042dSApple OSS Distributions 
712*33de042dSApple OSS Distributions 	if (unpark) {
713*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.workloop_params = trp.trp_value;
714*33de042dSApple OSS Distributions 		// qos sent out to userspace (may differ from uu_workq_pri on param threads)
715*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.qos = qos;
716*33de042dSApple OSS Distributions 	}
717*33de042dSApple OSS Distributions 
718*33de042dSApple OSS Distributions 	if (qos == WORKQ_THREAD_QOS_MANAGER) {
719*33de042dSApple OSS Distributions 		uint32_t mgr_pri = wq->wq_event_manager_priority;
720*33de042dSApple OSS Distributions 		assert(trp.trp_value == 0); // manager qos and thread policy don't mix
721*33de042dSApple OSS Distributions 
722*33de042dSApple OSS Distributions 		if (_pthread_priority_has_sched_pri(mgr_pri)) {
723*33de042dSApple OSS Distributions 			mgr_pri &= _PTHREAD_PRIORITY_SCHED_PRI_MASK;
724*33de042dSApple OSS Distributions 			thread_set_workq_pri(th, THREAD_QOS_UNSPECIFIED, mgr_pri,
725*33de042dSApple OSS Distributions 			    POLICY_TIMESHARE);
726*33de042dSApple OSS Distributions 			return;
727*33de042dSApple OSS Distributions 		}
728*33de042dSApple OSS Distributions 
729*33de042dSApple OSS Distributions 		qos = _pthread_priority_thread_qos(mgr_pri);
730*33de042dSApple OSS Distributions 	} else {
731*33de042dSApple OSS Distributions 		if (trp.trp_flags & TRP_PRIORITY) {
732*33de042dSApple OSS Distributions 			qos = THREAD_QOS_UNSPECIFIED;
733*33de042dSApple OSS Distributions 			priority = trp.trp_pri;
734*33de042dSApple OSS Distributions 			uth->uu_workq_flags |= UT_WORKQ_OUTSIDE_QOS;
735*33de042dSApple OSS Distributions 		}
736*33de042dSApple OSS Distributions 
737*33de042dSApple OSS Distributions 		if (trp.trp_flags & TRP_POLICY) {
738*33de042dSApple OSS Distributions 			policy = trp.trp_pol;
739*33de042dSApple OSS Distributions 		}
740*33de042dSApple OSS Distributions 	}
741*33de042dSApple OSS Distributions 
742*33de042dSApple OSS Distributions #if CONFIG_PREADOPT_TG
743*33de042dSApple OSS Distributions 	if (req && (req->tr_flags & WORKQ_TR_FLAG_WORKLOOP)) {
744*33de042dSApple OSS Distributions 		/*
745*33de042dSApple OSS Distributions 		 * For kqwl permanently configured with a thread group, we can safely borrow
746*33de042dSApple OSS Distributions 		 * +1 ref from kqwl_preadopt_tg. A thread then takes additional +1 ref
747*33de042dSApple OSS Distributions 		 * for itself via thread_set_preadopt_thread_group.
748*33de042dSApple OSS Distributions 		 *
749*33de042dSApple OSS Distributions 		 * In all other cases, we cannot safely read and borrow the reference from the kqwl
750*33de042dSApple OSS Distributions 		 * since it can disappear from under us at any time due to the max-ing logic in
751*33de042dSApple OSS Distributions 		 * kqueue_set_preadopted_thread_group.
752*33de042dSApple OSS Distributions 		 *
753*33de042dSApple OSS Distributions 		 * As such, we do the following dance:
754*33de042dSApple OSS Distributions 		 *
755*33de042dSApple OSS Distributions 		 * 1) cmpxchng and steal the kqwl's preadopt thread group and leave
756*33de042dSApple OSS Distributions 		 * behind with (NULL + QoS). At this point, we have the reference
757*33de042dSApple OSS Distributions 		 * to the thread group from the kqwl.
758*33de042dSApple OSS Distributions 		 * 2) Have the thread set the preadoption thread group on itself.
759*33de042dSApple OSS Distributions 		 * 3) cmpxchng from (NULL + QoS) which we set earlier in (1), back to
760*33de042dSApple OSS Distributions 		 * thread_group + QoS. ie we try to give the reference back to the kqwl.
761*33de042dSApple OSS Distributions 		 * If we fail, that's because a higher QoS thread group was set on the
762*33de042dSApple OSS Distributions 		 * kqwl in kqueue_set_preadopted_thread_group in which case, we need to
763*33de042dSApple OSS Distributions 		 * go back to (1).
764*33de042dSApple OSS Distributions 		 */
765*33de042dSApple OSS Distributions 
766*33de042dSApple OSS Distributions 		_Atomic(struct thread_group *) * tg_loc = kqr_preadopt_thread_group_addr(req);
767*33de042dSApple OSS Distributions 
768*33de042dSApple OSS Distributions 		thread_group_qos_t old_tg, new_tg;
769*33de042dSApple OSS Distributions 		int ret = 0;
770*33de042dSApple OSS Distributions again:
771*33de042dSApple OSS Distributions 		ret = os_atomic_rmw_loop(tg_loc, old_tg, new_tg, relaxed, {
772*33de042dSApple OSS Distributions 			if ((!KQWL_HAS_VALID_PREADOPTED_TG(old_tg)) ||
773*33de042dSApple OSS Distributions 			KQWL_HAS_PERMANENT_PREADOPTED_TG(old_tg)) {
774*33de042dSApple OSS Distributions 			        os_atomic_rmw_loop_give_up(break);
775*33de042dSApple OSS Distributions 			}
776*33de042dSApple OSS Distributions 
777*33de042dSApple OSS Distributions 			/*
778*33de042dSApple OSS Distributions 			 * Leave the QoS behind - kqueue_set_preadopted_thread_group will
779*33de042dSApple OSS Distributions 			 * only modify it if there is a higher QoS thread group to attach
780*33de042dSApple OSS Distributions 			 */
781*33de042dSApple OSS Distributions 			new_tg = (thread_group_qos_t) ((uintptr_t) old_tg & KQWL_PREADOPT_TG_QOS_MASK);
782*33de042dSApple OSS Distributions 		});
783*33de042dSApple OSS Distributions 
784*33de042dSApple OSS Distributions 		if (ret) {
785*33de042dSApple OSS Distributions 			/*
786*33de042dSApple OSS Distributions 			 * We successfully took the ref from the kqwl so set it on the
787*33de042dSApple OSS Distributions 			 * thread now
788*33de042dSApple OSS Distributions 			 */
789*33de042dSApple OSS Distributions 			thread_set_preadopt_thread_group(th, KQWL_GET_PREADOPTED_TG(old_tg));
790*33de042dSApple OSS Distributions 
791*33de042dSApple OSS Distributions 			thread_group_qos_t thread_group_to_expect = new_tg;
792*33de042dSApple OSS Distributions 			thread_group_qos_t thread_group_to_set = old_tg;
793*33de042dSApple OSS Distributions 
794*33de042dSApple OSS Distributions 			os_atomic_rmw_loop(tg_loc, old_tg, new_tg, relaxed, {
795*33de042dSApple OSS Distributions 				if (old_tg != thread_group_to_expect) {
796*33de042dSApple OSS Distributions 				        /*
797*33de042dSApple OSS Distributions 				         * There was an intervening write to the kqwl_preadopt_tg,
798*33de042dSApple OSS Distributions 				         * and it has a higher QoS than what we are working with
799*33de042dSApple OSS Distributions 				         * here. Abandon our current adopted thread group and redo
800*33de042dSApple OSS Distributions 				         * the full dance
801*33de042dSApple OSS Distributions 				         */
802*33de042dSApple OSS Distributions 				        thread_group_deallocate_safe(KQWL_GET_PREADOPTED_TG(thread_group_to_set));
803*33de042dSApple OSS Distributions 				        os_atomic_rmw_loop_give_up(goto again);
804*33de042dSApple OSS Distributions 				}
805*33de042dSApple OSS Distributions 
806*33de042dSApple OSS Distributions 				new_tg = thread_group_to_set;
807*33de042dSApple OSS Distributions 			});
808*33de042dSApple OSS Distributions 		} else {
809*33de042dSApple OSS Distributions 			if (KQWL_HAS_PERMANENT_PREADOPTED_TG(old_tg)) {
810*33de042dSApple OSS Distributions 				thread_set_preadopt_thread_group(th, KQWL_GET_PREADOPTED_TG(old_tg));
811*33de042dSApple OSS Distributions 			} else {
812*33de042dSApple OSS Distributions 				/* Nothing valid on the kqwl, just clear what's on the thread */
813*33de042dSApple OSS Distributions 				thread_set_preadopt_thread_group(th, NULL);
814*33de042dSApple OSS Distributions 			}
815*33de042dSApple OSS Distributions 		}
816*33de042dSApple OSS Distributions 	} else {
817*33de042dSApple OSS Distributions 		/* Not even a kqwl, clear what's on the thread */
818*33de042dSApple OSS Distributions 		thread_set_preadopt_thread_group(th, NULL);
819*33de042dSApple OSS Distributions 	}
820*33de042dSApple OSS Distributions #endif
821*33de042dSApple OSS Distributions 	thread_set_workq_pri(th, qos, priority, policy);
822*33de042dSApple OSS Distributions }
823*33de042dSApple OSS Distributions 
824*33de042dSApple OSS Distributions /*
825*33de042dSApple OSS Distributions  * Called by kevent with the NOTE_WL_THREAD_REQUEST knote lock held,
826*33de042dSApple OSS Distributions  * every time a servicer is being told about a new max QoS.
827*33de042dSApple OSS Distributions  */
828*33de042dSApple OSS Distributions void
workq_thread_set_max_qos(struct proc * p,workq_threadreq_t kqr)829*33de042dSApple OSS Distributions workq_thread_set_max_qos(struct proc *p, workq_threadreq_t kqr)
830*33de042dSApple OSS Distributions {
831*33de042dSApple OSS Distributions 	struct uu_workq_policy old_pri, new_pri;
832*33de042dSApple OSS Distributions 	struct uthread *uth = current_uthread();
833*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
834*33de042dSApple OSS Distributions 	thread_qos_t qos = kqr->tr_kq_qos_index;
835*33de042dSApple OSS Distributions 
836*33de042dSApple OSS Distributions 	if (uth->uu_workq_pri.qos_max == qos) {
837*33de042dSApple OSS Distributions 		return;
838*33de042dSApple OSS Distributions 	}
839*33de042dSApple OSS Distributions 
840*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
841*33de042dSApple OSS Distributions 	old_pri = new_pri = uth->uu_workq_pri;
842*33de042dSApple OSS Distributions 	new_pri.qos_max = qos;
843*33de042dSApple OSS Distributions 	workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, false);
844*33de042dSApple OSS Distributions 	workq_unlock(wq);
845*33de042dSApple OSS Distributions }
846*33de042dSApple OSS Distributions 
847*33de042dSApple OSS Distributions #pragma mark idle threads accounting and handling
848*33de042dSApple OSS Distributions 
849*33de042dSApple OSS Distributions static inline struct uthread *
workq_oldest_killable_idle_thread(struct workqueue * wq)850*33de042dSApple OSS Distributions workq_oldest_killable_idle_thread(struct workqueue *wq)
851*33de042dSApple OSS Distributions {
852*33de042dSApple OSS Distributions 	struct uthread *uth = TAILQ_LAST(&wq->wq_thidlelist, workq_uthread_head);
853*33de042dSApple OSS Distributions 
854*33de042dSApple OSS Distributions 	if (uth && !uth->uu_save.uus_workq_park_data.has_stack) {
855*33de042dSApple OSS Distributions 		uth = TAILQ_PREV(uth, workq_uthread_head, uu_workq_entry);
856*33de042dSApple OSS Distributions 		if (uth) {
857*33de042dSApple OSS Distributions 			assert(uth->uu_save.uus_workq_park_data.has_stack);
858*33de042dSApple OSS Distributions 		}
859*33de042dSApple OSS Distributions 	}
860*33de042dSApple OSS Distributions 	return uth;
861*33de042dSApple OSS Distributions }
862*33de042dSApple OSS Distributions 
863*33de042dSApple OSS Distributions static inline uint64_t
workq_kill_delay_for_idle_thread(struct workqueue * wq)864*33de042dSApple OSS Distributions workq_kill_delay_for_idle_thread(struct workqueue *wq)
865*33de042dSApple OSS Distributions {
866*33de042dSApple OSS Distributions 	uint64_t delay = wq_reduce_pool_window.abstime;
867*33de042dSApple OSS Distributions 	uint16_t idle = wq->wq_thidlecount;
868*33de042dSApple OSS Distributions 
869*33de042dSApple OSS Distributions 	/*
870*33de042dSApple OSS Distributions 	 * If we have less than wq_death_max_load threads, have a 5s timer.
871*33de042dSApple OSS Distributions 	 *
872*33de042dSApple OSS Distributions 	 * For the next wq_max_constrained_threads ones, decay linearly from
873*33de042dSApple OSS Distributions 	 * from 5s to 50ms.
874*33de042dSApple OSS Distributions 	 */
875*33de042dSApple OSS Distributions 	if (idle <= wq_death_max_load) {
876*33de042dSApple OSS Distributions 		return delay;
877*33de042dSApple OSS Distributions 	}
878*33de042dSApple OSS Distributions 
879*33de042dSApple OSS Distributions 	if (wq_max_constrained_threads > idle - wq_death_max_load) {
880*33de042dSApple OSS Distributions 		delay *= (wq_max_constrained_threads - (idle - wq_death_max_load));
881*33de042dSApple OSS Distributions 	}
882*33de042dSApple OSS Distributions 	return delay / wq_max_constrained_threads;
883*33de042dSApple OSS Distributions }
884*33de042dSApple OSS Distributions 
885*33de042dSApple OSS Distributions static inline bool
workq_should_kill_idle_thread(struct workqueue * wq,struct uthread * uth,uint64_t now)886*33de042dSApple OSS Distributions workq_should_kill_idle_thread(struct workqueue *wq, struct uthread *uth,
887*33de042dSApple OSS Distributions     uint64_t now)
888*33de042dSApple OSS Distributions {
889*33de042dSApple OSS Distributions 	uint64_t delay = workq_kill_delay_for_idle_thread(wq);
890*33de042dSApple OSS Distributions 	return now - uth->uu_save.uus_workq_park_data.idle_stamp > delay;
891*33de042dSApple OSS Distributions }
892*33de042dSApple OSS Distributions 
893*33de042dSApple OSS Distributions static void
workq_death_call_schedule(struct workqueue * wq,uint64_t deadline)894*33de042dSApple OSS Distributions workq_death_call_schedule(struct workqueue *wq, uint64_t deadline)
895*33de042dSApple OSS Distributions {
896*33de042dSApple OSS Distributions 	uint32_t wq_flags = os_atomic_load(&wq->wq_flags, relaxed);
897*33de042dSApple OSS Distributions 
898*33de042dSApple OSS Distributions 	if (wq_flags & (WQ_EXITING | WQ_DEATH_CALL_SCHEDULED)) {
899*33de042dSApple OSS Distributions 		return;
900*33de042dSApple OSS Distributions 	}
901*33de042dSApple OSS Distributions 	os_atomic_or(&wq->wq_flags, WQ_DEATH_CALL_SCHEDULED, relaxed);
902*33de042dSApple OSS Distributions 
903*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_death_call | DBG_FUNC_NONE, wq, 1, 0, 0);
904*33de042dSApple OSS Distributions 
905*33de042dSApple OSS Distributions 	/*
906*33de042dSApple OSS Distributions 	 * <rdar://problem/13139182> Due to how long term timers work, the leeway
907*33de042dSApple OSS Distributions 	 * can't be too short, so use 500ms which is long enough that we will not
908*33de042dSApple OSS Distributions 	 * wake up the CPU for killing threads, but short enough that it doesn't
909*33de042dSApple OSS Distributions 	 * fall into long-term timer list shenanigans.
910*33de042dSApple OSS Distributions 	 */
911*33de042dSApple OSS Distributions 	thread_call_enter_delayed_with_leeway(wq->wq_death_call, NULL, deadline,
912*33de042dSApple OSS Distributions 	    wq_reduce_pool_window.abstime / 10,
913*33de042dSApple OSS Distributions 	    THREAD_CALL_DELAY_LEEWAY | THREAD_CALL_DELAY_USER_BACKGROUND);
914*33de042dSApple OSS Distributions }
915*33de042dSApple OSS Distributions 
916*33de042dSApple OSS Distributions /*
917*33de042dSApple OSS Distributions  * `decrement` is set to the number of threads that are no longer dying:
918*33de042dSApple OSS Distributions  * - because they have been resuscitated just in time (workq_pop_idle_thread)
919*33de042dSApple OSS Distributions  * - or have been killed (workq_thread_terminate).
920*33de042dSApple OSS Distributions  */
921*33de042dSApple OSS Distributions static void
workq_death_policy_evaluate(struct workqueue * wq,uint16_t decrement)922*33de042dSApple OSS Distributions workq_death_policy_evaluate(struct workqueue *wq, uint16_t decrement)
923*33de042dSApple OSS Distributions {
924*33de042dSApple OSS Distributions 	struct uthread *uth;
925*33de042dSApple OSS Distributions 
926*33de042dSApple OSS Distributions 	assert(wq->wq_thdying_count >= decrement);
927*33de042dSApple OSS Distributions 	if ((wq->wq_thdying_count -= decrement) > 0) {
928*33de042dSApple OSS Distributions 		return;
929*33de042dSApple OSS Distributions 	}
930*33de042dSApple OSS Distributions 
931*33de042dSApple OSS Distributions 	if (wq->wq_thidlecount <= 1) {
932*33de042dSApple OSS Distributions 		return;
933*33de042dSApple OSS Distributions 	}
934*33de042dSApple OSS Distributions 
935*33de042dSApple OSS Distributions 	if ((uth = workq_oldest_killable_idle_thread(wq)) == NULL) {
936*33de042dSApple OSS Distributions 		return;
937*33de042dSApple OSS Distributions 	}
938*33de042dSApple OSS Distributions 
939*33de042dSApple OSS Distributions 	uint64_t now = mach_absolute_time();
940*33de042dSApple OSS Distributions 	uint64_t delay = workq_kill_delay_for_idle_thread(wq);
941*33de042dSApple OSS Distributions 
942*33de042dSApple OSS Distributions 	if (now - uth->uu_save.uus_workq_park_data.idle_stamp > delay) {
943*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_terminate | DBG_FUNC_START,
944*33de042dSApple OSS Distributions 		    wq, wq->wq_thidlecount, 0, 0);
945*33de042dSApple OSS Distributions 		wq->wq_thdying_count++;
946*33de042dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
947*33de042dSApple OSS Distributions 		if ((uth->uu_workq_flags & UT_WORKQ_IDLE_CLEANUP) == 0) {
948*33de042dSApple OSS Distributions 			workq_thread_wakeup(uth);
949*33de042dSApple OSS Distributions 		}
950*33de042dSApple OSS Distributions 		return;
951*33de042dSApple OSS Distributions 	}
952*33de042dSApple OSS Distributions 
953*33de042dSApple OSS Distributions 	workq_death_call_schedule(wq,
954*33de042dSApple OSS Distributions 	    uth->uu_save.uus_workq_park_data.idle_stamp + delay);
955*33de042dSApple OSS Distributions }
956*33de042dSApple OSS Distributions 
957*33de042dSApple OSS Distributions void
workq_thread_terminate(struct proc * p,struct uthread * uth)958*33de042dSApple OSS Distributions workq_thread_terminate(struct proc *p, struct uthread *uth)
959*33de042dSApple OSS Distributions {
960*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
961*33de042dSApple OSS Distributions 
962*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
963*33de042dSApple OSS Distributions 	if (!workq_thread_is_permanently_bound(uth)) {
964*33de042dSApple OSS Distributions 		TAILQ_REMOVE(&wq->wq_thrunlist, uth, uu_workq_entry);
965*33de042dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_DYING) {
966*33de042dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_thread_terminate | DBG_FUNC_END,
967*33de042dSApple OSS Distributions 			    wq, wq->wq_thidlecount, 0, 0);
968*33de042dSApple OSS Distributions 			workq_death_policy_evaluate(wq, 1);
969*33de042dSApple OSS Distributions 		}
970*33de042dSApple OSS Distributions 	}
971*33de042dSApple OSS Distributions 	if (wq->wq_nthreads-- == wq_max_threads) {
972*33de042dSApple OSS Distributions 		/*
973*33de042dSApple OSS Distributions 		 * We got under the thread limit again, which may have prevented
974*33de042dSApple OSS Distributions 		 * thread creation from happening, redrive if there are pending requests
975*33de042dSApple OSS Distributions 		 */
976*33de042dSApple OSS Distributions 		if (wq->wq_reqcount) {
977*33de042dSApple OSS Distributions 			workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
978*33de042dSApple OSS Distributions 		}
979*33de042dSApple OSS Distributions 	}
980*33de042dSApple OSS Distributions 	workq_unlock(wq);
981*33de042dSApple OSS Distributions 
982*33de042dSApple OSS Distributions 	thread_deallocate(get_machthread(uth));
983*33de042dSApple OSS Distributions }
984*33de042dSApple OSS Distributions 
985*33de042dSApple OSS Distributions static void
workq_kill_old_threads_call(void * param0,void * param1 __unused)986*33de042dSApple OSS Distributions workq_kill_old_threads_call(void *param0, void *param1 __unused)
987*33de042dSApple OSS Distributions {
988*33de042dSApple OSS Distributions 	struct workqueue *wq = param0;
989*33de042dSApple OSS Distributions 
990*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
991*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_death_call | DBG_FUNC_START, wq, 0, 0, 0);
992*33de042dSApple OSS Distributions 	os_atomic_andnot(&wq->wq_flags, WQ_DEATH_CALL_SCHEDULED, relaxed);
993*33de042dSApple OSS Distributions 	workq_death_policy_evaluate(wq, 0);
994*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_death_call | DBG_FUNC_END, wq, 0, 0, 0);
995*33de042dSApple OSS Distributions 	workq_unlock(wq);
996*33de042dSApple OSS Distributions }
997*33de042dSApple OSS Distributions 
998*33de042dSApple OSS Distributions static struct uthread *
workq_pop_idle_thread(struct workqueue * wq,uint16_t uu_flags,bool * needs_wakeup)999*33de042dSApple OSS Distributions workq_pop_idle_thread(struct workqueue *wq, uint16_t uu_flags,
1000*33de042dSApple OSS Distributions     bool *needs_wakeup)
1001*33de042dSApple OSS Distributions {
1002*33de042dSApple OSS Distributions 	struct uthread *uth;
1003*33de042dSApple OSS Distributions 
1004*33de042dSApple OSS Distributions 	if ((uth = TAILQ_FIRST(&wq->wq_thidlelist))) {
1005*33de042dSApple OSS Distributions 		TAILQ_REMOVE(&wq->wq_thidlelist, uth, uu_workq_entry);
1006*33de042dSApple OSS Distributions 	} else {
1007*33de042dSApple OSS Distributions 		uth = TAILQ_FIRST(&wq->wq_thnewlist);
1008*33de042dSApple OSS Distributions 		TAILQ_REMOVE(&wq->wq_thnewlist, uth, uu_workq_entry);
1009*33de042dSApple OSS Distributions 	}
1010*33de042dSApple OSS Distributions 	TAILQ_INSERT_TAIL(&wq->wq_thrunlist, uth, uu_workq_entry);
1011*33de042dSApple OSS Distributions 
1012*33de042dSApple OSS Distributions 	assert((uth->uu_workq_flags & UT_WORKQ_RUNNING) == 0);
1013*33de042dSApple OSS Distributions 	uth->uu_workq_flags |= UT_WORKQ_RUNNING | uu_flags;
1014*33de042dSApple OSS Distributions 
1015*33de042dSApple OSS Distributions 	/* A thread is never woken up as part of the cooperative pool */
1016*33de042dSApple OSS Distributions 	assert((uu_flags & UT_WORKQ_COOPERATIVE) == 0);
1017*33de042dSApple OSS Distributions 
1018*33de042dSApple OSS Distributions 	if ((uu_flags & UT_WORKQ_OVERCOMMIT) == 0) {
1019*33de042dSApple OSS Distributions 		wq->wq_constrained_threads_scheduled++;
1020*33de042dSApple OSS Distributions 	}
1021*33de042dSApple OSS Distributions 	wq->wq_threads_scheduled++;
1022*33de042dSApple OSS Distributions 	wq->wq_thidlecount--;
1023*33de042dSApple OSS Distributions 
1024*33de042dSApple OSS Distributions 	if (__improbable(uth->uu_workq_flags & UT_WORKQ_DYING)) {
1025*33de042dSApple OSS Distributions 		uth->uu_workq_flags ^= UT_WORKQ_DYING;
1026*33de042dSApple OSS Distributions 		workq_death_policy_evaluate(wq, 1);
1027*33de042dSApple OSS Distributions 		*needs_wakeup = false;
1028*33de042dSApple OSS Distributions 	} else if (uth->uu_workq_flags & UT_WORKQ_IDLE_CLEANUP) {
1029*33de042dSApple OSS Distributions 		*needs_wakeup = false;
1030*33de042dSApple OSS Distributions 	} else {
1031*33de042dSApple OSS Distributions 		*needs_wakeup = true;
1032*33de042dSApple OSS Distributions 	}
1033*33de042dSApple OSS Distributions 	return uth;
1034*33de042dSApple OSS Distributions }
1035*33de042dSApple OSS Distributions 
1036*33de042dSApple OSS Distributions /*
1037*33de042dSApple OSS Distributions  * Called by thread_create_workq_waiting() during thread initialization, before
1038*33de042dSApple OSS Distributions  * assert_wait, before the thread has been started.
1039*33de042dSApple OSS Distributions  */
1040*33de042dSApple OSS Distributions event_t
workq_thread_init_and_wq_lock(task_t task,thread_t th)1041*33de042dSApple OSS Distributions workq_thread_init_and_wq_lock(task_t task, thread_t th)
1042*33de042dSApple OSS Distributions {
1043*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
1044*33de042dSApple OSS Distributions 
1045*33de042dSApple OSS Distributions 	uth->uu_workq_flags = UT_WORKQ_NEW;
1046*33de042dSApple OSS Distributions 	uth->uu_workq_pri = WORKQ_POLICY_INIT(THREAD_QOS_LEGACY);
1047*33de042dSApple OSS Distributions 	uth->uu_workq_thport = MACH_PORT_NULL;
1048*33de042dSApple OSS Distributions 	uth->uu_workq_stackaddr = 0;
1049*33de042dSApple OSS Distributions 	uth->uu_workq_pthread_kill_allowed = 0;
1050*33de042dSApple OSS Distributions 
1051*33de042dSApple OSS Distributions 	thread_set_tag(th, THREAD_TAG_PTHREAD | THREAD_TAG_WORKQUEUE);
1052*33de042dSApple OSS Distributions 	thread_reset_workq_qos(th, THREAD_QOS_LEGACY);
1053*33de042dSApple OSS Distributions 
1054*33de042dSApple OSS Distributions 	workq_lock_spin(proc_get_wqptr_fast(get_bsdtask_info(task)));
1055*33de042dSApple OSS Distributions 	return workq_parked_wait_event(uth);
1056*33de042dSApple OSS Distributions }
1057*33de042dSApple OSS Distributions 
1058*33de042dSApple OSS Distributions /**
1059*33de042dSApple OSS Distributions  * Try to add a new workqueue thread.
1060*33de042dSApple OSS Distributions  *
1061*33de042dSApple OSS Distributions  * - called with workq lock held
1062*33de042dSApple OSS Distributions  * - dropped and retaken around thread creation
1063*33de042dSApple OSS Distributions  * - return with workq lock held
1064*33de042dSApple OSS Distributions  */
1065*33de042dSApple OSS Distributions static kern_return_t
workq_add_new_idle_thread(proc_t p,struct workqueue * wq,thread_continue_t continuation,bool is_permanently_bound,thread_t * new_thread)1066*33de042dSApple OSS Distributions workq_add_new_idle_thread(
1067*33de042dSApple OSS Distributions 	proc_t             p,
1068*33de042dSApple OSS Distributions 	struct workqueue  *wq,
1069*33de042dSApple OSS Distributions 	thread_continue_t continuation,
1070*33de042dSApple OSS Distributions 	bool              is_permanently_bound,
1071*33de042dSApple OSS Distributions 	thread_t          *new_thread)
1072*33de042dSApple OSS Distributions {
1073*33de042dSApple OSS Distributions 	mach_vm_offset_t th_stackaddr;
1074*33de042dSApple OSS Distributions 	kern_return_t kret;
1075*33de042dSApple OSS Distributions 	thread_t th;
1076*33de042dSApple OSS Distributions 
1077*33de042dSApple OSS Distributions 	wq->wq_nthreads++;
1078*33de042dSApple OSS Distributions 
1079*33de042dSApple OSS Distributions 	workq_unlock(wq);
1080*33de042dSApple OSS Distributions 
1081*33de042dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
1082*33de042dSApple OSS Distributions 
1083*33de042dSApple OSS Distributions 	kret = pthread_functions->workq_create_threadstack(p, vmap, &th_stackaddr);
1084*33de042dSApple OSS Distributions 	if (kret != KERN_SUCCESS) {
1085*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_create_failed | DBG_FUNC_NONE, wq,
1086*33de042dSApple OSS Distributions 		    kret, 1, 0);
1087*33de042dSApple OSS Distributions 		goto out;
1088*33de042dSApple OSS Distributions 	}
1089*33de042dSApple OSS Distributions 
1090*33de042dSApple OSS Distributions 	kret = thread_create_workq_waiting(proc_task(p),
1091*33de042dSApple OSS Distributions 	    continuation,
1092*33de042dSApple OSS Distributions 	    &th,
1093*33de042dSApple OSS Distributions 	    is_permanently_bound);
1094*33de042dSApple OSS Distributions 	if (kret != KERN_SUCCESS) {
1095*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_create_failed | DBG_FUNC_NONE, wq,
1096*33de042dSApple OSS Distributions 		    kret, 0, 0);
1097*33de042dSApple OSS Distributions 		pthread_functions->workq_destroy_threadstack(p, vmap, th_stackaddr);
1098*33de042dSApple OSS Distributions 		goto out;
1099*33de042dSApple OSS Distributions 	}
1100*33de042dSApple OSS Distributions 
1101*33de042dSApple OSS Distributions 	// thread_create_workq_waiting() will return with the wq lock held
1102*33de042dSApple OSS Distributions 	// on success, because it calls workq_thread_init_and_wq_lock() above
1103*33de042dSApple OSS Distributions 
1104*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
1105*33de042dSApple OSS Distributions 	uth->uu_workq_stackaddr = (user_addr_t)th_stackaddr;
1106*33de042dSApple OSS Distributions 
1107*33de042dSApple OSS Distributions 	wq->wq_creations++;
1108*33de042dSApple OSS Distributions 	if (!is_permanently_bound) {
1109*33de042dSApple OSS Distributions 		wq->wq_thidlecount++;
1110*33de042dSApple OSS Distributions 		TAILQ_INSERT_TAIL(&wq->wq_thnewlist, uth, uu_workq_entry);
1111*33de042dSApple OSS Distributions 	}
1112*33de042dSApple OSS Distributions 
1113*33de042dSApple OSS Distributions 	if (new_thread) {
1114*33de042dSApple OSS Distributions 		*new_thread = th;
1115*33de042dSApple OSS Distributions 	}
1116*33de042dSApple OSS Distributions 
1117*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_create | DBG_FUNC_NONE, wq, 0, 0, 0);
1118*33de042dSApple OSS Distributions 	return kret;
1119*33de042dSApple OSS Distributions 
1120*33de042dSApple OSS Distributions out:
1121*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
1122*33de042dSApple OSS Distributions 	/*
1123*33de042dSApple OSS Distributions 	 * Do not redrive here if we went under wq_max_threads again,
1124*33de042dSApple OSS Distributions 	 * it is the responsibility of the callers of this function
1125*33de042dSApple OSS Distributions 	 * to do so when it fails.
1126*33de042dSApple OSS Distributions 	 */
1127*33de042dSApple OSS Distributions 	wq->wq_nthreads--;
1128*33de042dSApple OSS Distributions 	return kret;
1129*33de042dSApple OSS Distributions }
1130*33de042dSApple OSS Distributions 
1131*33de042dSApple OSS Distributions static inline bool
workq_thread_is_overcommit(struct uthread * uth)1132*33de042dSApple OSS Distributions workq_thread_is_overcommit(struct uthread *uth)
1133*33de042dSApple OSS Distributions {
1134*33de042dSApple OSS Distributions 	return (uth->uu_workq_flags & UT_WORKQ_OVERCOMMIT) != 0;
1135*33de042dSApple OSS Distributions }
1136*33de042dSApple OSS Distributions 
1137*33de042dSApple OSS Distributions static inline bool
workq_thread_is_nonovercommit(struct uthread * uth)1138*33de042dSApple OSS Distributions workq_thread_is_nonovercommit(struct uthread *uth)
1139*33de042dSApple OSS Distributions {
1140*33de042dSApple OSS Distributions 	return (uth->uu_workq_flags & (UT_WORKQ_OVERCOMMIT |
1141*33de042dSApple OSS Distributions 	       UT_WORKQ_COOPERATIVE)) == 0;
1142*33de042dSApple OSS Distributions }
1143*33de042dSApple OSS Distributions 
1144*33de042dSApple OSS Distributions static inline bool
workq_thread_is_cooperative(struct uthread * uth)1145*33de042dSApple OSS Distributions workq_thread_is_cooperative(struct uthread *uth)
1146*33de042dSApple OSS Distributions {
1147*33de042dSApple OSS Distributions 	return (uth->uu_workq_flags & UT_WORKQ_COOPERATIVE) != 0;
1148*33de042dSApple OSS Distributions }
1149*33de042dSApple OSS Distributions 
1150*33de042dSApple OSS Distributions bool
workq_thread_is_permanently_bound(struct uthread * uth)1151*33de042dSApple OSS Distributions workq_thread_is_permanently_bound(struct uthread *uth)
1152*33de042dSApple OSS Distributions {
1153*33de042dSApple OSS Distributions 	return (uth->uu_workq_flags & UT_WORKQ_PERMANENT_BIND) != 0;
1154*33de042dSApple OSS Distributions }
1155*33de042dSApple OSS Distributions 
1156*33de042dSApple OSS Distributions static inline void
workq_thread_set_type(struct uthread * uth,uint16_t flags)1157*33de042dSApple OSS Distributions workq_thread_set_type(struct uthread *uth, uint16_t flags)
1158*33de042dSApple OSS Distributions {
1159*33de042dSApple OSS Distributions 	uth->uu_workq_flags &= ~(UT_WORKQ_OVERCOMMIT | UT_WORKQ_COOPERATIVE);
1160*33de042dSApple OSS Distributions 	uth->uu_workq_flags |= flags;
1161*33de042dSApple OSS Distributions }
1162*33de042dSApple OSS Distributions 
1163*33de042dSApple OSS Distributions 
1164*33de042dSApple OSS Distributions #define WORKQ_UNPARK_FOR_DEATH_WAS_IDLE 0x1
1165*33de042dSApple OSS Distributions 
1166*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
1167*33de042dSApple OSS Distributions static void
workq_unpark_for_death_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t death_flags,uint32_t setup_flags)1168*33de042dSApple OSS Distributions workq_unpark_for_death_and_unlock(proc_t p, struct workqueue *wq,
1169*33de042dSApple OSS Distributions     struct uthread *uth, uint32_t death_flags, uint32_t setup_flags)
1170*33de042dSApple OSS Distributions {
1171*33de042dSApple OSS Distributions 	thread_qos_t qos = workq_pri_override(uth->uu_workq_pri);
1172*33de042dSApple OSS Distributions 	bool first_use = uth->uu_workq_flags & UT_WORKQ_NEW;
1173*33de042dSApple OSS Distributions 
1174*33de042dSApple OSS Distributions 	if (qos > WORKQ_THREAD_QOS_CLEANUP) {
1175*33de042dSApple OSS Distributions 		workq_thread_reset_pri(wq, uth, NULL, /*unpark*/ true);
1176*33de042dSApple OSS Distributions 		qos = WORKQ_THREAD_QOS_CLEANUP;
1177*33de042dSApple OSS Distributions 	}
1178*33de042dSApple OSS Distributions 
1179*33de042dSApple OSS Distributions 	workq_thread_reset_cpupercent(NULL, uth);
1180*33de042dSApple OSS Distributions 
1181*33de042dSApple OSS Distributions 	if (death_flags & WORKQ_UNPARK_FOR_DEATH_WAS_IDLE) {
1182*33de042dSApple OSS Distributions 		wq->wq_thidlecount--;
1183*33de042dSApple OSS Distributions 		if (first_use) {
1184*33de042dSApple OSS Distributions 			TAILQ_REMOVE(&wq->wq_thnewlist, uth, uu_workq_entry);
1185*33de042dSApple OSS Distributions 		} else {
1186*33de042dSApple OSS Distributions 			TAILQ_REMOVE(&wq->wq_thidlelist, uth, uu_workq_entry);
1187*33de042dSApple OSS Distributions 		}
1188*33de042dSApple OSS Distributions 	}
1189*33de042dSApple OSS Distributions 	TAILQ_INSERT_TAIL(&wq->wq_thrunlist, uth, uu_workq_entry);
1190*33de042dSApple OSS Distributions 
1191*33de042dSApple OSS Distributions 	workq_unlock(wq);
1192*33de042dSApple OSS Distributions 
1193*33de042dSApple OSS Distributions 	if (setup_flags & WQ_SETUP_CLEAR_VOUCHER) {
1194*33de042dSApple OSS Distributions 		__assert_only kern_return_t kr;
1195*33de042dSApple OSS Distributions 		kr = thread_set_voucher_name(MACH_PORT_NULL);
1196*33de042dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
1197*33de042dSApple OSS Distributions 	}
1198*33de042dSApple OSS Distributions 
1199*33de042dSApple OSS Distributions 	uint32_t flags = WQ_FLAG_THREAD_NEWSPI | qos | WQ_FLAG_THREAD_PRIO_QOS;
1200*33de042dSApple OSS Distributions 	thread_t th = get_machthread(uth);
1201*33de042dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
1202*33de042dSApple OSS Distributions 
1203*33de042dSApple OSS Distributions 	if (!first_use) {
1204*33de042dSApple OSS Distributions 		flags |= WQ_FLAG_THREAD_REUSE;
1205*33de042dSApple OSS Distributions 	}
1206*33de042dSApple OSS Distributions 
1207*33de042dSApple OSS Distributions 	pthread_functions->workq_setup_thread(p, th, vmap, uth->uu_workq_stackaddr,
1208*33de042dSApple OSS Distributions 	    uth->uu_workq_thport, 0, WQ_SETUP_EXIT_THREAD, flags);
1209*33de042dSApple OSS Distributions 	__builtin_unreachable();
1210*33de042dSApple OSS Distributions }
1211*33de042dSApple OSS Distributions 
1212*33de042dSApple OSS Distributions bool
workq_is_current_thread_updating_turnstile(struct workqueue * wq)1213*33de042dSApple OSS Distributions workq_is_current_thread_updating_turnstile(struct workqueue *wq)
1214*33de042dSApple OSS Distributions {
1215*33de042dSApple OSS Distributions 	return wq->wq_turnstile_updater == current_thread();
1216*33de042dSApple OSS Distributions }
1217*33de042dSApple OSS Distributions 
1218*33de042dSApple OSS Distributions __attribute__((always_inline))
1219*33de042dSApple OSS Distributions static inline void
1220*33de042dSApple OSS Distributions workq_perform_turnstile_operation_locked(struct workqueue *wq,
1221*33de042dSApple OSS Distributions     void (^operation)(void))
1222*33de042dSApple OSS Distributions {
1223*33de042dSApple OSS Distributions 	workq_lock_held(wq);
1224*33de042dSApple OSS Distributions 	wq->wq_turnstile_updater = current_thread();
1225*33de042dSApple OSS Distributions 	operation();
1226*33de042dSApple OSS Distributions 	wq->wq_turnstile_updater = THREAD_NULL;
1227*33de042dSApple OSS Distributions }
1228*33de042dSApple OSS Distributions 
1229*33de042dSApple OSS Distributions static void
workq_turnstile_update_inheritor(struct workqueue * wq,turnstile_inheritor_t inheritor,turnstile_update_flags_t flags)1230*33de042dSApple OSS Distributions workq_turnstile_update_inheritor(struct workqueue *wq,
1231*33de042dSApple OSS Distributions     turnstile_inheritor_t inheritor,
1232*33de042dSApple OSS Distributions     turnstile_update_flags_t flags)
1233*33de042dSApple OSS Distributions {
1234*33de042dSApple OSS Distributions 	if (wq->wq_inheritor == inheritor) {
1235*33de042dSApple OSS Distributions 		return;
1236*33de042dSApple OSS Distributions 	}
1237*33de042dSApple OSS Distributions 	wq->wq_inheritor = inheritor;
1238*33de042dSApple OSS Distributions 	workq_perform_turnstile_operation_locked(wq, ^{
1239*33de042dSApple OSS Distributions 		turnstile_update_inheritor(wq->wq_turnstile, inheritor,
1240*33de042dSApple OSS Distributions 		flags | TURNSTILE_IMMEDIATE_UPDATE);
1241*33de042dSApple OSS Distributions 		turnstile_update_inheritor_complete(wq->wq_turnstile,
1242*33de042dSApple OSS Distributions 		TURNSTILE_INTERLOCK_HELD);
1243*33de042dSApple OSS Distributions 	});
1244*33de042dSApple OSS Distributions }
1245*33de042dSApple OSS Distributions 
1246*33de042dSApple OSS Distributions static void
workq_push_idle_thread(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)1247*33de042dSApple OSS Distributions workq_push_idle_thread(proc_t p, struct workqueue *wq, struct uthread *uth,
1248*33de042dSApple OSS Distributions     uint32_t setup_flags)
1249*33de042dSApple OSS Distributions {
1250*33de042dSApple OSS Distributions 	uint64_t now = mach_absolute_time();
1251*33de042dSApple OSS Distributions 	bool is_creator = (uth == wq->wq_creator);
1252*33de042dSApple OSS Distributions 
1253*33de042dSApple OSS Distributions 	if (workq_thread_is_cooperative(uth)) {
1254*33de042dSApple OSS Distributions 		assert(!is_creator);
1255*33de042dSApple OSS Distributions 
1256*33de042dSApple OSS Distributions 		thread_qos_t thread_qos = uth->uu_workq_pri.qos_req;
1257*33de042dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_dec(wq, thread_qos);
1258*33de042dSApple OSS Distributions 
1259*33de042dSApple OSS Distributions 		/* Before we get here, we always go through
1260*33de042dSApple OSS Distributions 		 * workq_select_threadreq_or_park_and_unlock. If we got here, it means
1261*33de042dSApple OSS Distributions 		 * that we went through the logic in workq_threadreq_select which
1262*33de042dSApple OSS Distributions 		 * did the refresh for the next best cooperative qos while
1263*33de042dSApple OSS Distributions 		 * excluding the current thread - we shouldn't need to do it again.
1264*33de042dSApple OSS Distributions 		 */
1265*33de042dSApple OSS Distributions 		assert(_wq_cooperative_queue_refresh_best_req_qos(wq) == false);
1266*33de042dSApple OSS Distributions 	} else if (workq_thread_is_nonovercommit(uth)) {
1267*33de042dSApple OSS Distributions 		assert(!is_creator);
1268*33de042dSApple OSS Distributions 
1269*33de042dSApple OSS Distributions 		wq->wq_constrained_threads_scheduled--;
1270*33de042dSApple OSS Distributions 	}
1271*33de042dSApple OSS Distributions 
1272*33de042dSApple OSS Distributions 	uth->uu_workq_flags &= ~(UT_WORKQ_RUNNING | UT_WORKQ_OVERCOMMIT | UT_WORKQ_COOPERATIVE);
1273*33de042dSApple OSS Distributions 	TAILQ_REMOVE(&wq->wq_thrunlist, uth, uu_workq_entry);
1274*33de042dSApple OSS Distributions 	wq->wq_threads_scheduled--;
1275*33de042dSApple OSS Distributions 
1276*33de042dSApple OSS Distributions 	if (is_creator) {
1277*33de042dSApple OSS Distributions 		wq->wq_creator = NULL;
1278*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_select, wq, 3, 0,
1279*33de042dSApple OSS Distributions 		    uth->uu_save.uus_workq_park_data.yields);
1280*33de042dSApple OSS Distributions 	}
1281*33de042dSApple OSS Distributions 
1282*33de042dSApple OSS Distributions 	if (wq->wq_inheritor == get_machthread(uth)) {
1283*33de042dSApple OSS Distributions 		assert(wq->wq_creator == NULL);
1284*33de042dSApple OSS Distributions 		if (wq->wq_reqcount) {
1285*33de042dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, wq, TURNSTILE_INHERITOR_WORKQ);
1286*33de042dSApple OSS Distributions 		} else {
1287*33de042dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
1288*33de042dSApple OSS Distributions 		}
1289*33de042dSApple OSS Distributions 	}
1290*33de042dSApple OSS Distributions 
1291*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_NEW) {
1292*33de042dSApple OSS Distributions 		assert(is_creator || (_wq_flags(wq) & WQ_EXITING));
1293*33de042dSApple OSS Distributions 		TAILQ_INSERT_TAIL(&wq->wq_thnewlist, uth, uu_workq_entry);
1294*33de042dSApple OSS Distributions 		wq->wq_thidlecount++;
1295*33de042dSApple OSS Distributions 		return;
1296*33de042dSApple OSS Distributions 	}
1297*33de042dSApple OSS Distributions 
1298*33de042dSApple OSS Distributions 	if (!is_creator) {
1299*33de042dSApple OSS Distributions 		_wq_thactive_dec(wq, uth->uu_workq_pri.qos_bucket);
1300*33de042dSApple OSS Distributions 		wq->wq_thscheduled_count[_wq_bucket(uth->uu_workq_pri.qos_bucket)]--;
1301*33de042dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_IDLE_CLEANUP;
1302*33de042dSApple OSS Distributions 	}
1303*33de042dSApple OSS Distributions 
1304*33de042dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.idle_stamp = now;
1305*33de042dSApple OSS Distributions 
1306*33de042dSApple OSS Distributions 	struct uthread *oldest = workq_oldest_killable_idle_thread(wq);
1307*33de042dSApple OSS Distributions 	uint16_t cur_idle = wq->wq_thidlecount;
1308*33de042dSApple OSS Distributions 
1309*33de042dSApple OSS Distributions 	if (cur_idle >= wq_max_constrained_threads ||
1310*33de042dSApple OSS Distributions 	    (wq->wq_thdying_count == 0 && oldest &&
1311*33de042dSApple OSS Distributions 	    workq_should_kill_idle_thread(wq, oldest, now))) {
1312*33de042dSApple OSS Distributions 		/*
1313*33de042dSApple OSS Distributions 		 * Immediately kill threads if we have too may of them.
1314*33de042dSApple OSS Distributions 		 *
1315*33de042dSApple OSS Distributions 		 * And swap "place" with the oldest one we'd have woken up.
1316*33de042dSApple OSS Distributions 		 * This is a relatively desperate situation where we really
1317*33de042dSApple OSS Distributions 		 * need to kill threads quickly and it's best to kill
1318*33de042dSApple OSS Distributions 		 * the one that's currently on core than context switching.
1319*33de042dSApple OSS Distributions 		 */
1320*33de042dSApple OSS Distributions 		if (oldest) {
1321*33de042dSApple OSS Distributions 			oldest->uu_save.uus_workq_park_data.idle_stamp = now;
1322*33de042dSApple OSS Distributions 			TAILQ_REMOVE(&wq->wq_thidlelist, oldest, uu_workq_entry);
1323*33de042dSApple OSS Distributions 			TAILQ_INSERT_HEAD(&wq->wq_thidlelist, oldest, uu_workq_entry);
1324*33de042dSApple OSS Distributions 		}
1325*33de042dSApple OSS Distributions 
1326*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_terminate | DBG_FUNC_START,
1327*33de042dSApple OSS Distributions 		    wq, cur_idle, 0, 0);
1328*33de042dSApple OSS Distributions 		wq->wq_thdying_count++;
1329*33de042dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
1330*33de042dSApple OSS Distributions 		uth->uu_workq_flags &= ~UT_WORKQ_IDLE_CLEANUP;
1331*33de042dSApple OSS Distributions 		workq_unpark_for_death_and_unlock(p, wq, uth, 0, setup_flags);
1332*33de042dSApple OSS Distributions 		__builtin_unreachable();
1333*33de042dSApple OSS Distributions 	}
1334*33de042dSApple OSS Distributions 
1335*33de042dSApple OSS Distributions 	struct uthread *tail = TAILQ_LAST(&wq->wq_thidlelist, workq_uthread_head);
1336*33de042dSApple OSS Distributions 
1337*33de042dSApple OSS Distributions 	cur_idle += 1;
1338*33de042dSApple OSS Distributions 	wq->wq_thidlecount = cur_idle;
1339*33de042dSApple OSS Distributions 
1340*33de042dSApple OSS Distributions 	if (cur_idle >= wq_death_max_load && tail &&
1341*33de042dSApple OSS Distributions 	    tail->uu_save.uus_workq_park_data.has_stack) {
1342*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.has_stack = false;
1343*33de042dSApple OSS Distributions 		TAILQ_INSERT_TAIL(&wq->wq_thidlelist, uth, uu_workq_entry);
1344*33de042dSApple OSS Distributions 	} else {
1345*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.has_stack = true;
1346*33de042dSApple OSS Distributions 		TAILQ_INSERT_HEAD(&wq->wq_thidlelist, uth, uu_workq_entry);
1347*33de042dSApple OSS Distributions 	}
1348*33de042dSApple OSS Distributions 
1349*33de042dSApple OSS Distributions 	if (!tail) {
1350*33de042dSApple OSS Distributions 		uint64_t delay = workq_kill_delay_for_idle_thread(wq);
1351*33de042dSApple OSS Distributions 		workq_death_call_schedule(wq, now + delay);
1352*33de042dSApple OSS Distributions 	}
1353*33de042dSApple OSS Distributions }
1354*33de042dSApple OSS Distributions 
1355*33de042dSApple OSS Distributions #pragma mark thread requests
1356*33de042dSApple OSS Distributions 
1357*33de042dSApple OSS Distributions static inline bool
workq_tr_is_overcommit(workq_tr_flags_t tr_flags)1358*33de042dSApple OSS Distributions workq_tr_is_overcommit(workq_tr_flags_t tr_flags)
1359*33de042dSApple OSS Distributions {
1360*33de042dSApple OSS Distributions 	return (tr_flags & WORKQ_TR_FLAG_OVERCOMMIT) != 0;
1361*33de042dSApple OSS Distributions }
1362*33de042dSApple OSS Distributions 
1363*33de042dSApple OSS Distributions static inline bool
workq_tr_is_nonovercommit(workq_tr_flags_t tr_flags)1364*33de042dSApple OSS Distributions workq_tr_is_nonovercommit(workq_tr_flags_t tr_flags)
1365*33de042dSApple OSS Distributions {
1366*33de042dSApple OSS Distributions 	return (tr_flags & (WORKQ_TR_FLAG_OVERCOMMIT |
1367*33de042dSApple OSS Distributions 	       WORKQ_TR_FLAG_COOPERATIVE |
1368*33de042dSApple OSS Distributions 	       WORKQ_TR_FLAG_PERMANENT_BIND)) == 0;
1369*33de042dSApple OSS Distributions }
1370*33de042dSApple OSS Distributions 
1371*33de042dSApple OSS Distributions static inline bool
workq_tr_is_cooperative(workq_tr_flags_t tr_flags)1372*33de042dSApple OSS Distributions workq_tr_is_cooperative(workq_tr_flags_t tr_flags)
1373*33de042dSApple OSS Distributions {
1374*33de042dSApple OSS Distributions 	return (tr_flags & WORKQ_TR_FLAG_COOPERATIVE) != 0;
1375*33de042dSApple OSS Distributions }
1376*33de042dSApple OSS Distributions 
/*
 * Convenience forms of the workq_tr_is_*() predicates that take a thread
 * request and test its tr_flags.
 */
#define workq_threadreq_is_overcommit(req) \
	workq_tr_is_overcommit((req)->tr_flags)
#define workq_threadreq_is_nonovercommit(req) \
	workq_tr_is_nonovercommit((req)->tr_flags)
#define workq_threadreq_is_cooperative(req) \
	workq_tr_is_cooperative((req)->tr_flags)
1380*33de042dSApple OSS Distributions 
1381*33de042dSApple OSS Distributions static inline int
workq_priority_for_req(workq_threadreq_t req)1382*33de042dSApple OSS Distributions workq_priority_for_req(workq_threadreq_t req)
1383*33de042dSApple OSS Distributions {
1384*33de042dSApple OSS Distributions 	thread_qos_t qos = req->tr_qos;
1385*33de042dSApple OSS Distributions 
1386*33de042dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
1387*33de042dSApple OSS Distributions 		workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(req);
1388*33de042dSApple OSS Distributions 		assert(trp.trp_flags & TRP_PRIORITY);
1389*33de042dSApple OSS Distributions 		return trp.trp_pri;
1390*33de042dSApple OSS Distributions 	}
1391*33de042dSApple OSS Distributions 	return thread_workq_pri_for_qos(qos);
1392*33de042dSApple OSS Distributions }
1393*33de042dSApple OSS Distributions 
1394*33de042dSApple OSS Distributions static inline struct priority_queue_sched_max *
workq_priority_queue_for_req(struct workqueue * wq,workq_threadreq_t req)1395*33de042dSApple OSS Distributions workq_priority_queue_for_req(struct workqueue *wq, workq_threadreq_t req)
1396*33de042dSApple OSS Distributions {
1397*33de042dSApple OSS Distributions 	assert(!workq_tr_is_cooperative(req->tr_flags));
1398*33de042dSApple OSS Distributions 
1399*33de042dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
1400*33de042dSApple OSS Distributions 		return &wq->wq_special_queue;
1401*33de042dSApple OSS Distributions 	} else if (workq_tr_is_overcommit(req->tr_flags)) {
1402*33de042dSApple OSS Distributions 		return &wq->wq_overcommit_queue;
1403*33de042dSApple OSS Distributions 	} else {
1404*33de042dSApple OSS Distributions 		return &wq->wq_constrained_queue;
1405*33de042dSApple OSS Distributions 	}
1406*33de042dSApple OSS Distributions }
1407*33de042dSApple OSS Distributions 
1408*33de042dSApple OSS Distributions /* Calculates the number of threads scheduled >= the input QoS */
1409*33de042dSApple OSS Distributions static uint64_t
workq_num_cooperative_threads_scheduled_to_qos_internal(struct workqueue * wq,thread_qos_t qos)1410*33de042dSApple OSS Distributions workq_num_cooperative_threads_scheduled_to_qos_internal(struct workqueue *wq, thread_qos_t qos)
1411*33de042dSApple OSS Distributions {
1412*33de042dSApple OSS Distributions 	uint64_t num_cooperative_threads = 0;
1413*33de042dSApple OSS Distributions 
1414*33de042dSApple OSS Distributions 	for (thread_qos_t cur_qos = WORKQ_THREAD_QOS_MAX; cur_qos >= qos; cur_qos--) {
1415*33de042dSApple OSS Distributions 		uint8_t bucket = _wq_bucket(cur_qos);
1416*33de042dSApple OSS Distributions 		num_cooperative_threads += wq->wq_cooperative_queue_scheduled_count[bucket];
1417*33de042dSApple OSS Distributions 	}
1418*33de042dSApple OSS Distributions 
1419*33de042dSApple OSS Distributions 	return num_cooperative_threads;
1420*33de042dSApple OSS Distributions }
1421*33de042dSApple OSS Distributions 
1422*33de042dSApple OSS Distributions /* Calculates the number of threads scheduled >= the input QoS */
1423*33de042dSApple OSS Distributions static uint64_t
workq_num_cooperative_threads_scheduled_to_qos_locked(struct workqueue * wq,thread_qos_t qos)1424*33de042dSApple OSS Distributions workq_num_cooperative_threads_scheduled_to_qos_locked(struct workqueue *wq, thread_qos_t qos)
1425*33de042dSApple OSS Distributions {
1426*33de042dSApple OSS Distributions 	workq_lock_held(wq);
1427*33de042dSApple OSS Distributions 	return workq_num_cooperative_threads_scheduled_to_qos_internal(wq, qos);
1428*33de042dSApple OSS Distributions }
1429*33de042dSApple OSS Distributions 
1430*33de042dSApple OSS Distributions static uint64_t
workq_num_cooperative_threads_scheduled_total(struct workqueue * wq)1431*33de042dSApple OSS Distributions workq_num_cooperative_threads_scheduled_total(struct workqueue *wq)
1432*33de042dSApple OSS Distributions {
1433*33de042dSApple OSS Distributions 	return workq_num_cooperative_threads_scheduled_to_qos_locked(wq, WORKQ_THREAD_QOS_MIN);
1434*33de042dSApple OSS Distributions }
1435*33de042dSApple OSS Distributions 
1436*33de042dSApple OSS Distributions static bool
workq_has_cooperative_thread_requests(struct workqueue * wq)1437*33de042dSApple OSS Distributions workq_has_cooperative_thread_requests(struct workqueue *wq)
1438*33de042dSApple OSS Distributions {
1439*33de042dSApple OSS Distributions 	for (thread_qos_t qos = WORKQ_THREAD_QOS_MAX; qos >= WORKQ_THREAD_QOS_MIN; qos--) {
1440*33de042dSApple OSS Distributions 		uint8_t bucket = _wq_bucket(qos);
1441*33de042dSApple OSS Distributions 		if (!STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket])) {
1442*33de042dSApple OSS Distributions 			return true;
1443*33de042dSApple OSS Distributions 		}
1444*33de042dSApple OSS Distributions 	}
1445*33de042dSApple OSS Distributions 
1446*33de042dSApple OSS Distributions 	return false;
1447*33de042dSApple OSS Distributions }
1448*33de042dSApple OSS Distributions 
1449*33de042dSApple OSS Distributions /*
1450*33de042dSApple OSS Distributions  * Determines the next QoS bucket we should service next in the cooperative
1451*33de042dSApple OSS Distributions  * pool. This function will always return a QoS for cooperative pool as long as
1452*33de042dSApple OSS Distributions  * there are requests to be serviced.
1453*33de042dSApple OSS Distributions  *
1454*33de042dSApple OSS Distributions  * Unlike the other thread pools, for the cooperative thread pool the schedule
1455*33de042dSApple OSS Distributions  * counts for the various buckets in the pool affect the next best request for
1456*33de042dSApple OSS Distributions  * it.
1457*33de042dSApple OSS Distributions  *
1458*33de042dSApple OSS Distributions  * This function is called in the following contexts:
1459*33de042dSApple OSS Distributions  *
1460*33de042dSApple OSS Distributions  * a) When determining the best thread QoS for cooperative bucket for the
1461*33de042dSApple OSS Distributions  * creator/thread reuse
1462*33de042dSApple OSS Distributions  *
1463*33de042dSApple OSS Distributions  * b) Once (a) has happened and thread has bound to a thread request, figuring
1464*33de042dSApple OSS Distributions  * out whether the next best request for this pool has changed so that creator
1465*33de042dSApple OSS Distributions  * can be scheduled.
1466*33de042dSApple OSS Distributions  *
1467*33de042dSApple OSS Distributions  * Returns true if the cooperative queue's best qos changed from previous
1468*33de042dSApple OSS Distributions  * value.
1469*33de042dSApple OSS Distributions  */
1470*33de042dSApple OSS Distributions static bool
_wq_cooperative_queue_refresh_best_req_qos(struct workqueue * wq)1471*33de042dSApple OSS Distributions _wq_cooperative_queue_refresh_best_req_qos(struct workqueue *wq)
1472*33de042dSApple OSS Distributions {
1473*33de042dSApple OSS Distributions 	workq_lock_held(wq);
1474*33de042dSApple OSS Distributions 
1475*33de042dSApple OSS Distributions 	thread_qos_t old_best_req_qos = wq->wq_cooperative_queue_best_req_qos;
1476*33de042dSApple OSS Distributions 
1477*33de042dSApple OSS Distributions 	/* We determine the next best cooperative thread request based on the
1478*33de042dSApple OSS Distributions 	 * following:
1479*33de042dSApple OSS Distributions 	 *
1480*33de042dSApple OSS Distributions 	 * 1. Take the MAX of the following:
1481*33de042dSApple OSS Distributions 	 *		a) Highest qos with pending TRs such that number of scheduled
1482*33de042dSApple OSS Distributions 	 *		threads so far with >= qos is < wq_max_cooperative_threads
1483*33de042dSApple OSS Distributions 	 *		b) Highest qos bucket with pending TRs but no scheduled threads for that bucket
1484*33de042dSApple OSS Distributions 	 *
1485*33de042dSApple OSS Distributions 	 * 2. If the result of (1) is UN, then we pick the highest priority amongst
1486*33de042dSApple OSS Distributions 	 * pending thread requests in the pool.
1487*33de042dSApple OSS Distributions 	 *
1488*33de042dSApple OSS Distributions 	 */
1489*33de042dSApple OSS Distributions 	thread_qos_t highest_qos_with_no_scheduled = THREAD_QOS_UNSPECIFIED;
1490*33de042dSApple OSS Distributions 	thread_qos_t highest_qos_req_with_width = THREAD_QOS_UNSPECIFIED;
1491*33de042dSApple OSS Distributions 
1492*33de042dSApple OSS Distributions 	thread_qos_t highest_qos_req = THREAD_QOS_UNSPECIFIED;
1493*33de042dSApple OSS Distributions 
1494*33de042dSApple OSS Distributions 	int scheduled_count_till_qos = 0;
1495*33de042dSApple OSS Distributions 
1496*33de042dSApple OSS Distributions 	for (thread_qos_t qos = WORKQ_THREAD_QOS_MAX; qos >= WORKQ_THREAD_QOS_MIN; qos--) {
1497*33de042dSApple OSS Distributions 		uint8_t bucket = _wq_bucket(qos);
1498*33de042dSApple OSS Distributions 		uint8_t scheduled_count_for_bucket = wq->wq_cooperative_queue_scheduled_count[bucket];
1499*33de042dSApple OSS Distributions 		scheduled_count_till_qos += scheduled_count_for_bucket;
1500*33de042dSApple OSS Distributions 
1501*33de042dSApple OSS Distributions 		if (!STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket])) {
1502*33de042dSApple OSS Distributions 			if (qos > highest_qos_req) {
1503*33de042dSApple OSS Distributions 				highest_qos_req = qos;
1504*33de042dSApple OSS Distributions 			}
1505*33de042dSApple OSS Distributions 			/*
1506*33de042dSApple OSS Distributions 			 * The pool isn't saturated for threads at and above this QoS, and
1507*33de042dSApple OSS Distributions 			 * this qos bucket has pending requests
1508*33de042dSApple OSS Distributions 			 */
1509*33de042dSApple OSS Distributions 			if (scheduled_count_till_qos < wq_cooperative_queue_max_size(wq)) {
1510*33de042dSApple OSS Distributions 				if (qos > highest_qos_req_with_width) {
1511*33de042dSApple OSS Distributions 					highest_qos_req_with_width = qos;
1512*33de042dSApple OSS Distributions 				}
1513*33de042dSApple OSS Distributions 			}
1514*33de042dSApple OSS Distributions 
1515*33de042dSApple OSS Distributions 			/*
1516*33de042dSApple OSS Distributions 			 * There are no threads scheduled for this bucket but there
1517*33de042dSApple OSS Distributions 			 * is work pending, give it at least 1 thread
1518*33de042dSApple OSS Distributions 			 */
1519*33de042dSApple OSS Distributions 			if (scheduled_count_for_bucket == 0) {
1520*33de042dSApple OSS Distributions 				if (qos > highest_qos_with_no_scheduled) {
1521*33de042dSApple OSS Distributions 					highest_qos_with_no_scheduled = qos;
1522*33de042dSApple OSS Distributions 				}
1523*33de042dSApple OSS Distributions 			}
1524*33de042dSApple OSS Distributions 		}
1525*33de042dSApple OSS Distributions 	}
1526*33de042dSApple OSS Distributions 
1527*33de042dSApple OSS Distributions 	wq->wq_cooperative_queue_best_req_qos = MAX(highest_qos_with_no_scheduled, highest_qos_req_with_width);
1528*33de042dSApple OSS Distributions 	if (wq->wq_cooperative_queue_best_req_qos == THREAD_QOS_UNSPECIFIED) {
1529*33de042dSApple OSS Distributions 		wq->wq_cooperative_queue_best_req_qos = highest_qos_req;
1530*33de042dSApple OSS Distributions 	}
1531*33de042dSApple OSS Distributions 
1532*33de042dSApple OSS Distributions #if MACH_ASSERT
1533*33de042dSApple OSS Distributions 	/* Assert that if we are showing up the next best req as UN, then there
1534*33de042dSApple OSS Distributions 	 * actually is no thread request in the cooperative pool buckets */
1535*33de042dSApple OSS Distributions 	if (wq->wq_cooperative_queue_best_req_qos == THREAD_QOS_UNSPECIFIED) {
1536*33de042dSApple OSS Distributions 		assert(!workq_has_cooperative_thread_requests(wq));
1537*33de042dSApple OSS Distributions 	}
1538*33de042dSApple OSS Distributions #endif
1539*33de042dSApple OSS Distributions 
1540*33de042dSApple OSS Distributions 	return old_best_req_qos != wq->wq_cooperative_queue_best_req_qos;
1541*33de042dSApple OSS Distributions }
1542*33de042dSApple OSS Distributions 
1543*33de042dSApple OSS Distributions /*
1544*33de042dSApple OSS Distributions  * Returns whether or not the input thread (or creator thread if uth is NULL)
1545*33de042dSApple OSS Distributions  * should be allowed to work as part of the cooperative pool for the <input qos>
1546*33de042dSApple OSS Distributions  * bucket.
1547*33de042dSApple OSS Distributions  *
1548*33de042dSApple OSS Distributions  * This function is called in a bunch of places:
1549*33de042dSApple OSS Distributions  *		a) Quantum expires for a thread and it is part of the cooperative pool
1550*33de042dSApple OSS Distributions  *		b) When trying to pick a thread request for the creator thread to
1551*33de042dSApple OSS Distributions  *		represent.
1552*33de042dSApple OSS Distributions  *		c) When a thread is trying to pick a thread request to actually bind to
1553*33de042dSApple OSS Distributions  *		and service.
1554*33de042dSApple OSS Distributions  *
1555*33de042dSApple OSS Distributions  * Called with workq lock held.
1556*33de042dSApple OSS Distributions  */
1557*33de042dSApple OSS Distributions 
1558*33de042dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_UNSATURATED 1
1559*33de042dSApple OSS Distributions #define WQ_COOPERATIVE_BUCKET_UNSERVICED 2
1560*33de042dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_SATURATED_UP_TO_QOS 3
1561*33de042dSApple OSS Distributions 
1562*33de042dSApple OSS Distributions static bool
workq_cooperative_allowance(struct workqueue * wq,thread_qos_t qos,struct uthread * uth,bool may_start_timer)1563*33de042dSApple OSS Distributions workq_cooperative_allowance(struct workqueue *wq, thread_qos_t qos, struct uthread *uth,
1564*33de042dSApple OSS Distributions     bool may_start_timer)
1565*33de042dSApple OSS Distributions {
1566*33de042dSApple OSS Distributions 	workq_lock_held(wq);
1567*33de042dSApple OSS Distributions 
1568*33de042dSApple OSS Distributions 	bool exclude_thread_as_scheduled = false;
1569*33de042dSApple OSS Distributions 	bool passed_admissions = false;
1570*33de042dSApple OSS Distributions 	uint8_t bucket = _wq_bucket(qos);
1571*33de042dSApple OSS Distributions 
1572*33de042dSApple OSS Distributions 	if (uth && workq_thread_is_cooperative(uth)) {
1573*33de042dSApple OSS Distributions 		exclude_thread_as_scheduled = true;
1574*33de042dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_dec(wq, uth->uu_workq_pri.qos_req);
1575*33de042dSApple OSS Distributions 	}
1576*33de042dSApple OSS Distributions 
1577*33de042dSApple OSS Distributions 	/*
1578*33de042dSApple OSS Distributions 	 * We have not saturated the pool yet, let this thread continue
1579*33de042dSApple OSS Distributions 	 */
1580*33de042dSApple OSS Distributions 	uint64_t total_cooperative_threads;
1581*33de042dSApple OSS Distributions 	total_cooperative_threads = workq_num_cooperative_threads_scheduled_total(wq);
1582*33de042dSApple OSS Distributions 	if (total_cooperative_threads < wq_cooperative_queue_max_size(wq)) {
1583*33de042dSApple OSS Distributions 		passed_admissions = true;
1584*33de042dSApple OSS Distributions 		WQ_TRACE(TRACE_wq_cooperative_admission | DBG_FUNC_NONE,
1585*33de042dSApple OSS Distributions 		    total_cooperative_threads, qos, passed_admissions,
1586*33de042dSApple OSS Distributions 		    WQ_COOPERATIVE_POOL_UNSATURATED);
1587*33de042dSApple OSS Distributions 		goto out;
1588*33de042dSApple OSS Distributions 	}
1589*33de042dSApple OSS Distributions 
1590*33de042dSApple OSS Distributions 	/*
1591*33de042dSApple OSS Distributions 	 * Without this thread, nothing is servicing the bucket which has pending
1592*33de042dSApple OSS Distributions 	 * work
1593*33de042dSApple OSS Distributions 	 */
1594*33de042dSApple OSS Distributions 	uint64_t bucket_scheduled = wq->wq_cooperative_queue_scheduled_count[bucket];
1595*33de042dSApple OSS Distributions 	if (bucket_scheduled == 0 &&
1596*33de042dSApple OSS Distributions 	    !STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket])) {
1597*33de042dSApple OSS Distributions 		passed_admissions = true;
1598*33de042dSApple OSS Distributions 		WQ_TRACE(TRACE_wq_cooperative_admission | DBG_FUNC_NONE,
1599*33de042dSApple OSS Distributions 		    total_cooperative_threads, qos, passed_admissions,
1600*33de042dSApple OSS Distributions 		    WQ_COOPERATIVE_BUCKET_UNSERVICED);
1601*33de042dSApple OSS Distributions 		goto out;
1602*33de042dSApple OSS Distributions 	}
1603*33de042dSApple OSS Distributions 
1604*33de042dSApple OSS Distributions 	/*
1605*33de042dSApple OSS Distributions 	 * If number of threads at the QoS bucket >= input QoS exceeds the max we want
1606*33de042dSApple OSS Distributions 	 * for the pool, deny this thread
1607*33de042dSApple OSS Distributions 	 */
1608*33de042dSApple OSS Distributions 	uint64_t aggregate_down_to_qos = workq_num_cooperative_threads_scheduled_to_qos_locked(wq, qos);
1609*33de042dSApple OSS Distributions 	passed_admissions = (aggregate_down_to_qos < wq_cooperative_queue_max_size(wq));
1610*33de042dSApple OSS Distributions 	WQ_TRACE(TRACE_wq_cooperative_admission | DBG_FUNC_NONE, aggregate_down_to_qos,
1611*33de042dSApple OSS Distributions 	    qos, passed_admissions, WQ_COOPERATIVE_POOL_SATURATED_UP_TO_QOS);
1612*33de042dSApple OSS Distributions 
1613*33de042dSApple OSS Distributions 	if (!passed_admissions && may_start_timer) {
1614*33de042dSApple OSS Distributions 		workq_schedule_delayed_thread_creation(wq, 0);
1615*33de042dSApple OSS Distributions 	}
1616*33de042dSApple OSS Distributions 
1617*33de042dSApple OSS Distributions out:
1618*33de042dSApple OSS Distributions 	if (exclude_thread_as_scheduled) {
1619*33de042dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_inc(wq, uth->uu_workq_pri.qos_req);
1620*33de042dSApple OSS Distributions 	}
1621*33de042dSApple OSS Distributions 	return passed_admissions;
1622*33de042dSApple OSS Distributions }
1623*33de042dSApple OSS Distributions 
1624*33de042dSApple OSS Distributions /*
1625*33de042dSApple OSS Distributions  * returns true if the best request for the pool changed as a result of
1626*33de042dSApple OSS Distributions  * enqueuing this thread request.
1627*33de042dSApple OSS Distributions  */
1628*33de042dSApple OSS Distributions static bool
workq_threadreq_enqueue(struct workqueue * wq,workq_threadreq_t req)1629*33de042dSApple OSS Distributions workq_threadreq_enqueue(struct workqueue *wq, workq_threadreq_t req)
1630*33de042dSApple OSS Distributions {
1631*33de042dSApple OSS Distributions 	assert(req->tr_state == WORKQ_TR_STATE_NEW);
1632*33de042dSApple OSS Distributions 
1633*33de042dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_QUEUED;
1634*33de042dSApple OSS Distributions 	wq->wq_reqcount += req->tr_count;
1635*33de042dSApple OSS Distributions 
1636*33de042dSApple OSS Distributions 	if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
1637*33de042dSApple OSS Distributions 		assert(wq->wq_event_manager_threadreq == NULL);
1638*33de042dSApple OSS Distributions 		assert(req->tr_flags & WORKQ_TR_FLAG_KEVENT);
1639*33de042dSApple OSS Distributions 		assert(req->tr_count == 1);
1640*33de042dSApple OSS Distributions 		wq->wq_event_manager_threadreq = req;
1641*33de042dSApple OSS Distributions 		return true;
1642*33de042dSApple OSS Distributions 	}
1643*33de042dSApple OSS Distributions 
1644*33de042dSApple OSS Distributions 	if (workq_threadreq_is_cooperative(req)) {
1645*33de042dSApple OSS Distributions 		assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
1646*33de042dSApple OSS Distributions 		assert(req->tr_qos != WORKQ_THREAD_QOS_ABOVEUI);
1647*33de042dSApple OSS Distributions 
1648*33de042dSApple OSS Distributions 		struct workq_threadreq_tailq *bucket = &wq->wq_cooperative_queue[_wq_bucket(req->tr_qos)];
1649*33de042dSApple OSS Distributions 		STAILQ_INSERT_TAIL(bucket, req, tr_link);
1650*33de042dSApple OSS Distributions 
1651*33de042dSApple OSS Distributions 		return _wq_cooperative_queue_refresh_best_req_qos(wq);
1652*33de042dSApple OSS Distributions 	}
1653*33de042dSApple OSS Distributions 
1654*33de042dSApple OSS Distributions 	struct priority_queue_sched_max *q = workq_priority_queue_for_req(wq, req);
1655*33de042dSApple OSS Distributions 
1656*33de042dSApple OSS Distributions 	priority_queue_entry_set_sched_pri(q, &req->tr_entry,
1657*33de042dSApple OSS Distributions 	    workq_priority_for_req(req), false);
1658*33de042dSApple OSS Distributions 
1659*33de042dSApple OSS Distributions 	if (priority_queue_insert(q, &req->tr_entry)) {
1660*33de042dSApple OSS Distributions 		if (workq_threadreq_is_nonovercommit(req)) {
1661*33de042dSApple OSS Distributions 			_wq_thactive_refresh_best_constrained_req_qos(wq);
1662*33de042dSApple OSS Distributions 		}
1663*33de042dSApple OSS Distributions 		return true;
1664*33de042dSApple OSS Distributions 	}
1665*33de042dSApple OSS Distributions 	return false;
1666*33de042dSApple OSS Distributions }
1667*33de042dSApple OSS Distributions 
1668*33de042dSApple OSS Distributions /*
1669*33de042dSApple OSS Distributions  * returns true if one of the following is true (so as to update creator if
1670*33de042dSApple OSS Distributions  * needed):
1671*33de042dSApple OSS Distributions  *
1672*33de042dSApple OSS Distributions  * (a) the next highest request of the pool we dequeued the request from changed
1673*33de042dSApple OSS Distributions  * (b) the next highest requests of the pool the current thread used to be a
1674*33de042dSApple OSS Distributions  * part of, changed
1675*33de042dSApple OSS Distributions  *
1676*33de042dSApple OSS Distributions  * For overcommit, special and constrained pools, the next highest QoS for each
1677*33de042dSApple OSS Distributions  * pool just a MAX of pending requests so tracking (a) is sufficient.
1678*33de042dSApple OSS Distributions  *
1679*33de042dSApple OSS Distributions  * But for cooperative thread pool, the next highest QoS for the pool depends on
1680*33de042dSApple OSS Distributions  * schedule counts in the pool as well. So if the current thread used to be
1681*33de042dSApple OSS Distributions  * cooperative in it's previous logical run ie (b), then that can also affect
1682*33de042dSApple OSS Distributions  * cooperative pool's next best QoS requests.
1683*33de042dSApple OSS Distributions  */
1684*33de042dSApple OSS Distributions static bool
workq_threadreq_dequeue(struct workqueue * wq,workq_threadreq_t req,bool cooperative_sched_count_changed)1685*33de042dSApple OSS Distributions workq_threadreq_dequeue(struct workqueue *wq, workq_threadreq_t req,
1686*33de042dSApple OSS Distributions     bool cooperative_sched_count_changed)
1687*33de042dSApple OSS Distributions {
1688*33de042dSApple OSS Distributions 	wq->wq_reqcount--;
1689*33de042dSApple OSS Distributions 
1690*33de042dSApple OSS Distributions 	bool next_highest_request_changed = false;
1691*33de042dSApple OSS Distributions 
1692*33de042dSApple OSS Distributions 	if (--req->tr_count == 0) {
1693*33de042dSApple OSS Distributions 		if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
1694*33de042dSApple OSS Distributions 			assert(wq->wq_event_manager_threadreq == req);
1695*33de042dSApple OSS Distributions 			assert(req->tr_count == 0);
1696*33de042dSApple OSS Distributions 			wq->wq_event_manager_threadreq = NULL;
1697*33de042dSApple OSS Distributions 
1698*33de042dSApple OSS Distributions 			/* If a cooperative thread was the one which picked up the manager
1699*33de042dSApple OSS Distributions 			 * thread request, we need to reevaluate the cooperative pool
1700*33de042dSApple OSS Distributions 			 * anyways.
1701*33de042dSApple OSS Distributions 			 */
1702*33de042dSApple OSS Distributions 			if (cooperative_sched_count_changed) {
1703*33de042dSApple OSS Distributions 				_wq_cooperative_queue_refresh_best_req_qos(wq);
1704*33de042dSApple OSS Distributions 			}
1705*33de042dSApple OSS Distributions 			return true;
1706*33de042dSApple OSS Distributions 		}
1707*33de042dSApple OSS Distributions 
1708*33de042dSApple OSS Distributions 		if (workq_threadreq_is_cooperative(req)) {
1709*33de042dSApple OSS Distributions 			assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
1710*33de042dSApple OSS Distributions 			assert(req->tr_qos != WORKQ_THREAD_QOS_ABOVEUI);
1711*33de042dSApple OSS Distributions 			/* Account for the fact that BG and MT are coalesced when
1712*33de042dSApple OSS Distributions 			 * calculating best request for cooperative pool
1713*33de042dSApple OSS Distributions 			 */
1714*33de042dSApple OSS Distributions 			assert(_wq_bucket(req->tr_qos) == _wq_bucket(wq->wq_cooperative_queue_best_req_qos));
1715*33de042dSApple OSS Distributions 
1716*33de042dSApple OSS Distributions 			struct workq_threadreq_tailq *bucket = &wq->wq_cooperative_queue[_wq_bucket(req->tr_qos)];
1717*33de042dSApple OSS Distributions 			__assert_only workq_threadreq_t head = STAILQ_FIRST(bucket);
1718*33de042dSApple OSS Distributions 
1719*33de042dSApple OSS Distributions 			assert(head == req);
1720*33de042dSApple OSS Distributions 			STAILQ_REMOVE_HEAD(bucket, tr_link);
1721*33de042dSApple OSS Distributions 
1722*33de042dSApple OSS Distributions 			/*
1723*33de042dSApple OSS Distributions 			 * If the request we're dequeueing is cooperative, then the sched
1724*33de042dSApple OSS Distributions 			 * counts definitely changed.
1725*33de042dSApple OSS Distributions 			 */
1726*33de042dSApple OSS Distributions 			assert(cooperative_sched_count_changed);
1727*33de042dSApple OSS Distributions 		}
1728*33de042dSApple OSS Distributions 
1729*33de042dSApple OSS Distributions 		/*
1730*33de042dSApple OSS Distributions 		 * We want to do the cooperative pool refresh after dequeueing a
1731*33de042dSApple OSS Distributions 		 * cooperative thread request if any (to combine both effects into 1
1732*33de042dSApple OSS Distributions 		 * refresh operation)
1733*33de042dSApple OSS Distributions 		 */
1734*33de042dSApple OSS Distributions 		if (cooperative_sched_count_changed) {
1735*33de042dSApple OSS Distributions 			next_highest_request_changed = _wq_cooperative_queue_refresh_best_req_qos(wq);
1736*33de042dSApple OSS Distributions 		}
1737*33de042dSApple OSS Distributions 
1738*33de042dSApple OSS Distributions 		if (!workq_threadreq_is_cooperative(req)) {
1739*33de042dSApple OSS Distributions 			/*
1740*33de042dSApple OSS Distributions 			 * All other types of requests are enqueued in priority queues
1741*33de042dSApple OSS Distributions 			 */
1742*33de042dSApple OSS Distributions 
1743*33de042dSApple OSS Distributions 			if (priority_queue_remove(workq_priority_queue_for_req(wq, req),
1744*33de042dSApple OSS Distributions 			    &req->tr_entry)) {
1745*33de042dSApple OSS Distributions 				next_highest_request_changed |= true;
1746*33de042dSApple OSS Distributions 				if (workq_threadreq_is_nonovercommit(req)) {
1747*33de042dSApple OSS Distributions 					_wq_thactive_refresh_best_constrained_req_qos(wq);
1748*33de042dSApple OSS Distributions 				}
1749*33de042dSApple OSS Distributions 			}
1750*33de042dSApple OSS Distributions 		}
1751*33de042dSApple OSS Distributions 	}
1752*33de042dSApple OSS Distributions 
1753*33de042dSApple OSS Distributions 	return next_highest_request_changed;
1754*33de042dSApple OSS Distributions }
1755*33de042dSApple OSS Distributions 
1756*33de042dSApple OSS Distributions static void
workq_threadreq_destroy(proc_t p,workq_threadreq_t req)1757*33de042dSApple OSS Distributions workq_threadreq_destroy(proc_t p, workq_threadreq_t req)
1758*33de042dSApple OSS Distributions {
1759*33de042dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_CANCELED;
1760*33de042dSApple OSS Distributions 	if (req->tr_flags & (WORKQ_TR_FLAG_WORKLOOP | WORKQ_TR_FLAG_KEVENT)) {
1761*33de042dSApple OSS Distributions 		kqueue_threadreq_cancel(p, req);
1762*33de042dSApple OSS Distributions 	} else {
1763*33de042dSApple OSS Distributions 		zfree(workq_zone_threadreq, req);
1764*33de042dSApple OSS Distributions 	}
1765*33de042dSApple OSS Distributions }
1766*33de042dSApple OSS Distributions 
1767*33de042dSApple OSS Distributions #pragma mark workqueue thread creation thread calls
1768*33de042dSApple OSS Distributions 
1769*33de042dSApple OSS Distributions static inline bool
workq_thread_call_prepost(struct workqueue * wq,uint32_t sched,uint32_t pend,uint32_t fail_mask)1770*33de042dSApple OSS Distributions workq_thread_call_prepost(struct workqueue *wq, uint32_t sched, uint32_t pend,
1771*33de042dSApple OSS Distributions     uint32_t fail_mask)
1772*33de042dSApple OSS Distributions {
1773*33de042dSApple OSS Distributions 	uint32_t old_flags, new_flags;
1774*33de042dSApple OSS Distributions 
1775*33de042dSApple OSS Distributions 	os_atomic_rmw_loop(&wq->wq_flags, old_flags, new_flags, acquire, {
1776*33de042dSApple OSS Distributions 		if (__improbable(old_flags & (WQ_EXITING | sched | pend | fail_mask))) {
1777*33de042dSApple OSS Distributions 		        os_atomic_rmw_loop_give_up(return false);
1778*33de042dSApple OSS Distributions 		}
1779*33de042dSApple OSS Distributions 		if (__improbable(old_flags & WQ_PROC_SUSPENDED)) {
1780*33de042dSApple OSS Distributions 		        new_flags = old_flags | pend;
1781*33de042dSApple OSS Distributions 		} else {
1782*33de042dSApple OSS Distributions 		        new_flags = old_flags | sched;
1783*33de042dSApple OSS Distributions 		}
1784*33de042dSApple OSS Distributions 	});
1785*33de042dSApple OSS Distributions 
1786*33de042dSApple OSS Distributions 	return (old_flags & WQ_PROC_SUSPENDED) == 0;
1787*33de042dSApple OSS Distributions }
1788*33de042dSApple OSS Distributions 
1789*33de042dSApple OSS Distributions #define WORKQ_SCHEDULE_DELAYED_THREAD_CREATION_RESTART 0x1
1790*33de042dSApple OSS Distributions 
1791*33de042dSApple OSS Distributions static bool
workq_schedule_delayed_thread_creation(struct workqueue * wq,int flags)1792*33de042dSApple OSS Distributions workq_schedule_delayed_thread_creation(struct workqueue *wq, int flags)
1793*33de042dSApple OSS Distributions {
1794*33de042dSApple OSS Distributions 	assert(!preemption_enabled());
1795*33de042dSApple OSS Distributions 
1796*33de042dSApple OSS Distributions 	if (!workq_thread_call_prepost(wq, WQ_DELAYED_CALL_SCHEDULED,
1797*33de042dSApple OSS Distributions 	    WQ_DELAYED_CALL_PENDED, WQ_IMMEDIATE_CALL_PENDED |
1798*33de042dSApple OSS Distributions 	    WQ_IMMEDIATE_CALL_SCHEDULED)) {
1799*33de042dSApple OSS Distributions 		return false;
1800*33de042dSApple OSS Distributions 	}
1801*33de042dSApple OSS Distributions 
1802*33de042dSApple OSS Distributions 	uint64_t now = mach_absolute_time();
1803*33de042dSApple OSS Distributions 
1804*33de042dSApple OSS Distributions 	if (flags & WORKQ_SCHEDULE_DELAYED_THREAD_CREATION_RESTART) {
1805*33de042dSApple OSS Distributions 		/* do not change the window */
1806*33de042dSApple OSS Distributions 	} else if (now - wq->wq_thread_call_last_run <= wq->wq_timer_interval) {
1807*33de042dSApple OSS Distributions 		wq->wq_timer_interval *= 2;
1808*33de042dSApple OSS Distributions 		if (wq->wq_timer_interval > wq_max_timer_interval.abstime) {
1809*33de042dSApple OSS Distributions 			wq->wq_timer_interval = (uint32_t)wq_max_timer_interval.abstime;
1810*33de042dSApple OSS Distributions 		}
1811*33de042dSApple OSS Distributions 	} else if (now - wq->wq_thread_call_last_run > 2 * wq->wq_timer_interval) {
1812*33de042dSApple OSS Distributions 		wq->wq_timer_interval /= 2;
1813*33de042dSApple OSS Distributions 		if (wq->wq_timer_interval < wq_stalled_window.abstime) {
1814*33de042dSApple OSS Distributions 			wq->wq_timer_interval = (uint32_t)wq_stalled_window.abstime;
1815*33de042dSApple OSS Distributions 		}
1816*33de042dSApple OSS Distributions 	}
1817*33de042dSApple OSS Distributions 
1818*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_start_add_timer, wq, wq->wq_reqcount,
1819*33de042dSApple OSS Distributions 	    _wq_flags(wq), wq->wq_timer_interval);
1820*33de042dSApple OSS Distributions 
1821*33de042dSApple OSS Distributions 	thread_call_t call = wq->wq_delayed_call;
1822*33de042dSApple OSS Distributions 	uintptr_t arg = WQ_DELAYED_CALL_SCHEDULED;
1823*33de042dSApple OSS Distributions 	uint64_t deadline = now + wq->wq_timer_interval;
1824*33de042dSApple OSS Distributions 	if (thread_call_enter1_delayed(call, (void *)arg, deadline)) {
1825*33de042dSApple OSS Distributions 		panic("delayed_call was already enqueued");
1826*33de042dSApple OSS Distributions 	}
1827*33de042dSApple OSS Distributions 	return true;
1828*33de042dSApple OSS Distributions }
1829*33de042dSApple OSS Distributions 
1830*33de042dSApple OSS Distributions static void
workq_schedule_immediate_thread_creation(struct workqueue * wq)1831*33de042dSApple OSS Distributions workq_schedule_immediate_thread_creation(struct workqueue *wq)
1832*33de042dSApple OSS Distributions {
1833*33de042dSApple OSS Distributions 	assert(!preemption_enabled());
1834*33de042dSApple OSS Distributions 
1835*33de042dSApple OSS Distributions 	if (workq_thread_call_prepost(wq, WQ_IMMEDIATE_CALL_SCHEDULED,
1836*33de042dSApple OSS Distributions 	    WQ_IMMEDIATE_CALL_PENDED, 0)) {
1837*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_start_add_timer, wq, wq->wq_reqcount,
1838*33de042dSApple OSS Distributions 		    _wq_flags(wq), 0);
1839*33de042dSApple OSS Distributions 
1840*33de042dSApple OSS Distributions 		uintptr_t arg = WQ_IMMEDIATE_CALL_SCHEDULED;
1841*33de042dSApple OSS Distributions 		if (thread_call_enter1(wq->wq_immediate_call, (void *)arg)) {
1842*33de042dSApple OSS Distributions 			panic("immediate_call was already enqueued");
1843*33de042dSApple OSS Distributions 		}
1844*33de042dSApple OSS Distributions 	}
1845*33de042dSApple OSS Distributions }
1846*33de042dSApple OSS Distributions 
1847*33de042dSApple OSS Distributions void
workq_proc_suspended(struct proc * p)1848*33de042dSApple OSS Distributions workq_proc_suspended(struct proc *p)
1849*33de042dSApple OSS Distributions {
1850*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
1851*33de042dSApple OSS Distributions 
1852*33de042dSApple OSS Distributions 	if (wq) {
1853*33de042dSApple OSS Distributions 		os_atomic_or(&wq->wq_flags, WQ_PROC_SUSPENDED, relaxed);
1854*33de042dSApple OSS Distributions 	}
1855*33de042dSApple OSS Distributions }
1856*33de042dSApple OSS Distributions 
1857*33de042dSApple OSS Distributions void
workq_proc_resumed(struct proc * p)1858*33de042dSApple OSS Distributions workq_proc_resumed(struct proc *p)
1859*33de042dSApple OSS Distributions {
1860*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
1861*33de042dSApple OSS Distributions 	uint32_t wq_flags;
1862*33de042dSApple OSS Distributions 
1863*33de042dSApple OSS Distributions 	if (!wq) {
1864*33de042dSApple OSS Distributions 		return;
1865*33de042dSApple OSS Distributions 	}
1866*33de042dSApple OSS Distributions 
1867*33de042dSApple OSS Distributions 	wq_flags = os_atomic_andnot_orig(&wq->wq_flags, WQ_PROC_SUSPENDED |
1868*33de042dSApple OSS Distributions 	    WQ_DELAYED_CALL_PENDED | WQ_IMMEDIATE_CALL_PENDED, relaxed);
1869*33de042dSApple OSS Distributions 	if ((wq_flags & WQ_EXITING) == 0) {
1870*33de042dSApple OSS Distributions 		disable_preemption();
1871*33de042dSApple OSS Distributions 		if (wq_flags & WQ_IMMEDIATE_CALL_PENDED) {
1872*33de042dSApple OSS Distributions 			workq_schedule_immediate_thread_creation(wq);
1873*33de042dSApple OSS Distributions 		} else if (wq_flags & WQ_DELAYED_CALL_PENDED) {
1874*33de042dSApple OSS Distributions 			workq_schedule_delayed_thread_creation(wq,
1875*33de042dSApple OSS Distributions 			    WORKQ_SCHEDULE_DELAYED_THREAD_CREATION_RESTART);
1876*33de042dSApple OSS Distributions 		}
1877*33de042dSApple OSS Distributions 		enable_preemption();
1878*33de042dSApple OSS Distributions 	}
1879*33de042dSApple OSS Distributions }
1880*33de042dSApple OSS Distributions 
1881*33de042dSApple OSS Distributions /**
1882*33de042dSApple OSS Distributions  * returns whether lastblocked_tsp is within wq_stalled_window usecs of now
1883*33de042dSApple OSS Distributions  */
1884*33de042dSApple OSS Distributions static bool
workq_thread_is_busy(uint64_t now,_Atomic uint64_t * lastblocked_tsp)1885*33de042dSApple OSS Distributions workq_thread_is_busy(uint64_t now, _Atomic uint64_t *lastblocked_tsp)
1886*33de042dSApple OSS Distributions {
1887*33de042dSApple OSS Distributions 	uint64_t lastblocked_ts = os_atomic_load_wide(lastblocked_tsp, relaxed);
1888*33de042dSApple OSS Distributions 	if (now <= lastblocked_ts) {
1889*33de042dSApple OSS Distributions 		/*
1890*33de042dSApple OSS Distributions 		 * Because the update of the timestamp when a thread blocks
1891*33de042dSApple OSS Distributions 		 * isn't serialized against us looking at it (i.e. we don't hold
1892*33de042dSApple OSS Distributions 		 * the workq lock), it's possible to have a timestamp that matches
1893*33de042dSApple OSS Distributions 		 * the current time or that even looks to be in the future relative
1894*33de042dSApple OSS Distributions 		 * to when we grabbed the current time...
1895*33de042dSApple OSS Distributions 		 *
1896*33de042dSApple OSS Distributions 		 * Just treat this as a busy thread since it must have just blocked.
1897*33de042dSApple OSS Distributions 		 */
1898*33de042dSApple OSS Distributions 		return true;
1899*33de042dSApple OSS Distributions 	}
1900*33de042dSApple OSS Distributions 	return (now - lastblocked_ts) < wq_stalled_window.abstime;
1901*33de042dSApple OSS Distributions }
1902*33de042dSApple OSS Distributions 
1903*33de042dSApple OSS Distributions static void
workq_add_new_threads_call(void * _p,void * flags)1904*33de042dSApple OSS Distributions workq_add_new_threads_call(void *_p, void *flags)
1905*33de042dSApple OSS Distributions {
1906*33de042dSApple OSS Distributions 	proc_t p = _p;
1907*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
1908*33de042dSApple OSS Distributions 	uint32_t my_flag = (uint32_t)(uintptr_t)flags;
1909*33de042dSApple OSS Distributions 
1910*33de042dSApple OSS Distributions 	/*
1911*33de042dSApple OSS Distributions 	 * workq_exit() will set the workqueue to NULL before
1912*33de042dSApple OSS Distributions 	 * it cancels thread calls.
1913*33de042dSApple OSS Distributions 	 */
1914*33de042dSApple OSS Distributions 	if (!wq) {
1915*33de042dSApple OSS Distributions 		return;
1916*33de042dSApple OSS Distributions 	}
1917*33de042dSApple OSS Distributions 
1918*33de042dSApple OSS Distributions 	assert((my_flag == WQ_DELAYED_CALL_SCHEDULED) ||
1919*33de042dSApple OSS Distributions 	    (my_flag == WQ_IMMEDIATE_CALL_SCHEDULED));
1920*33de042dSApple OSS Distributions 
1921*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_add_timer | DBG_FUNC_START, wq, _wq_flags(wq),
1922*33de042dSApple OSS Distributions 	    wq->wq_nthreads, wq->wq_thidlecount);
1923*33de042dSApple OSS Distributions 
1924*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
1925*33de042dSApple OSS Distributions 
1926*33de042dSApple OSS Distributions 	wq->wq_thread_call_last_run = mach_absolute_time();
1927*33de042dSApple OSS Distributions 	os_atomic_andnot(&wq->wq_flags, my_flag, release);
1928*33de042dSApple OSS Distributions 
1929*33de042dSApple OSS Distributions 	/* This can drop the workqueue lock, and take it again */
1930*33de042dSApple OSS Distributions 	workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
1931*33de042dSApple OSS Distributions 
1932*33de042dSApple OSS Distributions 	workq_unlock(wq);
1933*33de042dSApple OSS Distributions 
1934*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_add_timer | DBG_FUNC_END, wq, 0,
1935*33de042dSApple OSS Distributions 	    wq->wq_nthreads, wq->wq_thidlecount);
1936*33de042dSApple OSS Distributions }
1937*33de042dSApple OSS Distributions 
1938*33de042dSApple OSS Distributions #pragma mark thread state tracking
1939*33de042dSApple OSS Distributions 
1940*33de042dSApple OSS Distributions static void
workq_sched_callback(int type,thread_t thread)1941*33de042dSApple OSS Distributions workq_sched_callback(int type, thread_t thread)
1942*33de042dSApple OSS Distributions {
1943*33de042dSApple OSS Distributions 	thread_ro_t tro = get_thread_ro(thread);
1944*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
1945*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(tro->tro_proc);
1946*33de042dSApple OSS Distributions 	thread_qos_t req_qos, qos = uth->uu_workq_pri.qos_bucket;
1947*33de042dSApple OSS Distributions 	wq_thactive_t old_thactive;
1948*33de042dSApple OSS Distributions 	bool start_timer = false;
1949*33de042dSApple OSS Distributions 
1950*33de042dSApple OSS Distributions 	if (qos == WORKQ_THREAD_QOS_MANAGER) {
1951*33de042dSApple OSS Distributions 		return;
1952*33de042dSApple OSS Distributions 	}
1953*33de042dSApple OSS Distributions 
1954*33de042dSApple OSS Distributions 	switch (type) {
1955*33de042dSApple OSS Distributions 	case SCHED_CALL_BLOCK:
1956*33de042dSApple OSS Distributions 		old_thactive = _wq_thactive_dec(wq, qos);
1957*33de042dSApple OSS Distributions 		req_qos = WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(old_thactive);
1958*33de042dSApple OSS Distributions 
1959*33de042dSApple OSS Distributions 		/*
1960*33de042dSApple OSS Distributions 		 * Remember the timestamp of the last thread that blocked in this
1961*33de042dSApple OSS Distributions 		 * bucket, it used used by admission checks to ignore one thread
1962*33de042dSApple OSS Distributions 		 * being inactive if this timestamp is recent enough.
1963*33de042dSApple OSS Distributions 		 *
1964*33de042dSApple OSS Distributions 		 * If we collide with another thread trying to update the
1965*33de042dSApple OSS Distributions 		 * last_blocked (really unlikely since another thread would have to
1966*33de042dSApple OSS Distributions 		 * get scheduled and then block after we start down this path), it's
1967*33de042dSApple OSS Distributions 		 * not a problem.  Either timestamp is adequate, so no need to retry
1968*33de042dSApple OSS Distributions 		 */
1969*33de042dSApple OSS Distributions 		os_atomic_store_wide(&wq->wq_lastblocked_ts[_wq_bucket(qos)],
1970*33de042dSApple OSS Distributions 		    thread_last_run_time(thread), relaxed);
1971*33de042dSApple OSS Distributions 
1972*33de042dSApple OSS Distributions 		if (req_qos == THREAD_QOS_UNSPECIFIED) {
1973*33de042dSApple OSS Distributions 			/*
1974*33de042dSApple OSS Distributions 			 * No pending request at the moment we could unblock, move on.
1975*33de042dSApple OSS Distributions 			 */
1976*33de042dSApple OSS Distributions 		} else if (qos < req_qos) {
1977*33de042dSApple OSS Distributions 			/*
1978*33de042dSApple OSS Distributions 			 * The blocking thread is at a lower QoS than the highest currently
1979*33de042dSApple OSS Distributions 			 * pending constrained request, nothing has to be redriven
1980*33de042dSApple OSS Distributions 			 */
1981*33de042dSApple OSS Distributions 		} else {
1982*33de042dSApple OSS Distributions 			uint32_t max_busycount, old_req_count;
1983*33de042dSApple OSS Distributions 			old_req_count = _wq_thactive_aggregate_downto_qos(wq, old_thactive,
1984*33de042dSApple OSS Distributions 			    req_qos, NULL, &max_busycount);
1985*33de042dSApple OSS Distributions 			/*
1986*33de042dSApple OSS Distributions 			 * If it is possible that may_start_constrained_thread had refused
1987*33de042dSApple OSS Distributions 			 * admission due to being over the max concurrency, we may need to
1988*33de042dSApple OSS Distributions 			 * spin up a new thread.
1989*33de042dSApple OSS Distributions 			 *
1990*33de042dSApple OSS Distributions 			 * We take into account the maximum number of busy threads
1991*33de042dSApple OSS Distributions 			 * that can affect may_start_constrained_thread as looking at the
1992*33de042dSApple OSS Distributions 			 * actual number may_start_constrained_thread will see is racy.
1993*33de042dSApple OSS Distributions 			 *
1994*33de042dSApple OSS Distributions 			 * IOW at NCPU = 4, for IN (req_qos = 1), if the old req count is
1995*33de042dSApple OSS Distributions 			 * between NCPU (4) and NCPU - 2 (2) we need to redrive.
1996*33de042dSApple OSS Distributions 			 */
1997*33de042dSApple OSS Distributions 			uint32_t conc = wq_max_parallelism[_wq_bucket(qos)];
1998*33de042dSApple OSS Distributions 			if (old_req_count <= conc && conc <= old_req_count + max_busycount) {
1999*33de042dSApple OSS Distributions 				start_timer = workq_schedule_delayed_thread_creation(wq, 0);
2000*33de042dSApple OSS Distributions 			}
2001*33de042dSApple OSS Distributions 		}
2002*33de042dSApple OSS Distributions 		if (__improbable(kdebug_enable)) {
2003*33de042dSApple OSS Distributions 			__unused uint32_t old = _wq_thactive_aggregate_downto_qos(wq,
2004*33de042dSApple OSS Distributions 			    old_thactive, qos, NULL, NULL);
2005*33de042dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_thread_block | DBG_FUNC_START, wq,
2006*33de042dSApple OSS Distributions 			    old - 1, qos | (req_qos << 8),
2007*33de042dSApple OSS Distributions 			    wq->wq_reqcount << 1 | start_timer);
2008*33de042dSApple OSS Distributions 		}
2009*33de042dSApple OSS Distributions 		break;
2010*33de042dSApple OSS Distributions 
2011*33de042dSApple OSS Distributions 	case SCHED_CALL_UNBLOCK:
2012*33de042dSApple OSS Distributions 		/*
2013*33de042dSApple OSS Distributions 		 * we cannot take the workqueue_lock here...
2014*33de042dSApple OSS Distributions 		 * an UNBLOCK can occur from a timer event which
2015*33de042dSApple OSS Distributions 		 * is run from an interrupt context... if the workqueue_lock
2016*33de042dSApple OSS Distributions 		 * is already held by this processor, we'll deadlock...
2017*33de042dSApple OSS Distributions 		 * the thread lock for the thread being UNBLOCKED
2018*33de042dSApple OSS Distributions 		 * is also held
2019*33de042dSApple OSS Distributions 		 */
2020*33de042dSApple OSS Distributions 		old_thactive = _wq_thactive_inc(wq, qos);
2021*33de042dSApple OSS Distributions 		if (__improbable(kdebug_enable)) {
2022*33de042dSApple OSS Distributions 			__unused uint32_t old = _wq_thactive_aggregate_downto_qos(wq,
2023*33de042dSApple OSS Distributions 			    old_thactive, qos, NULL, NULL);
2024*33de042dSApple OSS Distributions 			req_qos = WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(old_thactive);
2025*33de042dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_thread_block | DBG_FUNC_END, wq,
2026*33de042dSApple OSS Distributions 			    old + 1, qos | (req_qos << 8),
2027*33de042dSApple OSS Distributions 			    wq->wq_threads_scheduled);
2028*33de042dSApple OSS Distributions 		}
2029*33de042dSApple OSS Distributions 		break;
2030*33de042dSApple OSS Distributions 	}
2031*33de042dSApple OSS Distributions }
2032*33de042dSApple OSS Distributions 
2033*33de042dSApple OSS Distributions #pragma mark workq lifecycle
2034*33de042dSApple OSS Distributions 
2035*33de042dSApple OSS Distributions void
workq_reference(struct workqueue * wq)2036*33de042dSApple OSS Distributions workq_reference(struct workqueue *wq)
2037*33de042dSApple OSS Distributions {
2038*33de042dSApple OSS Distributions 	os_ref_retain(&wq->wq_refcnt);
2039*33de042dSApple OSS Distributions }
2040*33de042dSApple OSS Distributions 
2041*33de042dSApple OSS Distributions static void
workq_deallocate_queue_invoke(mpsc_queue_chain_t e,__assert_only mpsc_daemon_queue_t dq)2042*33de042dSApple OSS Distributions workq_deallocate_queue_invoke(mpsc_queue_chain_t e,
2043*33de042dSApple OSS Distributions     __assert_only mpsc_daemon_queue_t dq)
2044*33de042dSApple OSS Distributions {
2045*33de042dSApple OSS Distributions 	struct workqueue *wq;
2046*33de042dSApple OSS Distributions 	struct turnstile *ts;
2047*33de042dSApple OSS Distributions 
2048*33de042dSApple OSS Distributions 	wq = mpsc_queue_element(e, struct workqueue, wq_destroy_link);
2049*33de042dSApple OSS Distributions 	assert(dq == &workq_deallocate_queue);
2050*33de042dSApple OSS Distributions 
2051*33de042dSApple OSS Distributions 	turnstile_complete((uintptr_t)wq, &wq->wq_turnstile, &ts, TURNSTILE_WORKQS);
2052*33de042dSApple OSS Distributions 	assert(ts);
2053*33de042dSApple OSS Distributions 	turnstile_cleanup();
2054*33de042dSApple OSS Distributions 	turnstile_deallocate(ts);
2055*33de042dSApple OSS Distributions 
2056*33de042dSApple OSS Distributions 	lck_ticket_destroy(&wq->wq_lock, &workq_lck_grp);
2057*33de042dSApple OSS Distributions 	zfree(workq_zone_workqueue, wq);
2058*33de042dSApple OSS Distributions }
2059*33de042dSApple OSS Distributions 
2060*33de042dSApple OSS Distributions static void
workq_deallocate(struct workqueue * wq)2061*33de042dSApple OSS Distributions workq_deallocate(struct workqueue *wq)
2062*33de042dSApple OSS Distributions {
2063*33de042dSApple OSS Distributions 	if (os_ref_release_relaxed(&wq->wq_refcnt) == 0) {
2064*33de042dSApple OSS Distributions 		workq_deallocate_queue_invoke(&wq->wq_destroy_link,
2065*33de042dSApple OSS Distributions 		    &workq_deallocate_queue);
2066*33de042dSApple OSS Distributions 	}
2067*33de042dSApple OSS Distributions }
2068*33de042dSApple OSS Distributions 
2069*33de042dSApple OSS Distributions void
workq_deallocate_safe(struct workqueue * wq)2070*33de042dSApple OSS Distributions workq_deallocate_safe(struct workqueue *wq)
2071*33de042dSApple OSS Distributions {
2072*33de042dSApple OSS Distributions 	if (__improbable(os_ref_release_relaxed(&wq->wq_refcnt) == 0)) {
2073*33de042dSApple OSS Distributions 		mpsc_daemon_enqueue(&workq_deallocate_queue, &wq->wq_destroy_link,
2074*33de042dSApple OSS Distributions 		    MPSC_QUEUE_DISABLE_PREEMPTION);
2075*33de042dSApple OSS Distributions 	}
2076*33de042dSApple OSS Distributions }
2077*33de042dSApple OSS Distributions 
2078*33de042dSApple OSS Distributions /**
2079*33de042dSApple OSS Distributions  * Setup per-process state for the workqueue.
2080*33de042dSApple OSS Distributions  */
2081*33de042dSApple OSS Distributions int
workq_open(struct proc * p,__unused struct workq_open_args * uap,__unused int32_t * retval)2082*33de042dSApple OSS Distributions workq_open(struct proc *p, __unused struct workq_open_args *uap,
2083*33de042dSApple OSS Distributions     __unused int32_t *retval)
2084*33de042dSApple OSS Distributions {
2085*33de042dSApple OSS Distributions 	struct workqueue *wq;
2086*33de042dSApple OSS Distributions 	int error = 0;
2087*33de042dSApple OSS Distributions 
2088*33de042dSApple OSS Distributions 	if ((p->p_lflag & P_LREGISTER) == 0) {
2089*33de042dSApple OSS Distributions 		return EINVAL;
2090*33de042dSApple OSS Distributions 	}
2091*33de042dSApple OSS Distributions 
2092*33de042dSApple OSS Distributions 	if (wq_init_constrained_limit) {
2093*33de042dSApple OSS Distributions 		uint32_t limit, num_cpus = ml_wait_max_cpus();
2094*33de042dSApple OSS Distributions 
2095*33de042dSApple OSS Distributions 		/*
2096*33de042dSApple OSS Distributions 		 * set up the limit for the constrained pool
2097*33de042dSApple OSS Distributions 		 * this is a virtual pool in that we don't
2098*33de042dSApple OSS Distributions 		 * maintain it on a separate idle and run list
2099*33de042dSApple OSS Distributions 		 */
2100*33de042dSApple OSS Distributions 		limit = num_cpus * WORKQUEUE_CONSTRAINED_FACTOR;
2101*33de042dSApple OSS Distributions 
2102*33de042dSApple OSS Distributions 		if (limit > wq_max_constrained_threads) {
2103*33de042dSApple OSS Distributions 			wq_max_constrained_threads = limit;
2104*33de042dSApple OSS Distributions 		}
2105*33de042dSApple OSS Distributions 
2106*33de042dSApple OSS Distributions 		if (wq_max_threads > WQ_THACTIVE_BUCKET_HALF) {
2107*33de042dSApple OSS Distributions 			wq_max_threads = WQ_THACTIVE_BUCKET_HALF;
2108*33de042dSApple OSS Distributions 		}
2109*33de042dSApple OSS Distributions 		if (wq_max_threads > CONFIG_THREAD_MAX - 20) {
2110*33de042dSApple OSS Distributions 			wq_max_threads = CONFIG_THREAD_MAX - 20;
2111*33de042dSApple OSS Distributions 		}
2112*33de042dSApple OSS Distributions 
2113*33de042dSApple OSS Distributions 		wq_death_max_load = (uint16_t)fls(num_cpus) + 1;
2114*33de042dSApple OSS Distributions 
2115*33de042dSApple OSS Distributions 		for (thread_qos_t qos = WORKQ_THREAD_QOS_MIN; qos <= WORKQ_THREAD_QOS_MAX; qos++) {
2116*33de042dSApple OSS Distributions 			wq_max_parallelism[_wq_bucket(qos)] =
2117*33de042dSApple OSS Distributions 			    qos_max_parallelism(qos, QOS_PARALLELISM_COUNT_LOGICAL);
2118*33de042dSApple OSS Distributions 		}
2119*33de042dSApple OSS Distributions 
2120*33de042dSApple OSS Distributions 		wq_max_cooperative_threads = num_cpus;
2121*33de042dSApple OSS Distributions 
2122*33de042dSApple OSS Distributions 		wq_init_constrained_limit = 0;
2123*33de042dSApple OSS Distributions 	}
2124*33de042dSApple OSS Distributions 
2125*33de042dSApple OSS Distributions 	if (proc_get_wqptr(p) == NULL) {
2126*33de042dSApple OSS Distributions 		if (proc_init_wqptr_or_wait(p) == FALSE) {
2127*33de042dSApple OSS Distributions 			assert(proc_get_wqptr(p) != NULL);
2128*33de042dSApple OSS Distributions 			goto out;
2129*33de042dSApple OSS Distributions 		}
2130*33de042dSApple OSS Distributions 
2131*33de042dSApple OSS Distributions 		wq = zalloc_flags(workq_zone_workqueue, Z_WAITOK | Z_ZERO);
2132*33de042dSApple OSS Distributions 
2133*33de042dSApple OSS Distributions 		os_ref_init_count(&wq->wq_refcnt, &workq_refgrp, 1);
2134*33de042dSApple OSS Distributions 
2135*33de042dSApple OSS Distributions 		// Start the event manager at the priority hinted at by the policy engine
2136*33de042dSApple OSS Distributions 		thread_qos_t mgr_priority_hint = task_get_default_manager_qos(current_task());
2137*33de042dSApple OSS Distributions 		pthread_priority_t pp = _pthread_priority_make_from_thread_qos(mgr_priority_hint, 0, 0);
2138*33de042dSApple OSS Distributions 		wq->wq_event_manager_priority = (uint32_t)pp;
2139*33de042dSApple OSS Distributions 		wq->wq_timer_interval = (uint32_t)wq_stalled_window.abstime;
2140*33de042dSApple OSS Distributions 		wq->wq_proc = p;
2141*33de042dSApple OSS Distributions 		turnstile_prepare((uintptr_t)wq, &wq->wq_turnstile, turnstile_alloc(),
2142*33de042dSApple OSS Distributions 		    TURNSTILE_WORKQS);
2143*33de042dSApple OSS Distributions 
2144*33de042dSApple OSS Distributions 		TAILQ_INIT(&wq->wq_thrunlist);
2145*33de042dSApple OSS Distributions 		TAILQ_INIT(&wq->wq_thnewlist);
2146*33de042dSApple OSS Distributions 		TAILQ_INIT(&wq->wq_thidlelist);
2147*33de042dSApple OSS Distributions 		priority_queue_init(&wq->wq_overcommit_queue);
2148*33de042dSApple OSS Distributions 		priority_queue_init(&wq->wq_constrained_queue);
2149*33de042dSApple OSS Distributions 		priority_queue_init(&wq->wq_special_queue);
2150*33de042dSApple OSS Distributions 		for (int bucket = 0; bucket < WORKQ_NUM_QOS_BUCKETS; bucket++) {
2151*33de042dSApple OSS Distributions 			STAILQ_INIT(&wq->wq_cooperative_queue[bucket]);
2152*33de042dSApple OSS Distributions 		}
2153*33de042dSApple OSS Distributions 
2154*33de042dSApple OSS Distributions 		/* We are only using the delayed thread call for the constrained pool
2155*33de042dSApple OSS Distributions 		 * which can't have work at >= UI QoS and so we can be fine with a
2156*33de042dSApple OSS Distributions 		 * UI QoS thread call.
2157*33de042dSApple OSS Distributions 		 */
2158*33de042dSApple OSS Distributions 		wq->wq_delayed_call = thread_call_allocate_with_qos(
2159*33de042dSApple OSS Distributions 			workq_add_new_threads_call, p, THREAD_QOS_USER_INTERACTIVE,
2160*33de042dSApple OSS Distributions 			THREAD_CALL_OPTIONS_ONCE);
2161*33de042dSApple OSS Distributions 		wq->wq_immediate_call = thread_call_allocate_with_options(
2162*33de042dSApple OSS Distributions 			workq_add_new_threads_call, p, THREAD_CALL_PRIORITY_KERNEL,
2163*33de042dSApple OSS Distributions 			THREAD_CALL_OPTIONS_ONCE);
2164*33de042dSApple OSS Distributions 		wq->wq_death_call = thread_call_allocate_with_options(
2165*33de042dSApple OSS Distributions 			workq_kill_old_threads_call, wq,
2166*33de042dSApple OSS Distributions 			THREAD_CALL_PRIORITY_USER, THREAD_CALL_OPTIONS_ONCE);
2167*33de042dSApple OSS Distributions 
2168*33de042dSApple OSS Distributions 		lck_ticket_init(&wq->wq_lock, &workq_lck_grp);
2169*33de042dSApple OSS Distributions 
2170*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_create | DBG_FUNC_NONE, wq,
2171*33de042dSApple OSS Distributions 		    VM_KERNEL_ADDRHIDE(wq), 0, 0);
2172*33de042dSApple OSS Distributions 		proc_set_wqptr(p, wq);
2173*33de042dSApple OSS Distributions 	}
2174*33de042dSApple OSS Distributions out:
2175*33de042dSApple OSS Distributions 
2176*33de042dSApple OSS Distributions 	return error;
2177*33de042dSApple OSS Distributions }
2178*33de042dSApple OSS Distributions 
2179*33de042dSApple OSS Distributions /*
2180*33de042dSApple OSS Distributions  * Routine:	workq_mark_exiting
2181*33de042dSApple OSS Distributions  *
2182*33de042dSApple OSS Distributions  * Function:	Mark the work queue such that new threads will not be added to the
2183*33de042dSApple OSS Distributions  *		work queue after we return.
2184*33de042dSApple OSS Distributions  *
2185*33de042dSApple OSS Distributions  * Conditions:	Called against the current process.
2186*33de042dSApple OSS Distributions  */
2187*33de042dSApple OSS Distributions void
workq_mark_exiting(struct proc * p)2188*33de042dSApple OSS Distributions workq_mark_exiting(struct proc *p)
2189*33de042dSApple OSS Distributions {
2190*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2191*33de042dSApple OSS Distributions 	uint32_t wq_flags;
2192*33de042dSApple OSS Distributions 	workq_threadreq_t mgr_req;
2193*33de042dSApple OSS Distributions 
2194*33de042dSApple OSS Distributions 	if (!wq) {
2195*33de042dSApple OSS Distributions 		return;
2196*33de042dSApple OSS Distributions 	}
2197*33de042dSApple OSS Distributions 
2198*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_pthread_exit | DBG_FUNC_START, wq, 0, 0, 0);
2199*33de042dSApple OSS Distributions 
2200*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
2201*33de042dSApple OSS Distributions 
2202*33de042dSApple OSS Distributions 	wq_flags = os_atomic_or_orig(&wq->wq_flags, WQ_EXITING, relaxed);
2203*33de042dSApple OSS Distributions 	if (__improbable(wq_flags & WQ_EXITING)) {
2204*33de042dSApple OSS Distributions 		panic("workq_mark_exiting called twice");
2205*33de042dSApple OSS Distributions 	}
2206*33de042dSApple OSS Distributions 
2207*33de042dSApple OSS Distributions 	/*
2208*33de042dSApple OSS Distributions 	 * Opportunistically try to cancel thread calls that are likely in flight.
2209*33de042dSApple OSS Distributions 	 * workq_exit() will do the proper cleanup.
2210*33de042dSApple OSS Distributions 	 */
2211*33de042dSApple OSS Distributions 	if (wq_flags & WQ_IMMEDIATE_CALL_SCHEDULED) {
2212*33de042dSApple OSS Distributions 		thread_call_cancel(wq->wq_immediate_call);
2213*33de042dSApple OSS Distributions 	}
2214*33de042dSApple OSS Distributions 	if (wq_flags & WQ_DELAYED_CALL_SCHEDULED) {
2215*33de042dSApple OSS Distributions 		thread_call_cancel(wq->wq_delayed_call);
2216*33de042dSApple OSS Distributions 	}
2217*33de042dSApple OSS Distributions 	if (wq_flags & WQ_DEATH_CALL_SCHEDULED) {
2218*33de042dSApple OSS Distributions 		thread_call_cancel(wq->wq_death_call);
2219*33de042dSApple OSS Distributions 	}
2220*33de042dSApple OSS Distributions 
2221*33de042dSApple OSS Distributions 	mgr_req = wq->wq_event_manager_threadreq;
2222*33de042dSApple OSS Distributions 	wq->wq_event_manager_threadreq = NULL;
2223*33de042dSApple OSS Distributions 	wq->wq_reqcount = 0; /* workq_schedule_creator must not look at queues */
2224*33de042dSApple OSS Distributions 	wq->wq_creator = NULL;
2225*33de042dSApple OSS Distributions 	workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
2226*33de042dSApple OSS Distributions 
2227*33de042dSApple OSS Distributions 	workq_unlock(wq);
2228*33de042dSApple OSS Distributions 
2229*33de042dSApple OSS Distributions 	if (mgr_req) {
2230*33de042dSApple OSS Distributions 		kqueue_threadreq_cancel(p, mgr_req);
2231*33de042dSApple OSS Distributions 	}
2232*33de042dSApple OSS Distributions 	/*
2233*33de042dSApple OSS Distributions 	 * No one touches the priority queues once WQ_EXITING is set.
2234*33de042dSApple OSS Distributions 	 * It is hence safe to do the tear down without holding any lock.
2235*33de042dSApple OSS Distributions 	 */
2236*33de042dSApple OSS Distributions 	priority_queue_destroy(&wq->wq_overcommit_queue,
2237*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry, ^(workq_threadreq_t e){
2238*33de042dSApple OSS Distributions 		workq_threadreq_destroy(p, e);
2239*33de042dSApple OSS Distributions 	});
2240*33de042dSApple OSS Distributions 	priority_queue_destroy(&wq->wq_constrained_queue,
2241*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry, ^(workq_threadreq_t e){
2242*33de042dSApple OSS Distributions 		workq_threadreq_destroy(p, e);
2243*33de042dSApple OSS Distributions 	});
2244*33de042dSApple OSS Distributions 	priority_queue_destroy(&wq->wq_special_queue,
2245*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry, ^(workq_threadreq_t e){
2246*33de042dSApple OSS Distributions 		workq_threadreq_destroy(p, e);
2247*33de042dSApple OSS Distributions 	});
2248*33de042dSApple OSS Distributions 
2249*33de042dSApple OSS Distributions 	WQ_TRACE(TRACE_wq_pthread_exit | DBG_FUNC_END, 0, 0, 0, 0);
2250*33de042dSApple OSS Distributions }
2251*33de042dSApple OSS Distributions 
2252*33de042dSApple OSS Distributions /*
2253*33de042dSApple OSS Distributions  * Routine:	workq_exit
2254*33de042dSApple OSS Distributions  *
2255*33de042dSApple OSS Distributions  * Function:	clean up the work queue structure(s) now that there are no threads
2256*33de042dSApple OSS Distributions  *		left running inside the work queue (except possibly current_thread).
2257*33de042dSApple OSS Distributions  *
2258*33de042dSApple OSS Distributions  * Conditions:	Called by the last thread in the process.
2259*33de042dSApple OSS Distributions  *		Called against current process.
2260*33de042dSApple OSS Distributions  */
2261*33de042dSApple OSS Distributions void
workq_exit(struct proc * p)2262*33de042dSApple OSS Distributions workq_exit(struct proc *p)
2263*33de042dSApple OSS Distributions {
2264*33de042dSApple OSS Distributions 	struct workqueue *wq;
2265*33de042dSApple OSS Distributions 	struct uthread *uth, *tmp;
2266*33de042dSApple OSS Distributions 
2267*33de042dSApple OSS Distributions 	wq = os_atomic_xchg(&p->p_wqptr, NULL, relaxed);
2268*33de042dSApple OSS Distributions 	if (wq != NULL) {
2269*33de042dSApple OSS Distributions 		thread_t th = current_thread();
2270*33de042dSApple OSS Distributions 
2271*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_workqueue_exit | DBG_FUNC_START, wq, 0, 0, 0);
2272*33de042dSApple OSS Distributions 
2273*33de042dSApple OSS Distributions 		if (thread_get_tag(th) & THREAD_TAG_WORKQUEUE) {
2274*33de042dSApple OSS Distributions 			/*
2275*33de042dSApple OSS Distributions 			 * <rdar://problem/40111515> Make sure we will no longer call the
2276*33de042dSApple OSS Distributions 			 * sched call, if we ever block this thread, which the cancel_wait
2277*33de042dSApple OSS Distributions 			 * below can do.
2278*33de042dSApple OSS Distributions 			 */
2279*33de042dSApple OSS Distributions 			thread_sched_call(th, NULL);
2280*33de042dSApple OSS Distributions 		}
2281*33de042dSApple OSS Distributions 
2282*33de042dSApple OSS Distributions 		/*
2283*33de042dSApple OSS Distributions 		 * Thread calls are always scheduled by the proc itself or under the
2284*33de042dSApple OSS Distributions 		 * workqueue spinlock if WQ_EXITING is not yet set.
2285*33de042dSApple OSS Distributions 		 *
2286*33de042dSApple OSS Distributions 		 * Either way, when this runs, the proc has no threads left beside
2287*33de042dSApple OSS Distributions 		 * the one running this very code, so we know no thread call can be
2288*33de042dSApple OSS Distributions 		 * dispatched anymore.
2289*33de042dSApple OSS Distributions 		 */
2290*33de042dSApple OSS Distributions 		thread_call_cancel_wait(wq->wq_delayed_call);
2291*33de042dSApple OSS Distributions 		thread_call_cancel_wait(wq->wq_immediate_call);
2292*33de042dSApple OSS Distributions 		thread_call_cancel_wait(wq->wq_death_call);
2293*33de042dSApple OSS Distributions 		thread_call_free(wq->wq_delayed_call);
2294*33de042dSApple OSS Distributions 		thread_call_free(wq->wq_immediate_call);
2295*33de042dSApple OSS Distributions 		thread_call_free(wq->wq_death_call);
2296*33de042dSApple OSS Distributions 
2297*33de042dSApple OSS Distributions 		/*
2298*33de042dSApple OSS Distributions 		 * Clean up workqueue data structures for threads that exited and
2299*33de042dSApple OSS Distributions 		 * didn't get a chance to clean up after themselves.
2300*33de042dSApple OSS Distributions 		 *
2301*33de042dSApple OSS Distributions 		 * idle/new threads should have been interrupted and died on their own
2302*33de042dSApple OSS Distributions 		 */
2303*33de042dSApple OSS Distributions 		TAILQ_FOREACH_SAFE(uth, &wq->wq_thrunlist, uu_workq_entry, tmp) {
2304*33de042dSApple OSS Distributions 			thread_t mth = get_machthread(uth);
2305*33de042dSApple OSS Distributions 			thread_sched_call(mth, NULL);
2306*33de042dSApple OSS Distributions 			thread_deallocate(mth);
2307*33de042dSApple OSS Distributions 		}
2308*33de042dSApple OSS Distributions 		assert(TAILQ_EMPTY(&wq->wq_thnewlist));
2309*33de042dSApple OSS Distributions 		assert(TAILQ_EMPTY(&wq->wq_thidlelist));
2310*33de042dSApple OSS Distributions 
2311*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_destroy | DBG_FUNC_END, wq,
2312*33de042dSApple OSS Distributions 		    VM_KERNEL_ADDRHIDE(wq), 0, 0);
2313*33de042dSApple OSS Distributions 
2314*33de042dSApple OSS Distributions 		workq_deallocate(wq);
2315*33de042dSApple OSS Distributions 
2316*33de042dSApple OSS Distributions 		WQ_TRACE(TRACE_wq_workqueue_exit | DBG_FUNC_END, 0, 0, 0, 0);
2317*33de042dSApple OSS Distributions 	}
2318*33de042dSApple OSS Distributions }
2319*33de042dSApple OSS Distributions 
2320*33de042dSApple OSS Distributions 
2321*33de042dSApple OSS Distributions #pragma mark bsd thread control
2322*33de042dSApple OSS Distributions 
2323*33de042dSApple OSS Distributions bool
bsdthread_part_of_cooperative_workqueue(struct uthread * uth)2324*33de042dSApple OSS Distributions bsdthread_part_of_cooperative_workqueue(struct uthread *uth)
2325*33de042dSApple OSS Distributions {
2326*33de042dSApple OSS Distributions 	return (workq_thread_is_cooperative(uth) || workq_thread_is_nonovercommit(uth)) &&
2327*33de042dSApple OSS Distributions 	       (uth->uu_workq_pri.qos_bucket != WORKQ_THREAD_QOS_MANAGER) &&
2328*33de042dSApple OSS Distributions 	       (!workq_thread_is_permanently_bound(uth));
2329*33de042dSApple OSS Distributions }
2330*33de042dSApple OSS Distributions 
2331*33de042dSApple OSS Distributions static bool
_pthread_priority_to_policy(pthread_priority_t priority,thread_qos_policy_data_t * data)2332*33de042dSApple OSS Distributions _pthread_priority_to_policy(pthread_priority_t priority,
2333*33de042dSApple OSS Distributions     thread_qos_policy_data_t *data)
2334*33de042dSApple OSS Distributions {
2335*33de042dSApple OSS Distributions 	data->qos_tier = _pthread_priority_thread_qos(priority);
2336*33de042dSApple OSS Distributions 	data->tier_importance = _pthread_priority_relpri(priority);
2337*33de042dSApple OSS Distributions 	if (data->qos_tier == THREAD_QOS_UNSPECIFIED || data->tier_importance > 0 ||
2338*33de042dSApple OSS Distributions 	    data->tier_importance < THREAD_QOS_MIN_TIER_IMPORTANCE) {
2339*33de042dSApple OSS Distributions 		return false;
2340*33de042dSApple OSS Distributions 	}
2341*33de042dSApple OSS Distributions 	return true;
2342*33de042dSApple OSS Distributions }
2343*33de042dSApple OSS Distributions 
2344*33de042dSApple OSS Distributions static int
bsdthread_set_self(proc_t p,thread_t th,pthread_priority_t priority,mach_port_name_t voucher,enum workq_set_self_flags flags)2345*33de042dSApple OSS Distributions bsdthread_set_self(proc_t p, thread_t th, pthread_priority_t priority,
2346*33de042dSApple OSS Distributions     mach_port_name_t voucher, enum workq_set_self_flags flags)
2347*33de042dSApple OSS Distributions {
2348*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
2349*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2350*33de042dSApple OSS Distributions 
2351*33de042dSApple OSS Distributions 	kern_return_t kr;
2352*33de042dSApple OSS Distributions 	int unbind_rv = 0, qos_rv = 0, voucher_rv = 0, fixedpri_rv = 0;
2353*33de042dSApple OSS Distributions 	bool is_wq_thread = (thread_get_tag(th) & THREAD_TAG_WORKQUEUE);
2354*33de042dSApple OSS Distributions 
2355*33de042dSApple OSS Distributions 	assert(th == current_thread());
2356*33de042dSApple OSS Distributions 	if (flags & WORKQ_SET_SELF_WQ_KEVENT_UNBIND) {
2357*33de042dSApple OSS Distributions 		if (!is_wq_thread) {
2358*33de042dSApple OSS Distributions 			unbind_rv = EINVAL;
2359*33de042dSApple OSS Distributions 			goto qos;
2360*33de042dSApple OSS Distributions 		}
2361*33de042dSApple OSS Distributions 
2362*33de042dSApple OSS Distributions 		if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER) {
2363*33de042dSApple OSS Distributions 			unbind_rv = EINVAL;
2364*33de042dSApple OSS Distributions 			goto qos;
2365*33de042dSApple OSS Distributions 		}
2366*33de042dSApple OSS Distributions 
2367*33de042dSApple OSS Distributions 		workq_threadreq_t kqr = uth->uu_kqr_bound;
2368*33de042dSApple OSS Distributions 		if (kqr == NULL) {
2369*33de042dSApple OSS Distributions 			unbind_rv = EALREADY;
2370*33de042dSApple OSS Distributions 			goto qos;
2371*33de042dSApple OSS Distributions 		}
2372*33de042dSApple OSS Distributions 
2373*33de042dSApple OSS Distributions 		if (kqr->tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
2374*33de042dSApple OSS Distributions 			unbind_rv = EINVAL;
2375*33de042dSApple OSS Distributions 			goto qos;
2376*33de042dSApple OSS Distributions 		}
2377*33de042dSApple OSS Distributions 
2378*33de042dSApple OSS Distributions 		kqueue_threadreq_unbind(p, kqr);
2379*33de042dSApple OSS Distributions 	}
2380*33de042dSApple OSS Distributions 
2381*33de042dSApple OSS Distributions qos:
2382*33de042dSApple OSS Distributions 	if (flags & (WORKQ_SET_SELF_QOS_FLAG | WORKQ_SET_SELF_QOS_OVERRIDE_FLAG)) {
2383*33de042dSApple OSS Distributions 		assert(flags & WORKQ_SET_SELF_QOS_FLAG);
2384*33de042dSApple OSS Distributions 
2385*33de042dSApple OSS Distributions 		thread_qos_policy_data_t new_policy;
2386*33de042dSApple OSS Distributions 		thread_qos_t qos_override = THREAD_QOS_UNSPECIFIED;
2387*33de042dSApple OSS Distributions 
2388*33de042dSApple OSS Distributions 		if (!_pthread_priority_to_policy(priority, &new_policy)) {
2389*33de042dSApple OSS Distributions 			qos_rv = EINVAL;
2390*33de042dSApple OSS Distributions 			goto voucher;
2391*33de042dSApple OSS Distributions 		}
2392*33de042dSApple OSS Distributions 
2393*33de042dSApple OSS Distributions 		if (flags & WORKQ_SET_SELF_QOS_OVERRIDE_FLAG) {
2394*33de042dSApple OSS Distributions 			/*
2395*33de042dSApple OSS Distributions 			 * If the WORKQ_SET_SELF_QOS_OVERRIDE_FLAG is set, we definitely
2396*33de042dSApple OSS Distributions 			 * should have an override QoS in the pthread_priority_t and we should
2397*33de042dSApple OSS Distributions 			 * only come into this path for cooperative thread requests
2398*33de042dSApple OSS Distributions 			 */
2399*33de042dSApple OSS Distributions 			if (!_pthread_priority_has_override_qos(priority) ||
2400*33de042dSApple OSS Distributions 			    !_pthread_priority_is_cooperative(priority)) {
2401*33de042dSApple OSS Distributions 				qos_rv = EINVAL;
2402*33de042dSApple OSS Distributions 				goto voucher;
2403*33de042dSApple OSS Distributions 			}
2404*33de042dSApple OSS Distributions 			qos_override = _pthread_priority_thread_override_qos(priority);
2405*33de042dSApple OSS Distributions 		} else {
2406*33de042dSApple OSS Distributions 			/*
2407*33de042dSApple OSS Distributions 			 * If the WORKQ_SET_SELF_QOS_OVERRIDE_FLAG is not set, we definitely
2408*33de042dSApple OSS Distributions 			 * should not have an override QoS in the pthread_priority_t
2409*33de042dSApple OSS Distributions 			 */
2410*33de042dSApple OSS Distributions 			if (_pthread_priority_has_override_qos(priority)) {
2411*33de042dSApple OSS Distributions 				qos_rv = EINVAL;
2412*33de042dSApple OSS Distributions 				goto voucher;
2413*33de042dSApple OSS Distributions 			}
2414*33de042dSApple OSS Distributions 		}
2415*33de042dSApple OSS Distributions 
2416*33de042dSApple OSS Distributions 		if (!is_wq_thread) {
2417*33de042dSApple OSS Distributions 			/*
2418*33de042dSApple OSS Distributions 			 * Threads opted out of QoS can't change QoS
2419*33de042dSApple OSS Distributions 			 */
2420*33de042dSApple OSS Distributions 			if (!thread_has_qos_policy(th)) {
2421*33de042dSApple OSS Distributions 				qos_rv = EPERM;
2422*33de042dSApple OSS Distributions 				goto voucher;
2423*33de042dSApple OSS Distributions 			}
2424*33de042dSApple OSS Distributions 		} else if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER ||
2425*33de042dSApple OSS Distributions 		    uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_ABOVEUI) {
2426*33de042dSApple OSS Distributions 			/*
2427*33de042dSApple OSS Distributions 			 * Workqueue manager threads or threads above UI can't change QoS
2428*33de042dSApple OSS Distributions 			 */
2429*33de042dSApple OSS Distributions 			qos_rv = EINVAL;
2430*33de042dSApple OSS Distributions 			goto voucher;
2431*33de042dSApple OSS Distributions 		} else {
2432*33de042dSApple OSS Distributions 			/*
2433*33de042dSApple OSS Distributions 			 * For workqueue threads, possibly adjust buckets and redrive thread
2434*33de042dSApple OSS Distributions 			 * requests.
2435*33de042dSApple OSS Distributions 			 *
2436*33de042dSApple OSS Distributions 			 * Transitions allowed:
2437*33de042dSApple OSS Distributions 			 *
2438*33de042dSApple OSS Distributions 			 * overcommit --> non-overcommit
2439*33de042dSApple OSS Distributions 			 * overcommit --> overcommit
2440*33de042dSApple OSS Distributions 			 * non-overcommit --> non-overcommit
2441*33de042dSApple OSS Distributions 			 * non-overcommit --> overcommit (to be deprecated later)
2442*33de042dSApple OSS Distributions 			 * cooperative --> cooperative
2443*33de042dSApple OSS Distributions 			 *
2444*33de042dSApple OSS Distributions 			 * All other transitions aren't allowed so reject them.
2445*33de042dSApple OSS Distributions 			 */
2446*33de042dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth) && _pthread_priority_is_cooperative(priority)) {
2447*33de042dSApple OSS Distributions 				qos_rv = EINVAL;
2448*33de042dSApple OSS Distributions 				goto voucher;
2449*33de042dSApple OSS Distributions 			} else if (workq_thread_is_cooperative(uth) && !_pthread_priority_is_cooperative(priority)) {
2450*33de042dSApple OSS Distributions 				qos_rv = EINVAL;
2451*33de042dSApple OSS Distributions 				goto voucher;
2452*33de042dSApple OSS Distributions 			} else if (workq_thread_is_nonovercommit(uth) && _pthread_priority_is_cooperative(priority)) {
2453*33de042dSApple OSS Distributions 				qos_rv = EINVAL;
2454*33de042dSApple OSS Distributions 				goto voucher;
2455*33de042dSApple OSS Distributions 			}
2456*33de042dSApple OSS Distributions 
2457*33de042dSApple OSS Distributions 			struct uu_workq_policy old_pri, new_pri;
2458*33de042dSApple OSS Distributions 			bool force_run = false;
2459*33de042dSApple OSS Distributions 
2460*33de042dSApple OSS Distributions 			if (qos_override) {
2461*33de042dSApple OSS Distributions 				/*
2462*33de042dSApple OSS Distributions 				 * We're in the case of a thread clarifying that it is for eg. not IN
2463*33de042dSApple OSS Distributions 				 * req QoS but rather, UT req QoS with IN override. However, this can
2464*33de042dSApple OSS Distributions 				 * race with a concurrent override happening to the thread via
2465*33de042dSApple OSS Distributions 				 * workq_thread_add_dispatch_override so this needs to be
2466*33de042dSApple OSS Distributions 				 * synchronized with the thread mutex.
2467*33de042dSApple OSS Distributions 				 */
2468*33de042dSApple OSS Distributions 				thread_mtx_lock(th);
2469*33de042dSApple OSS Distributions 			}
2470*33de042dSApple OSS Distributions 
2471*33de042dSApple OSS Distributions 			workq_lock_spin(wq);
2472*33de042dSApple OSS Distributions 
2473*33de042dSApple OSS Distributions 			old_pri = new_pri = uth->uu_workq_pri;
2474*33de042dSApple OSS Distributions 			new_pri.qos_req = (thread_qos_t)new_policy.qos_tier;
2475*33de042dSApple OSS Distributions 
2476*33de042dSApple OSS Distributions 			if (old_pri.qos_override < qos_override) {
2477*33de042dSApple OSS Distributions 				/*
2478*33de042dSApple OSS Distributions 				 * Since this can race with a concurrent override via
2479*33de042dSApple OSS Distributions 				 * workq_thread_add_dispatch_override, only adjust override value if we
2480*33de042dSApple OSS Distributions 				 * are higher - this is a saturating function.
2481*33de042dSApple OSS Distributions 				 *
2482*33de042dSApple OSS Distributions 				 * We should not be changing the final override values, we should simply
2483*33de042dSApple OSS Distributions 				 * be redistributing the current value with a different breakdown of req
2484*33de042dSApple OSS Distributions 				 * vs override QoS - assert to that effect. Therefore, buckets should
2485*33de042dSApple OSS Distributions 				 * not change.
2486*33de042dSApple OSS Distributions 				 */
2487*33de042dSApple OSS Distributions 				new_pri.qos_override = qos_override;
2488*33de042dSApple OSS Distributions 				assert(workq_pri_override(new_pri) == workq_pri_override(old_pri));
2489*33de042dSApple OSS Distributions 				assert(workq_pri_bucket(new_pri) == workq_pri_bucket(old_pri));
2490*33de042dSApple OSS Distributions 			}
2491*33de042dSApple OSS Distributions 
2492*33de042dSApple OSS Distributions 			/* Adjust schedule counts for various types of transitions */
2493*33de042dSApple OSS Distributions 
2494*33de042dSApple OSS Distributions 			/* overcommit -> non-overcommit */
2495*33de042dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth) && _pthread_priority_is_nonovercommit(priority)) {
2496*33de042dSApple OSS Distributions 				workq_thread_set_type(uth, 0);
2497*33de042dSApple OSS Distributions 				wq->wq_constrained_threads_scheduled++;
2498*33de042dSApple OSS Distributions 
2499*33de042dSApple OSS Distributions 				/* non-overcommit -> overcommit */
2500*33de042dSApple OSS Distributions 			} else if (workq_thread_is_nonovercommit(uth) && _pthread_priority_is_overcommit(priority)) {
2501*33de042dSApple OSS Distributions 				workq_thread_set_type(uth, UT_WORKQ_OVERCOMMIT);
2502*33de042dSApple OSS Distributions 				force_run = (wq->wq_constrained_threads_scheduled-- == wq_max_constrained_threads);
2503*33de042dSApple OSS Distributions 
2504*33de042dSApple OSS Distributions 				/* cooperative -> cooperative */
2505*33de042dSApple OSS Distributions 			} else if (workq_thread_is_cooperative(uth)) {
2506*33de042dSApple OSS Distributions 				_wq_cooperative_queue_scheduled_count_dec(wq, old_pri.qos_req);
2507*33de042dSApple OSS Distributions 				_wq_cooperative_queue_scheduled_count_inc(wq, new_pri.qos_req);
2508*33de042dSApple OSS Distributions 
2509*33de042dSApple OSS Distributions 				/* We're changing schedule counts within cooperative pool, we
2510*33de042dSApple OSS Distributions 				 * need to refresh best cooperative QoS logic again */
2511*33de042dSApple OSS Distributions 				force_run = _wq_cooperative_queue_refresh_best_req_qos(wq);
2512*33de042dSApple OSS Distributions 			}
2513*33de042dSApple OSS Distributions 
2514*33de042dSApple OSS Distributions 			/*
2515*33de042dSApple OSS Distributions 			 * This will set up an override on the thread if any and will also call
2516*33de042dSApple OSS Distributions 			 * schedule_creator if needed
2517*33de042dSApple OSS Distributions 			 */
2518*33de042dSApple OSS Distributions 			workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, force_run);
2519*33de042dSApple OSS Distributions 			workq_unlock(wq);
2520*33de042dSApple OSS Distributions 
2521*33de042dSApple OSS Distributions 			if (qos_override) {
2522*33de042dSApple OSS Distributions 				thread_mtx_unlock(th);
2523*33de042dSApple OSS Distributions 			}
2524*33de042dSApple OSS Distributions 
2525*33de042dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth)) {
2526*33de042dSApple OSS Distributions 				thread_disarm_workqueue_quantum(th);
2527*33de042dSApple OSS Distributions 			} else {
2528*33de042dSApple OSS Distributions 				/* If the thread changed QoS buckets, the quantum duration
2529*33de042dSApple OSS Distributions 				 * may have changed too */
2530*33de042dSApple OSS Distributions 				thread_arm_workqueue_quantum(th);
2531*33de042dSApple OSS Distributions 			}
2532*33de042dSApple OSS Distributions 		}
2533*33de042dSApple OSS Distributions 
2534*33de042dSApple OSS Distributions 		kr = thread_policy_set_internal(th, THREAD_QOS_POLICY,
2535*33de042dSApple OSS Distributions 		    (thread_policy_t)&new_policy, THREAD_QOS_POLICY_COUNT);
2536*33de042dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2537*33de042dSApple OSS Distributions 			qos_rv = EINVAL;
2538*33de042dSApple OSS Distributions 		}
2539*33de042dSApple OSS Distributions 	}
2540*33de042dSApple OSS Distributions 
2541*33de042dSApple OSS Distributions voucher:
2542*33de042dSApple OSS Distributions 	if (flags & WORKQ_SET_SELF_VOUCHER_FLAG) {
2543*33de042dSApple OSS Distributions 		kr = thread_set_voucher_name(voucher);
2544*33de042dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2545*33de042dSApple OSS Distributions 			voucher_rv = ENOENT;
2546*33de042dSApple OSS Distributions 			goto fixedpri;
2547*33de042dSApple OSS Distributions 		}
2548*33de042dSApple OSS Distributions 	}
2549*33de042dSApple OSS Distributions 
2550*33de042dSApple OSS Distributions fixedpri:
2551*33de042dSApple OSS Distributions 	if (qos_rv) {
2552*33de042dSApple OSS Distributions 		goto done;
2553*33de042dSApple OSS Distributions 	}
2554*33de042dSApple OSS Distributions 	if (flags & WORKQ_SET_SELF_FIXEDPRIORITY_FLAG) {
2555*33de042dSApple OSS Distributions 		thread_extended_policy_data_t extpol = {.timeshare = 0};
2556*33de042dSApple OSS Distributions 
2557*33de042dSApple OSS Distributions 		if (is_wq_thread) {
2558*33de042dSApple OSS Distributions 			/* Not allowed on workqueue threads */
2559*33de042dSApple OSS Distributions 			fixedpri_rv = ENOTSUP;
2560*33de042dSApple OSS Distributions 			goto done;
2561*33de042dSApple OSS Distributions 		}
2562*33de042dSApple OSS Distributions 
2563*33de042dSApple OSS Distributions 		kr = thread_policy_set_internal(th, THREAD_EXTENDED_POLICY,
2564*33de042dSApple OSS Distributions 		    (thread_policy_t)&extpol, THREAD_EXTENDED_POLICY_COUNT);
2565*33de042dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2566*33de042dSApple OSS Distributions 			fixedpri_rv = EINVAL;
2567*33de042dSApple OSS Distributions 			goto done;
2568*33de042dSApple OSS Distributions 		}
2569*33de042dSApple OSS Distributions 	} else if (flags & WORKQ_SET_SELF_TIMESHARE_FLAG) {
2570*33de042dSApple OSS Distributions 		thread_extended_policy_data_t extpol = {.timeshare = 1};
2571*33de042dSApple OSS Distributions 
2572*33de042dSApple OSS Distributions 		if (is_wq_thread) {
2573*33de042dSApple OSS Distributions 			/* Not allowed on workqueue threads */
2574*33de042dSApple OSS Distributions 			fixedpri_rv = ENOTSUP;
2575*33de042dSApple OSS Distributions 			goto done;
2576*33de042dSApple OSS Distributions 		}
2577*33de042dSApple OSS Distributions 
2578*33de042dSApple OSS Distributions 		kr = thread_policy_set_internal(th, THREAD_EXTENDED_POLICY,
2579*33de042dSApple OSS Distributions 		    (thread_policy_t)&extpol, THREAD_EXTENDED_POLICY_COUNT);
2580*33de042dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2581*33de042dSApple OSS Distributions 			fixedpri_rv = EINVAL;
2582*33de042dSApple OSS Distributions 			goto done;
2583*33de042dSApple OSS Distributions 		}
2584*33de042dSApple OSS Distributions 	}
2585*33de042dSApple OSS Distributions 
2586*33de042dSApple OSS Distributions done:
2587*33de042dSApple OSS Distributions 	if (qos_rv && voucher_rv) {
2588*33de042dSApple OSS Distributions 		/* Both failed, give that a unique error. */
2589*33de042dSApple OSS Distributions 		return EBADMSG;
2590*33de042dSApple OSS Distributions 	}
2591*33de042dSApple OSS Distributions 
2592*33de042dSApple OSS Distributions 	if (unbind_rv) {
2593*33de042dSApple OSS Distributions 		return unbind_rv;
2594*33de042dSApple OSS Distributions 	}
2595*33de042dSApple OSS Distributions 
2596*33de042dSApple OSS Distributions 	if (qos_rv) {
2597*33de042dSApple OSS Distributions 		return qos_rv;
2598*33de042dSApple OSS Distributions 	}
2599*33de042dSApple OSS Distributions 
2600*33de042dSApple OSS Distributions 	if (voucher_rv) {
2601*33de042dSApple OSS Distributions 		return voucher_rv;
2602*33de042dSApple OSS Distributions 	}
2603*33de042dSApple OSS Distributions 
2604*33de042dSApple OSS Distributions 	if (fixedpri_rv) {
2605*33de042dSApple OSS Distributions 		return fixedpri_rv;
2606*33de042dSApple OSS Distributions 	}
2607*33de042dSApple OSS Distributions 
2608*33de042dSApple OSS Distributions 
2609*33de042dSApple OSS Distributions 	return 0;
2610*33de042dSApple OSS Distributions }
2611*33de042dSApple OSS Distributions 
2612*33de042dSApple OSS Distributions static int
bsdthread_add_explicit_override(proc_t p,mach_port_name_t kport,pthread_priority_t pp,user_addr_t resource)2613*33de042dSApple OSS Distributions bsdthread_add_explicit_override(proc_t p, mach_port_name_t kport,
2614*33de042dSApple OSS Distributions     pthread_priority_t pp, user_addr_t resource)
2615*33de042dSApple OSS Distributions {
2616*33de042dSApple OSS Distributions 	thread_qos_t qos = _pthread_priority_thread_qos(pp);
2617*33de042dSApple OSS Distributions 	if (qos == THREAD_QOS_UNSPECIFIED) {
2618*33de042dSApple OSS Distributions 		return EINVAL;
2619*33de042dSApple OSS Distributions 	}
2620*33de042dSApple OSS Distributions 
2621*33de042dSApple OSS Distributions 	thread_t th = port_name_to_thread(kport,
2622*33de042dSApple OSS Distributions 	    PORT_INTRANS_THREAD_IN_CURRENT_TASK);
2623*33de042dSApple OSS Distributions 	if (th == THREAD_NULL) {
2624*33de042dSApple OSS Distributions 		return ESRCH;
2625*33de042dSApple OSS Distributions 	}
2626*33de042dSApple OSS Distributions 
2627*33de042dSApple OSS Distributions 	int rv = proc_thread_qos_add_override(proc_task(p), th, 0, qos, TRUE,
2628*33de042dSApple OSS Distributions 	    resource, THREAD_QOS_OVERRIDE_TYPE_PTHREAD_EXPLICIT_OVERRIDE);
2629*33de042dSApple OSS Distributions 
2630*33de042dSApple OSS Distributions 	thread_deallocate(th);
2631*33de042dSApple OSS Distributions 	return rv;
2632*33de042dSApple OSS Distributions }
2633*33de042dSApple OSS Distributions 
2634*33de042dSApple OSS Distributions static int
bsdthread_remove_explicit_override(proc_t p,mach_port_name_t kport,user_addr_t resource)2635*33de042dSApple OSS Distributions bsdthread_remove_explicit_override(proc_t p, mach_port_name_t kport,
2636*33de042dSApple OSS Distributions     user_addr_t resource)
2637*33de042dSApple OSS Distributions {
2638*33de042dSApple OSS Distributions 	thread_t th = port_name_to_thread(kport,
2639*33de042dSApple OSS Distributions 	    PORT_INTRANS_THREAD_IN_CURRENT_TASK);
2640*33de042dSApple OSS Distributions 	if (th == THREAD_NULL) {
2641*33de042dSApple OSS Distributions 		return ESRCH;
2642*33de042dSApple OSS Distributions 	}
2643*33de042dSApple OSS Distributions 
2644*33de042dSApple OSS Distributions 	int rv = proc_thread_qos_remove_override(proc_task(p), th, 0, resource,
2645*33de042dSApple OSS Distributions 	    THREAD_QOS_OVERRIDE_TYPE_PTHREAD_EXPLICIT_OVERRIDE);
2646*33de042dSApple OSS Distributions 
2647*33de042dSApple OSS Distributions 	thread_deallocate(th);
2648*33de042dSApple OSS Distributions 	return rv;
2649*33de042dSApple OSS Distributions }
2650*33de042dSApple OSS Distributions 
2651*33de042dSApple OSS Distributions static int
workq_thread_add_dispatch_override(proc_t p,mach_port_name_t kport,pthread_priority_t pp,user_addr_t ulock_addr)2652*33de042dSApple OSS Distributions workq_thread_add_dispatch_override(proc_t p, mach_port_name_t kport,
2653*33de042dSApple OSS Distributions     pthread_priority_t pp, user_addr_t ulock_addr)
2654*33de042dSApple OSS Distributions {
2655*33de042dSApple OSS Distributions 	struct uu_workq_policy old_pri, new_pri;
2656*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2657*33de042dSApple OSS Distributions 
2658*33de042dSApple OSS Distributions 	thread_qos_t qos_override = _pthread_priority_thread_qos(pp);
2659*33de042dSApple OSS Distributions 	if (qos_override == THREAD_QOS_UNSPECIFIED) {
2660*33de042dSApple OSS Distributions 		return EINVAL;
2661*33de042dSApple OSS Distributions 	}
2662*33de042dSApple OSS Distributions 
2663*33de042dSApple OSS Distributions 	thread_t thread = port_name_to_thread(kport,
2664*33de042dSApple OSS Distributions 	    PORT_INTRANS_THREAD_IN_CURRENT_TASK);
2665*33de042dSApple OSS Distributions 	if (thread == THREAD_NULL) {
2666*33de042dSApple OSS Distributions 		return ESRCH;
2667*33de042dSApple OSS Distributions 	}
2668*33de042dSApple OSS Distributions 
2669*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
2670*33de042dSApple OSS Distributions 	if ((thread_get_tag(thread) & THREAD_TAG_WORKQUEUE) == 0) {
2671*33de042dSApple OSS Distributions 		thread_deallocate(thread);
2672*33de042dSApple OSS Distributions 		return EPERM;
2673*33de042dSApple OSS Distributions 	}
2674*33de042dSApple OSS Distributions 
2675*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_override_dispatch | DBG_FUNC_NONE,
2676*33de042dSApple OSS Distributions 	    wq, thread_tid(thread), 1, pp);
2677*33de042dSApple OSS Distributions 
2678*33de042dSApple OSS Distributions 	thread_mtx_lock(thread);
2679*33de042dSApple OSS Distributions 
2680*33de042dSApple OSS Distributions 	if (ulock_addr) {
2681*33de042dSApple OSS Distributions 		uint32_t val;
2682*33de042dSApple OSS Distributions 		int rc;
2683*33de042dSApple OSS Distributions 		/*
2684*33de042dSApple OSS Distributions 		 * Workaround lack of explicit support for 'no-fault copyin'
2685*33de042dSApple OSS Distributions 		 * <rdar://problem/24999882>, as disabling preemption prevents paging in
2686*33de042dSApple OSS Distributions 		 */
2687*33de042dSApple OSS Distributions 		disable_preemption();
2688*33de042dSApple OSS Distributions 		rc = copyin_atomic32(ulock_addr, &val);
2689*33de042dSApple OSS Distributions 		enable_preemption();
2690*33de042dSApple OSS Distributions 		if (rc == 0 && ulock_owner_value_to_port_name(val) != kport) {
2691*33de042dSApple OSS Distributions 			goto out;
2692*33de042dSApple OSS Distributions 		}
2693*33de042dSApple OSS Distributions 	}
2694*33de042dSApple OSS Distributions 
2695*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
2696*33de042dSApple OSS Distributions 
2697*33de042dSApple OSS Distributions 	old_pri = uth->uu_workq_pri;
2698*33de042dSApple OSS Distributions 	if (old_pri.qos_override >= qos_override) {
2699*33de042dSApple OSS Distributions 		/* Nothing to do */
2700*33de042dSApple OSS Distributions 	} else if (thread == current_thread()) {
2701*33de042dSApple OSS Distributions 		new_pri = old_pri;
2702*33de042dSApple OSS Distributions 		new_pri.qos_override = qos_override;
2703*33de042dSApple OSS Distributions 		workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, false);
2704*33de042dSApple OSS Distributions 	} else {
2705*33de042dSApple OSS Distributions 		uth->uu_workq_pri.qos_override = qos_override;
2706*33de042dSApple OSS Distributions 		if (qos_override > workq_pri_override(old_pri)) {
2707*33de042dSApple OSS Distributions 			thread_set_workq_override(thread, qos_override);
2708*33de042dSApple OSS Distributions 		}
2709*33de042dSApple OSS Distributions 	}
2710*33de042dSApple OSS Distributions 
2711*33de042dSApple OSS Distributions 	workq_unlock(wq);
2712*33de042dSApple OSS Distributions 
2713*33de042dSApple OSS Distributions out:
2714*33de042dSApple OSS Distributions 	thread_mtx_unlock(thread);
2715*33de042dSApple OSS Distributions 	thread_deallocate(thread);
2716*33de042dSApple OSS Distributions 	return 0;
2717*33de042dSApple OSS Distributions }
2718*33de042dSApple OSS Distributions 
2719*33de042dSApple OSS Distributions static int
workq_thread_reset_dispatch_override(proc_t p,thread_t thread)2720*33de042dSApple OSS Distributions workq_thread_reset_dispatch_override(proc_t p, thread_t thread)
2721*33de042dSApple OSS Distributions {
2722*33de042dSApple OSS Distributions 	struct uu_workq_policy old_pri, new_pri;
2723*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2724*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
2725*33de042dSApple OSS Distributions 
2726*33de042dSApple OSS Distributions 	if ((thread_get_tag(thread) & THREAD_TAG_WORKQUEUE) == 0) {
2727*33de042dSApple OSS Distributions 		return EPERM;
2728*33de042dSApple OSS Distributions 	}
2729*33de042dSApple OSS Distributions 
2730*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_override_reset | DBG_FUNC_NONE, wq, 0, 0, 0);
2731*33de042dSApple OSS Distributions 
2732*33de042dSApple OSS Distributions 	/*
2733*33de042dSApple OSS Distributions 	 * workq_thread_add_dispatch_override takes the thread mutex before doing the
2734*33de042dSApple OSS Distributions 	 * copyin to validate the drainer and apply the override. We need to do the
2735*33de042dSApple OSS Distributions 	 * same here. See rdar://84472518
2736*33de042dSApple OSS Distributions 	 */
2737*33de042dSApple OSS Distributions 	thread_mtx_lock(thread);
2738*33de042dSApple OSS Distributions 
2739*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
2740*33de042dSApple OSS Distributions 	old_pri = new_pri = uth->uu_workq_pri;
2741*33de042dSApple OSS Distributions 	new_pri.qos_override = THREAD_QOS_UNSPECIFIED;
2742*33de042dSApple OSS Distributions 	workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, false);
2743*33de042dSApple OSS Distributions 	workq_unlock(wq);
2744*33de042dSApple OSS Distributions 
2745*33de042dSApple OSS Distributions 	thread_mtx_unlock(thread);
2746*33de042dSApple OSS Distributions 	return 0;
2747*33de042dSApple OSS Distributions }
2748*33de042dSApple OSS Distributions 
2749*33de042dSApple OSS Distributions static int
workq_thread_allow_kill(__unused proc_t p,thread_t thread,bool enable)2750*33de042dSApple OSS Distributions workq_thread_allow_kill(__unused proc_t p, thread_t thread, bool enable)
2751*33de042dSApple OSS Distributions {
2752*33de042dSApple OSS Distributions 	if (!(thread_get_tag(thread) & THREAD_TAG_WORKQUEUE)) {
2753*33de042dSApple OSS Distributions 		// If the thread isn't a workqueue thread, don't set the
2754*33de042dSApple OSS Distributions 		// kill_allowed bit; however, we still need to return 0
2755*33de042dSApple OSS Distributions 		// instead of an error code since this code is executed
2756*33de042dSApple OSS Distributions 		// on the abort path which needs to not depend on the
2757*33de042dSApple OSS Distributions 		// pthread_t (returning an error depends on pthread_t via
2758*33de042dSApple OSS Distributions 		// cerror_nocancel)
2759*33de042dSApple OSS Distributions 		return 0;
2760*33de042dSApple OSS Distributions 	}
2761*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
2762*33de042dSApple OSS Distributions 	uth->uu_workq_pthread_kill_allowed = enable;
2763*33de042dSApple OSS Distributions 	return 0;
2764*33de042dSApple OSS Distributions }
2765*33de042dSApple OSS Distributions 
2766*33de042dSApple OSS Distributions static int
workq_allow_sigmask(proc_t p,sigset_t mask)2767*33de042dSApple OSS Distributions workq_allow_sigmask(proc_t p, sigset_t mask)
2768*33de042dSApple OSS Distributions {
2769*33de042dSApple OSS Distributions 	if (mask & workq_threadmask) {
2770*33de042dSApple OSS Distributions 		return EINVAL;
2771*33de042dSApple OSS Distributions 	}
2772*33de042dSApple OSS Distributions 
2773*33de042dSApple OSS Distributions 	proc_lock(p);
2774*33de042dSApple OSS Distributions 	p->p_workq_allow_sigmask |= mask;
2775*33de042dSApple OSS Distributions 	proc_unlock(p);
2776*33de042dSApple OSS Distributions 
2777*33de042dSApple OSS Distributions 	return 0;
2778*33de042dSApple OSS Distributions }
2779*33de042dSApple OSS Distributions 
2780*33de042dSApple OSS Distributions static int
bsdthread_get_max_parallelism(thread_qos_t qos,unsigned long flags,int * retval)2781*33de042dSApple OSS Distributions bsdthread_get_max_parallelism(thread_qos_t qos, unsigned long flags,
2782*33de042dSApple OSS Distributions     int *retval)
2783*33de042dSApple OSS Distributions {
2784*33de042dSApple OSS Distributions 	static_assert(QOS_PARALLELISM_COUNT_LOGICAL ==
2785*33de042dSApple OSS Distributions 	    _PTHREAD_QOS_PARALLELISM_COUNT_LOGICAL, "logical");
2786*33de042dSApple OSS Distributions 	static_assert(QOS_PARALLELISM_REALTIME ==
2787*33de042dSApple OSS Distributions 	    _PTHREAD_QOS_PARALLELISM_REALTIME, "realtime");
2788*33de042dSApple OSS Distributions 	static_assert(QOS_PARALLELISM_CLUSTER_SHARED_RESOURCE ==
2789*33de042dSApple OSS Distributions 	    _PTHREAD_QOS_PARALLELISM_CLUSTER_SHARED_RSRC, "cluster shared resource");
2790*33de042dSApple OSS Distributions 
2791*33de042dSApple OSS Distributions 	if (flags & ~(QOS_PARALLELISM_REALTIME | QOS_PARALLELISM_COUNT_LOGICAL | QOS_PARALLELISM_CLUSTER_SHARED_RESOURCE)) {
2792*33de042dSApple OSS Distributions 		return EINVAL;
2793*33de042dSApple OSS Distributions 	}
2794*33de042dSApple OSS Distributions 
2795*33de042dSApple OSS Distributions 	/* No units are present */
2796*33de042dSApple OSS Distributions 	if (flags & QOS_PARALLELISM_CLUSTER_SHARED_RESOURCE) {
2797*33de042dSApple OSS Distributions 		return ENOTSUP;
2798*33de042dSApple OSS Distributions 	}
2799*33de042dSApple OSS Distributions 
2800*33de042dSApple OSS Distributions 	if (flags & QOS_PARALLELISM_REALTIME) {
2801*33de042dSApple OSS Distributions 		if (qos) {
2802*33de042dSApple OSS Distributions 			return EINVAL;
2803*33de042dSApple OSS Distributions 		}
2804*33de042dSApple OSS Distributions 	} else if (qos == THREAD_QOS_UNSPECIFIED || qos >= THREAD_QOS_LAST) {
2805*33de042dSApple OSS Distributions 		return EINVAL;
2806*33de042dSApple OSS Distributions 	}
2807*33de042dSApple OSS Distributions 
2808*33de042dSApple OSS Distributions 	*retval = qos_max_parallelism(qos, flags);
2809*33de042dSApple OSS Distributions 	return 0;
2810*33de042dSApple OSS Distributions }
2811*33de042dSApple OSS Distributions 
2812*33de042dSApple OSS Distributions static int
bsdthread_dispatch_apply_attr(__unused struct proc * p,thread_t thread,unsigned long flags,uint64_t value1,__unused uint64_t value2)2813*33de042dSApple OSS Distributions bsdthread_dispatch_apply_attr(__unused struct proc *p, thread_t thread,
2814*33de042dSApple OSS Distributions     unsigned long flags, uint64_t value1, __unused uint64_t value2)
2815*33de042dSApple OSS Distributions {
2816*33de042dSApple OSS Distributions 	uint32_t apply_worker_index;
2817*33de042dSApple OSS Distributions 	kern_return_t kr;
2818*33de042dSApple OSS Distributions 
2819*33de042dSApple OSS Distributions 	switch (flags) {
2820*33de042dSApple OSS Distributions 	case _PTHREAD_DISPATCH_APPLY_ATTR_CLUSTER_SHARED_RSRC_SET:
2821*33de042dSApple OSS Distributions 		apply_worker_index = (uint32_t)value1;
2822*33de042dSApple OSS Distributions 		kr = thread_shared_rsrc_policy_set(thread, apply_worker_index, CLUSTER_SHARED_RSRC_TYPE_RR, SHARED_RSRC_POLICY_AGENT_DISPATCH);
2823*33de042dSApple OSS Distributions 		/*
2824*33de042dSApple OSS Distributions 		 * KERN_INVALID_POLICY indicates that the thread was trying to bind to a
2825*33de042dSApple OSS Distributions 		 * cluster which it was not eligible to execute on.
2826*33de042dSApple OSS Distributions 		 */
2827*33de042dSApple OSS Distributions 		return (kr == KERN_SUCCESS) ? 0 : ((kr == KERN_INVALID_POLICY) ? ENOTSUP : EINVAL);
2828*33de042dSApple OSS Distributions 	case _PTHREAD_DISPATCH_APPLY_ATTR_CLUSTER_SHARED_RSRC_CLEAR:
2829*33de042dSApple OSS Distributions 		kr = thread_shared_rsrc_policy_clear(thread, CLUSTER_SHARED_RSRC_TYPE_RR, SHARED_RSRC_POLICY_AGENT_DISPATCH);
2830*33de042dSApple OSS Distributions 		return (kr == KERN_SUCCESS) ? 0 : EINVAL;
2831*33de042dSApple OSS Distributions 	default:
2832*33de042dSApple OSS Distributions 		return EINVAL;
2833*33de042dSApple OSS Distributions 	}
2834*33de042dSApple OSS Distributions }
2835*33de042dSApple OSS Distributions 
/*
 * Make the *enclosing function* return EINVAL when `arg` is non-zero.
 * Used to reject syscall arguments that the selected command does not
 * consume.  Only usable inside functions that return an errno-style int.
 */
#define ENSURE_UNUSED(arg) \
	        ({ if (0 != (arg)) { return EINVAL; } })
2838*33de042dSApple OSS Distributions 
2839*33de042dSApple OSS Distributions int
bsdthread_ctl(struct proc * p,struct bsdthread_ctl_args * uap,int * retval)2840*33de042dSApple OSS Distributions bsdthread_ctl(struct proc *p, struct bsdthread_ctl_args *uap, int *retval)
2841*33de042dSApple OSS Distributions {
2842*33de042dSApple OSS Distributions 	switch (uap->cmd) {
2843*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_START:
2844*33de042dSApple OSS Distributions 		return bsdthread_add_explicit_override(p, (mach_port_name_t)uap->arg1,
2845*33de042dSApple OSS Distributions 		           (pthread_priority_t)uap->arg2, uap->arg3);
2846*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_END:
2847*33de042dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg3);
2848*33de042dSApple OSS Distributions 		return bsdthread_remove_explicit_override(p, (mach_port_name_t)uap->arg1,
2849*33de042dSApple OSS Distributions 		           (user_addr_t)uap->arg2);
2850*33de042dSApple OSS Distributions 
2851*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_DISPATCH:
2852*33de042dSApple OSS Distributions 		return workq_thread_add_dispatch_override(p, (mach_port_name_t)uap->arg1,
2853*33de042dSApple OSS Distributions 		           (pthread_priority_t)uap->arg2, uap->arg3);
2854*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_RESET:
2855*33de042dSApple OSS Distributions 		return workq_thread_reset_dispatch_override(p, current_thread());
2856*33de042dSApple OSS Distributions 
2857*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_SET_SELF:
2858*33de042dSApple OSS Distributions 		return bsdthread_set_self(p, current_thread(),
2859*33de042dSApple OSS Distributions 		           (pthread_priority_t)uap->arg1, (mach_port_name_t)uap->arg2,
2860*33de042dSApple OSS Distributions 		           (enum workq_set_self_flags)uap->arg3);
2861*33de042dSApple OSS Distributions 
2862*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_MAX_PARALLELISM:
2863*33de042dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg3);
2864*33de042dSApple OSS Distributions 		return bsdthread_get_max_parallelism((thread_qos_t)uap->arg1,
2865*33de042dSApple OSS Distributions 		           (unsigned long)uap->arg2, retval);
2866*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_WORKQ_ALLOW_KILL:
2867*33de042dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg2);
2868*33de042dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg3);
2869*33de042dSApple OSS Distributions 		return workq_thread_allow_kill(p, current_thread(), (bool)uap->arg1);
2870*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_DISPATCH_APPLY_ATTR:
2871*33de042dSApple OSS Distributions 		return bsdthread_dispatch_apply_attr(p, current_thread(),
2872*33de042dSApple OSS Distributions 		           (unsigned long)uap->arg1, (uint64_t)uap->arg2,
2873*33de042dSApple OSS Distributions 		           (uint64_t)uap->arg3);
2874*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_WORKQ_ALLOW_SIGMASK:
2875*33de042dSApple OSS Distributions 		return workq_allow_sigmask(p, (int)uap->arg1);
2876*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_SET_QOS:
2877*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_DISPATCH_ASYNCHRONOUS_OVERRIDE_ADD:
2878*33de042dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_DISPATCH_ASYNCHRONOUS_OVERRIDE_RESET:
2879*33de042dSApple OSS Distributions 		/* no longer supported */
2880*33de042dSApple OSS Distributions 		return ENOTSUP;
2881*33de042dSApple OSS Distributions 
2882*33de042dSApple OSS Distributions 	default:
2883*33de042dSApple OSS Distributions 		return EINVAL;
2884*33de042dSApple OSS Distributions 	}
2885*33de042dSApple OSS Distributions }
2886*33de042dSApple OSS Distributions 
2887*33de042dSApple OSS Distributions #pragma mark workqueue thread manipulation
2888*33de042dSApple OSS Distributions 
2889*33de042dSApple OSS Distributions static void __dead2
2890*33de042dSApple OSS Distributions workq_unpark_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
2891*33de042dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags);
2892*33de042dSApple OSS Distributions 
2893*33de042dSApple OSS Distributions static void __dead2
2894*33de042dSApple OSS Distributions workq_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
2895*33de042dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags);
2896*33de042dSApple OSS Distributions 
2897*33de042dSApple OSS Distributions static void workq_setup_and_run(proc_t p, struct uthread *uth, int flags) __dead2;
2898*33de042dSApple OSS Distributions 
2899*33de042dSApple OSS Distributions #if KDEBUG_LEVEL >= KDEBUG_LEVEL_STANDARD
2900*33de042dSApple OSS Distributions static inline uint64_t
workq_trace_req_id(workq_threadreq_t req)2901*33de042dSApple OSS Distributions workq_trace_req_id(workq_threadreq_t req)
2902*33de042dSApple OSS Distributions {
2903*33de042dSApple OSS Distributions 	struct kqworkloop *kqwl;
2904*33de042dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
2905*33de042dSApple OSS Distributions 		kqwl = __container_of(req, struct kqworkloop, kqwl_request);
2906*33de042dSApple OSS Distributions 		return kqwl->kqwl_dynamicid;
2907*33de042dSApple OSS Distributions 	}
2908*33de042dSApple OSS Distributions 
2909*33de042dSApple OSS Distributions 	return VM_KERNEL_ADDRHIDE(req);
2910*33de042dSApple OSS Distributions }
2911*33de042dSApple OSS Distributions #endif
2912*33de042dSApple OSS Distributions 
2913*33de042dSApple OSS Distributions /**
2914*33de042dSApple OSS Distributions  * Entry point for libdispatch to ask for threads
2915*33de042dSApple OSS Distributions  */
2916*33de042dSApple OSS Distributions static int
workq_reqthreads(struct proc * p,uint32_t reqcount,pthread_priority_t pp,bool cooperative)2917*33de042dSApple OSS Distributions workq_reqthreads(struct proc *p, uint32_t reqcount, pthread_priority_t pp, bool cooperative)
2918*33de042dSApple OSS Distributions {
2919*33de042dSApple OSS Distributions 	thread_qos_t qos = _pthread_priority_thread_qos(pp);
2920*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2921*33de042dSApple OSS Distributions 	uint32_t unpaced, upcall_flags = WQ_FLAG_THREAD_NEWSPI;
2922*33de042dSApple OSS Distributions 	int ret = 0;
2923*33de042dSApple OSS Distributions 
2924*33de042dSApple OSS Distributions 	if (wq == NULL || reqcount <= 0 || reqcount > UINT16_MAX ||
2925*33de042dSApple OSS Distributions 	    qos == THREAD_QOS_UNSPECIFIED) {
2926*33de042dSApple OSS Distributions 		ret = EINVAL;
2927*33de042dSApple OSS Distributions 		goto exit;
2928*33de042dSApple OSS Distributions 	}
2929*33de042dSApple OSS Distributions 
2930*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_wqops_reqthreads | DBG_FUNC_NONE,
2931*33de042dSApple OSS Distributions 	    wq, reqcount, pp, cooperative);
2932*33de042dSApple OSS Distributions 
2933*33de042dSApple OSS Distributions 	workq_threadreq_t req = zalloc(workq_zone_threadreq);
2934*33de042dSApple OSS Distributions 	priority_queue_entry_init(&req->tr_entry);
2935*33de042dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_NEW;
2936*33de042dSApple OSS Distributions 	req->tr_qos   = qos;
2937*33de042dSApple OSS Distributions 	workq_tr_flags_t tr_flags = 0;
2938*33de042dSApple OSS Distributions 
2939*33de042dSApple OSS Distributions 	if (pp & _PTHREAD_PRIORITY_OVERCOMMIT_FLAG) {
2940*33de042dSApple OSS Distributions 		tr_flags |= WORKQ_TR_FLAG_OVERCOMMIT;
2941*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
2942*33de042dSApple OSS Distributions 	}
2943*33de042dSApple OSS Distributions 
2944*33de042dSApple OSS Distributions 	if (cooperative) {
2945*33de042dSApple OSS Distributions 		tr_flags |= WORKQ_TR_FLAG_COOPERATIVE;
2946*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_COOPERATIVE;
2947*33de042dSApple OSS Distributions 
2948*33de042dSApple OSS Distributions 		if (reqcount > 1) {
2949*33de042dSApple OSS Distributions 			ret = ENOTSUP;
2950*33de042dSApple OSS Distributions 			goto free_and_exit;
2951*33de042dSApple OSS Distributions 		}
2952*33de042dSApple OSS Distributions 	}
2953*33de042dSApple OSS Distributions 
2954*33de042dSApple OSS Distributions 	/* A thread request cannot be both overcommit and cooperative */
2955*33de042dSApple OSS Distributions 	if (workq_tr_is_cooperative(tr_flags) &&
2956*33de042dSApple OSS Distributions 	    workq_tr_is_overcommit(tr_flags)) {
2957*33de042dSApple OSS Distributions 		ret = EINVAL;
2958*33de042dSApple OSS Distributions 		goto free_and_exit;
2959*33de042dSApple OSS Distributions 	}
2960*33de042dSApple OSS Distributions 	req->tr_flags = tr_flags;
2961*33de042dSApple OSS Distributions 
2962*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_request_initiate | DBG_FUNC_NONE,
2963*33de042dSApple OSS Distributions 	    wq, workq_trace_req_id(req), req->tr_qos, reqcount);
2964*33de042dSApple OSS Distributions 
2965*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
2966*33de042dSApple OSS Distributions 	do {
2967*33de042dSApple OSS Distributions 		if (_wq_exiting(wq)) {
2968*33de042dSApple OSS Distributions 			goto unlock_and_exit;
2969*33de042dSApple OSS Distributions 		}
2970*33de042dSApple OSS Distributions 
2971*33de042dSApple OSS Distributions 		/*
2972*33de042dSApple OSS Distributions 		 * When userspace is asking for parallelism, wakeup up to (reqcount - 1)
2973*33de042dSApple OSS Distributions 		 * threads without pacing, to inform the scheduler of that workload.
2974*33de042dSApple OSS Distributions 		 *
2975*33de042dSApple OSS Distributions 		 * The last requests, or the ones that failed the admission checks are
2976*33de042dSApple OSS Distributions 		 * enqueued and go through the regular creator codepath.
2977*33de042dSApple OSS Distributions 		 *
2978*33de042dSApple OSS Distributions 		 * If there aren't enough threads, add one, but re-evaluate everything
2979*33de042dSApple OSS Distributions 		 * as conditions may now have changed.
2980*33de042dSApple OSS Distributions 		 */
2981*33de042dSApple OSS Distributions 		unpaced = reqcount - 1;
2982*33de042dSApple OSS Distributions 
2983*33de042dSApple OSS Distributions 		if (reqcount > 1) {
2984*33de042dSApple OSS Distributions 			/* We don't handle asking for parallelism on the cooperative
2985*33de042dSApple OSS Distributions 			 * workqueue just yet */
2986*33de042dSApple OSS Distributions 			assert(!workq_threadreq_is_cooperative(req));
2987*33de042dSApple OSS Distributions 
2988*33de042dSApple OSS Distributions 			if (workq_threadreq_is_nonovercommit(req)) {
2989*33de042dSApple OSS Distributions 				unpaced = workq_constrained_allowance(wq, qos, NULL, false, true);
2990*33de042dSApple OSS Distributions 				if (unpaced >= reqcount - 1) {
2991*33de042dSApple OSS Distributions 					unpaced = reqcount - 1;
2992*33de042dSApple OSS Distributions 				}
2993*33de042dSApple OSS Distributions 			}
2994*33de042dSApple OSS Distributions 		}
2995*33de042dSApple OSS Distributions 
2996*33de042dSApple OSS Distributions 		/*
2997*33de042dSApple OSS Distributions 		 * This path does not currently handle custom workloop parameters
2998*33de042dSApple OSS Distributions 		 * when creating threads for parallelism.
2999*33de042dSApple OSS Distributions 		 */
3000*33de042dSApple OSS Distributions 		assert(!(req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS));
3001*33de042dSApple OSS Distributions 
3002*33de042dSApple OSS Distributions 		/*
3003*33de042dSApple OSS Distributions 		 * This is a trimmed down version of workq_threadreq_bind_and_unlock()
3004*33de042dSApple OSS Distributions 		 */
3005*33de042dSApple OSS Distributions 		while (unpaced > 0 && wq->wq_thidlecount) {
3006*33de042dSApple OSS Distributions 			struct uthread *uth;
3007*33de042dSApple OSS Distributions 			bool needs_wakeup;
3008*33de042dSApple OSS Distributions 			uint8_t uu_flags = UT_WORKQ_EARLY_BOUND;
3009*33de042dSApple OSS Distributions 
3010*33de042dSApple OSS Distributions 			if (workq_tr_is_overcommit(req->tr_flags)) {
3011*33de042dSApple OSS Distributions 				uu_flags |= UT_WORKQ_OVERCOMMIT;
3012*33de042dSApple OSS Distributions 			}
3013*33de042dSApple OSS Distributions 
3014*33de042dSApple OSS Distributions 			uth = workq_pop_idle_thread(wq, uu_flags, &needs_wakeup);
3015*33de042dSApple OSS Distributions 
3016*33de042dSApple OSS Distributions 			_wq_thactive_inc(wq, qos);
3017*33de042dSApple OSS Distributions 			wq->wq_thscheduled_count[_wq_bucket(qos)]++;
3018*33de042dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
3019*33de042dSApple OSS Distributions 			wq->wq_fulfilled++;
3020*33de042dSApple OSS Distributions 
3021*33de042dSApple OSS Distributions 			uth->uu_save.uus_workq_park_data.upcall_flags = upcall_flags;
3022*33de042dSApple OSS Distributions 			uth->uu_save.uus_workq_park_data.thread_request = req;
3023*33de042dSApple OSS Distributions 			if (needs_wakeup) {
3024*33de042dSApple OSS Distributions 				workq_thread_wakeup(uth);
3025*33de042dSApple OSS Distributions 			}
3026*33de042dSApple OSS Distributions 			unpaced--;
3027*33de042dSApple OSS Distributions 			reqcount--;
3028*33de042dSApple OSS Distributions 		}
3029*33de042dSApple OSS Distributions 	} while (unpaced && wq->wq_nthreads < wq_max_threads &&
3030*33de042dSApple OSS Distributions 	    (workq_add_new_idle_thread(p, wq, workq_unpark_continue,
3031*33de042dSApple OSS Distributions 	    false, NULL) == KERN_SUCCESS));
3032*33de042dSApple OSS Distributions 
3033*33de042dSApple OSS Distributions 	if (_wq_exiting(wq)) {
3034*33de042dSApple OSS Distributions 		goto unlock_and_exit;
3035*33de042dSApple OSS Distributions 	}
3036*33de042dSApple OSS Distributions 
3037*33de042dSApple OSS Distributions 	req->tr_count = (uint16_t)reqcount;
3038*33de042dSApple OSS Distributions 	if (workq_threadreq_enqueue(wq, req)) {
3039*33de042dSApple OSS Distributions 		/* This can drop the workqueue lock, and take it again */
3040*33de042dSApple OSS Distributions 		workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
3041*33de042dSApple OSS Distributions 	}
3042*33de042dSApple OSS Distributions 	workq_unlock(wq);
3043*33de042dSApple OSS Distributions 	return 0;
3044*33de042dSApple OSS Distributions 
3045*33de042dSApple OSS Distributions unlock_and_exit:
3046*33de042dSApple OSS Distributions 	workq_unlock(wq);
3047*33de042dSApple OSS Distributions free_and_exit:
3048*33de042dSApple OSS Distributions 	zfree(workq_zone_threadreq, req);
3049*33de042dSApple OSS Distributions exit:
3050*33de042dSApple OSS Distributions 	return ret;
3051*33de042dSApple OSS Distributions }
3052*33de042dSApple OSS Distributions 
3053*33de042dSApple OSS Distributions bool
workq_kern_threadreq_initiate(struct proc * p,workq_threadreq_t req,struct turnstile * workloop_ts,thread_qos_t qos,workq_kern_threadreq_flags_t flags)3054*33de042dSApple OSS Distributions workq_kern_threadreq_initiate(struct proc *p, workq_threadreq_t req,
3055*33de042dSApple OSS Distributions     struct turnstile *workloop_ts, thread_qos_t qos,
3056*33de042dSApple OSS Distributions     workq_kern_threadreq_flags_t flags)
3057*33de042dSApple OSS Distributions {
3058*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3059*33de042dSApple OSS Distributions 	struct uthread *uth = NULL;
3060*33de042dSApple OSS Distributions 
3061*33de042dSApple OSS Distributions 	assert(req->tr_flags & (WORKQ_TR_FLAG_WORKLOOP | WORKQ_TR_FLAG_KEVENT));
3062*33de042dSApple OSS Distributions 
3063*33de042dSApple OSS Distributions 	/*
3064*33de042dSApple OSS Distributions 	 * For any new initialization changes done to workqueue thread request below,
3065*33de042dSApple OSS Distributions 	 * please also consider if they are relevant to permanently bound thread
3066*33de042dSApple OSS Distributions 	 * request. See workq_kern_threadreq_permanent_bind.
3067*33de042dSApple OSS Distributions 	 */
3068*33de042dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3069*33de042dSApple OSS Distributions 		workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(req);
3070*33de042dSApple OSS Distributions 		qos = thread_workq_qos_for_pri(trp.trp_pri);
3071*33de042dSApple OSS Distributions 		if (qos == THREAD_QOS_UNSPECIFIED) {
3072*33de042dSApple OSS Distributions 			qos = WORKQ_THREAD_QOS_ABOVEUI;
3073*33de042dSApple OSS Distributions 		}
3074*33de042dSApple OSS Distributions 	}
3075*33de042dSApple OSS Distributions 
3076*33de042dSApple OSS Distributions 	assert(req->tr_state == WORKQ_TR_STATE_IDLE);
3077*33de042dSApple OSS Distributions 	priority_queue_entry_init(&req->tr_entry);
3078*33de042dSApple OSS Distributions 	req->tr_count = 1;
3079*33de042dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_NEW;
3080*33de042dSApple OSS Distributions 	req->tr_qos   = qos;
3081*33de042dSApple OSS Distributions 
3082*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_request_initiate | DBG_FUNC_NONE, wq,
3083*33de042dSApple OSS Distributions 	    workq_trace_req_id(req), qos, 1);
3084*33de042dSApple OSS Distributions 
3085*33de042dSApple OSS Distributions 	if (flags & WORKQ_THREADREQ_ATTEMPT_REBIND) {
3086*33de042dSApple OSS Distributions 		/*
3087*33de042dSApple OSS Distributions 		 * we're called back synchronously from the context of
3088*33de042dSApple OSS Distributions 		 * kqueue_threadreq_unbind from within workq_thread_return()
3089*33de042dSApple OSS Distributions 		 * we can try to match up this thread with this request !
3090*33de042dSApple OSS Distributions 		 */
3091*33de042dSApple OSS Distributions 		uth = current_uthread();
3092*33de042dSApple OSS Distributions 		assert(uth->uu_kqr_bound == NULL);
3093*33de042dSApple OSS Distributions 	}
3094*33de042dSApple OSS Distributions 
3095*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
3096*33de042dSApple OSS Distributions 	if (_wq_exiting(wq)) {
3097*33de042dSApple OSS Distributions 		req->tr_state = WORKQ_TR_STATE_IDLE;
3098*33de042dSApple OSS Distributions 		workq_unlock(wq);
3099*33de042dSApple OSS Distributions 		return false;
3100*33de042dSApple OSS Distributions 	}
3101*33de042dSApple OSS Distributions 
3102*33de042dSApple OSS Distributions 	if (uth && workq_threadreq_admissible(wq, uth, req)) {
3103*33de042dSApple OSS Distributions 		/* This is the case of the rebind - we were about to park and unbind
3104*33de042dSApple OSS Distributions 		 * when more events came so keep the binding.
3105*33de042dSApple OSS Distributions 		 */
3106*33de042dSApple OSS Distributions 		assert(uth != wq->wq_creator);
3107*33de042dSApple OSS Distributions 
3108*33de042dSApple OSS Distributions 		if (uth->uu_workq_pri.qos_bucket != req->tr_qos) {
3109*33de042dSApple OSS Distributions 			_wq_thactive_move(wq, uth->uu_workq_pri.qos_bucket, req->tr_qos);
3110*33de042dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, req, /*unpark*/ false);
3111*33de042dSApple OSS Distributions 		}
3112*33de042dSApple OSS Distributions 		/*
3113*33de042dSApple OSS Distributions 		 * We're called from workq_kern_threadreq_initiate()
3114*33de042dSApple OSS Distributions 		 * due to an unbind, with the kq req held.
3115*33de042dSApple OSS Distributions 		 */
3116*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_START, wq,
3117*33de042dSApple OSS Distributions 		    workq_trace_req_id(req), req->tr_flags, 0);
3118*33de042dSApple OSS Distributions 		wq->wq_fulfilled++;
3119*33de042dSApple OSS Distributions 
3120*33de042dSApple OSS Distributions 		kqueue_threadreq_bind(p, req, get_machthread(uth), 0);
3121*33de042dSApple OSS Distributions 	} else {
3122*33de042dSApple OSS Distributions 		if (workloop_ts) {
3123*33de042dSApple OSS Distributions 			workq_perform_turnstile_operation_locked(wq, ^{
3124*33de042dSApple OSS Distributions 				turnstile_update_inheritor(workloop_ts, wq->wq_turnstile,
3125*33de042dSApple OSS Distributions 				TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_TURNSTILE);
3126*33de042dSApple OSS Distributions 				turnstile_update_inheritor_complete(workloop_ts,
3127*33de042dSApple OSS Distributions 				TURNSTILE_INTERLOCK_HELD);
3128*33de042dSApple OSS Distributions 			});
3129*33de042dSApple OSS Distributions 		}
3130*33de042dSApple OSS Distributions 
3131*33de042dSApple OSS Distributions 		bool reevaluate_creator_thread_group = false;
3132*33de042dSApple OSS Distributions #if CONFIG_PREADOPT_TG
3133*33de042dSApple OSS Distributions 		reevaluate_creator_thread_group = (flags & WORKQ_THREADREQ_REEVALUATE_PREADOPT_TG);
3134*33de042dSApple OSS Distributions #endif
3135*33de042dSApple OSS Distributions 		/* We enqueued the highest priority item or we may need to reevaluate if
3136*33de042dSApple OSS Distributions 		 * the creator needs a thread group pre-adoption */
3137*33de042dSApple OSS Distributions 		if (workq_threadreq_enqueue(wq, req) || reevaluate_creator_thread_group) {
3138*33de042dSApple OSS Distributions 			workq_schedule_creator(p, wq, flags);
3139*33de042dSApple OSS Distributions 		}
3140*33de042dSApple OSS Distributions 	}
3141*33de042dSApple OSS Distributions 
3142*33de042dSApple OSS Distributions 	workq_unlock(wq);
3143*33de042dSApple OSS Distributions 
3144*33de042dSApple OSS Distributions 	return true;
3145*33de042dSApple OSS Distributions }
3146*33de042dSApple OSS Distributions 
3147*33de042dSApple OSS Distributions void
workq_kern_threadreq_modify(struct proc * p,workq_threadreq_t req,thread_qos_t qos,workq_kern_threadreq_flags_t flags)3148*33de042dSApple OSS Distributions workq_kern_threadreq_modify(struct proc *p, workq_threadreq_t req,
3149*33de042dSApple OSS Distributions     thread_qos_t qos, workq_kern_threadreq_flags_t flags)
3150*33de042dSApple OSS Distributions {
3151*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3152*33de042dSApple OSS Distributions 	bool make_overcommit = false;
3153*33de042dSApple OSS Distributions 
3154*33de042dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3155*33de042dSApple OSS Distributions 		/* Requests outside-of-QoS shouldn't accept modify operations */
3156*33de042dSApple OSS Distributions 		return;
3157*33de042dSApple OSS Distributions 	}
3158*33de042dSApple OSS Distributions 
3159*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
3160*33de042dSApple OSS Distributions 
3161*33de042dSApple OSS Distributions 	assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
3162*33de042dSApple OSS Distributions 	assert(req->tr_flags & (WORKQ_TR_FLAG_KEVENT | WORKQ_TR_FLAG_WORKLOOP));
3163*33de042dSApple OSS Distributions 
3164*33de042dSApple OSS Distributions 	if (req->tr_state == WORKQ_TR_STATE_BINDING) {
3165*33de042dSApple OSS Distributions 		kqueue_threadreq_bind(p, req, req->tr_thread, 0);
3166*33de042dSApple OSS Distributions 		workq_unlock(wq);
3167*33de042dSApple OSS Distributions 		return;
3168*33de042dSApple OSS Distributions 	}
3169*33de042dSApple OSS Distributions 
3170*33de042dSApple OSS Distributions 	if (flags & WORKQ_THREADREQ_MAKE_OVERCOMMIT) {
3171*33de042dSApple OSS Distributions 		/* TODO (rokhinip): We come into this code path for kqwl thread
3172*33de042dSApple OSS Distributions 		 * requests. kqwl requests cannot be cooperative.
3173*33de042dSApple OSS Distributions 		 */
3174*33de042dSApple OSS Distributions 		assert(!workq_threadreq_is_cooperative(req));
3175*33de042dSApple OSS Distributions 
3176*33de042dSApple OSS Distributions 		make_overcommit = workq_threadreq_is_nonovercommit(req);
3177*33de042dSApple OSS Distributions 	}
3178*33de042dSApple OSS Distributions 
3179*33de042dSApple OSS Distributions 	if (_wq_exiting(wq) || (req->tr_qos == qos && !make_overcommit)) {
3180*33de042dSApple OSS Distributions 		workq_unlock(wq);
3181*33de042dSApple OSS Distributions 		return;
3182*33de042dSApple OSS Distributions 	}
3183*33de042dSApple OSS Distributions 
3184*33de042dSApple OSS Distributions 	assert(req->tr_count == 1);
3185*33de042dSApple OSS Distributions 	if (req->tr_state != WORKQ_TR_STATE_QUEUED) {
3186*33de042dSApple OSS Distributions 		panic("Invalid thread request (%p) state %d", req, req->tr_state);
3187*33de042dSApple OSS Distributions 	}
3188*33de042dSApple OSS Distributions 
3189*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_request_modify | DBG_FUNC_NONE, wq,
3190*33de042dSApple OSS Distributions 	    workq_trace_req_id(req), qos, 0);
3191*33de042dSApple OSS Distributions 
3192*33de042dSApple OSS Distributions 	struct priority_queue_sched_max *pq = workq_priority_queue_for_req(wq, req);
3193*33de042dSApple OSS Distributions 	workq_threadreq_t req_max;
3194*33de042dSApple OSS Distributions 
3195*33de042dSApple OSS Distributions 	/*
3196*33de042dSApple OSS Distributions 	 * Stage 1: Dequeue the request from its priority queue.
3197*33de042dSApple OSS Distributions 	 *
3198*33de042dSApple OSS Distributions 	 * If we dequeue the root item of the constrained priority queue,
3199*33de042dSApple OSS Distributions 	 * maintain the best constrained request qos invariant.
3200*33de042dSApple OSS Distributions 	 */
3201*33de042dSApple OSS Distributions 	if (priority_queue_remove(pq, &req->tr_entry)) {
3202*33de042dSApple OSS Distributions 		if (workq_threadreq_is_nonovercommit(req)) {
3203*33de042dSApple OSS Distributions 			_wq_thactive_refresh_best_constrained_req_qos(wq);
3204*33de042dSApple OSS Distributions 		}
3205*33de042dSApple OSS Distributions 	}
3206*33de042dSApple OSS Distributions 
3207*33de042dSApple OSS Distributions 	/*
3208*33de042dSApple OSS Distributions 	 * Stage 2: Apply changes to the thread request
3209*33de042dSApple OSS Distributions 	 *
3210*33de042dSApple OSS Distributions 	 * If the item will not become the root of the priority queue it belongs to,
3211*33de042dSApple OSS Distributions 	 * then we need to wait in line, just enqueue and return quickly.
3212*33de042dSApple OSS Distributions 	 */
3213*33de042dSApple OSS Distributions 	if (__improbable(make_overcommit)) {
3214*33de042dSApple OSS Distributions 		req->tr_flags ^= WORKQ_TR_FLAG_OVERCOMMIT;
3215*33de042dSApple OSS Distributions 		pq = workq_priority_queue_for_req(wq, req);
3216*33de042dSApple OSS Distributions 	}
3217*33de042dSApple OSS Distributions 	req->tr_qos = qos;
3218*33de042dSApple OSS Distributions 
3219*33de042dSApple OSS Distributions 	req_max = priority_queue_max(pq, struct workq_threadreq_s, tr_entry);
3220*33de042dSApple OSS Distributions 	if (req_max && req_max->tr_qos >= qos) {
3221*33de042dSApple OSS Distributions 		priority_queue_entry_set_sched_pri(pq, &req->tr_entry,
3222*33de042dSApple OSS Distributions 		    workq_priority_for_req(req), false);
3223*33de042dSApple OSS Distributions 		priority_queue_insert(pq, &req->tr_entry);
3224*33de042dSApple OSS Distributions 		workq_unlock(wq);
3225*33de042dSApple OSS Distributions 		return;
3226*33de042dSApple OSS Distributions 	}
3227*33de042dSApple OSS Distributions 
3228*33de042dSApple OSS Distributions 	/*
3229*33de042dSApple OSS Distributions 	 * Stage 3: Reevaluate whether we should run the thread request.
3230*33de042dSApple OSS Distributions 	 *
3231*33de042dSApple OSS Distributions 	 * Pretend the thread request is new again:
3232*33de042dSApple OSS Distributions 	 * - adjust wq_reqcount to not count it anymore.
3233*33de042dSApple OSS Distributions 	 * - make its state WORKQ_TR_STATE_NEW (so that workq_threadreq_bind_and_unlock
3234*33de042dSApple OSS Distributions 	 *   properly attempts a synchronous bind)
3235*33de042dSApple OSS Distributions 	 */
3236*33de042dSApple OSS Distributions 	wq->wq_reqcount--;
3237*33de042dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_NEW;
3238*33de042dSApple OSS Distributions 
3239*33de042dSApple OSS Distributions 	/* We enqueued the highest priority item or we may need to reevaluate if
3240*33de042dSApple OSS Distributions 	 * the creator needs a thread group pre-adoption if the request got a new TG */
3241*33de042dSApple OSS Distributions 	bool reevaluate_creator_tg = false;
3242*33de042dSApple OSS Distributions 
3243*33de042dSApple OSS Distributions #if CONFIG_PREADOPT_TG
3244*33de042dSApple OSS Distributions 	reevaluate_creator_tg = (flags & WORKQ_THREADREQ_REEVALUATE_PREADOPT_TG);
3245*33de042dSApple OSS Distributions #endif
3246*33de042dSApple OSS Distributions 
3247*33de042dSApple OSS Distributions 	if (workq_threadreq_enqueue(wq, req) || reevaluate_creator_tg) {
3248*33de042dSApple OSS Distributions 		workq_schedule_creator(p, wq, flags);
3249*33de042dSApple OSS Distributions 	}
3250*33de042dSApple OSS Distributions 	workq_unlock(wq);
3251*33de042dSApple OSS Distributions }
3252*33de042dSApple OSS Distributions 
3253*33de042dSApple OSS Distributions void
workq_kern_bound_thread_reset_pri(workq_threadreq_t req,struct uthread * uth)3254*33de042dSApple OSS Distributions workq_kern_bound_thread_reset_pri(workq_threadreq_t req, struct uthread *uth)
3255*33de042dSApple OSS Distributions {
3256*33de042dSApple OSS Distributions 	assert(workq_thread_is_permanently_bound(uth));
3257*33de042dSApple OSS Distributions 
3258*33de042dSApple OSS Distributions 	if (req && (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS)) {
3259*33de042dSApple OSS Distributions 		/*
3260*33de042dSApple OSS Distributions 		 * For requests outside-of-QoS, we set the scheduling policy and
3261*33de042dSApple OSS Distributions 		 * absolute priority for the bound thread right at the initialization
3262*33de042dSApple OSS Distributions 		 * time. See workq_kern_threadreq_permanent_bind.
3263*33de042dSApple OSS Distributions 		 */
3264*33de042dSApple OSS Distributions 		return;
3265*33de042dSApple OSS Distributions 	}
3266*33de042dSApple OSS Distributions 
3267*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(current_proc());
3268*33de042dSApple OSS Distributions 	if (req) {
3269*33de042dSApple OSS Distributions 		assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
3270*33de042dSApple OSS Distributions 		workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
3271*33de042dSApple OSS Distributions 	} else {
3272*33de042dSApple OSS Distributions 		thread_qos_t qos = workq_pri_override(uth->uu_workq_pri);
3273*33de042dSApple OSS Distributions 		if (qos > WORKQ_THREAD_QOS_CLEANUP) {
3274*33de042dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, NULL, /*unpark*/ true);
3275*33de042dSApple OSS Distributions 		} else {
3276*33de042dSApple OSS Distributions 			uth->uu_save.uus_workq_park_data.qos = qos;
3277*33de042dSApple OSS Distributions 		}
3278*33de042dSApple OSS Distributions 	}
3279*33de042dSApple OSS Distributions }
3280*33de042dSApple OSS Distributions 
/*
 * Takes the workqueue lock (spin variant) of process p's workqueue.
 * Paired with workq_kern_threadreq_unlock().
 */
void
workq_kern_threadreq_lock(struct proc *p)
{
	struct workqueue *wq = proc_get_wqptr_fast(p);

	workq_lock_spin(wq);
}
3286*33de042dSApple OSS Distributions 
/*
 * Releases the workqueue lock of process p's workqueue.
 * Paired with workq_kern_threadreq_lock().
 */
void
workq_kern_threadreq_unlock(struct proc *p)
{
	struct workqueue *wq = proc_get_wqptr_fast(p);

	workq_unlock(wq);
}
3292*33de042dSApple OSS Distributions 
3293*33de042dSApple OSS Distributions void
workq_kern_threadreq_update_inheritor(struct proc * p,workq_threadreq_t req,thread_t owner,struct turnstile * wl_ts,turnstile_update_flags_t flags)3294*33de042dSApple OSS Distributions workq_kern_threadreq_update_inheritor(struct proc *p, workq_threadreq_t req,
3295*33de042dSApple OSS Distributions     thread_t owner, struct turnstile *wl_ts,
3296*33de042dSApple OSS Distributions     turnstile_update_flags_t flags)
3297*33de042dSApple OSS Distributions {
3298*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3299*33de042dSApple OSS Distributions 	turnstile_inheritor_t inheritor;
3300*33de042dSApple OSS Distributions 
3301*33de042dSApple OSS Distributions 	assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
3302*33de042dSApple OSS Distributions 	assert(req->tr_flags & WORKQ_TR_FLAG_WORKLOOP);
3303*33de042dSApple OSS Distributions 	workq_lock_held(wq);
3304*33de042dSApple OSS Distributions 
3305*33de042dSApple OSS Distributions 	if (req->tr_state == WORKQ_TR_STATE_BINDING) {
3306*33de042dSApple OSS Distributions 		kqueue_threadreq_bind(p, req, req->tr_thread,
3307*33de042dSApple OSS Distributions 		    KQUEUE_THREADREQ_BIND_NO_INHERITOR_UPDATE);
3308*33de042dSApple OSS Distributions 		return;
3309*33de042dSApple OSS Distributions 	}
3310*33de042dSApple OSS Distributions 
3311*33de042dSApple OSS Distributions 	if (_wq_exiting(wq)) {
3312*33de042dSApple OSS Distributions 		inheritor = TURNSTILE_INHERITOR_NULL;
3313*33de042dSApple OSS Distributions 	} else {
3314*33de042dSApple OSS Distributions 		if (req->tr_state != WORKQ_TR_STATE_QUEUED) {
3315*33de042dSApple OSS Distributions 			panic("Invalid thread request (%p) state %d", req, req->tr_state);
3316*33de042dSApple OSS Distributions 		}
3317*33de042dSApple OSS Distributions 
3318*33de042dSApple OSS Distributions 		if (owner) {
3319*33de042dSApple OSS Distributions 			inheritor = owner;
3320*33de042dSApple OSS Distributions 			flags |= TURNSTILE_INHERITOR_THREAD;
3321*33de042dSApple OSS Distributions 		} else {
3322*33de042dSApple OSS Distributions 			inheritor = wq->wq_turnstile;
3323*33de042dSApple OSS Distributions 			flags |= TURNSTILE_INHERITOR_TURNSTILE;
3324*33de042dSApple OSS Distributions 		}
3325*33de042dSApple OSS Distributions 	}
3326*33de042dSApple OSS Distributions 
3327*33de042dSApple OSS Distributions 	workq_perform_turnstile_operation_locked(wq, ^{
3328*33de042dSApple OSS Distributions 		turnstile_update_inheritor(wl_ts, inheritor, flags);
3329*33de042dSApple OSS Distributions 	});
3330*33de042dSApple OSS Distributions }
3331*33de042dSApple OSS Distributions 
3332*33de042dSApple OSS Distributions /*
3333*33de042dSApple OSS Distributions  * An entry point for kevent to request a newly created workqueue thread
3334*33de042dSApple OSS Distributions  * and bind it permanently to the given workqueue thread request.
3335*33de042dSApple OSS Distributions  *
3336*33de042dSApple OSS Distributions  * It currently only supports fixed scheduler priority thread requests.
3337*33de042dSApple OSS Distributions  *
3338*33de042dSApple OSS Distributions  * The newly created thread counts towards wq_nthreads. This function returns
3339*33de042dSApple OSS Distributions  * an error if we are above that limit. There is no concept of delayed thread
3340*33de042dSApple OSS Distributions  * creation for such specially configured kqworkloops.
3341*33de042dSApple OSS Distributions  *
3342*33de042dSApple OSS Distributions  * If successful, the newly created thread will be parked in
3343*33de042dSApple OSS Distributions  * workq_bound_thread_initialize_and_unpark_continue waiting for
3344*33de042dSApple OSS Distributions  * new incoming events.
3345*33de042dSApple OSS Distributions  */
3346*33de042dSApple OSS Distributions kern_return_t
workq_kern_threadreq_permanent_bind(struct proc * p,struct workq_threadreq_s * kqr)3347*33de042dSApple OSS Distributions workq_kern_threadreq_permanent_bind(struct proc *p, struct workq_threadreq_s *kqr)
3348*33de042dSApple OSS Distributions {
3349*33de042dSApple OSS Distributions 	kern_return_t ret = 0;
3350*33de042dSApple OSS Distributions 	thread_t new_thread = NULL;
3351*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3352*33de042dSApple OSS Distributions 
3353*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
3354*33de042dSApple OSS Distributions 
3355*33de042dSApple OSS Distributions 	if (wq->wq_nthreads >= wq_max_threads) {
3356*33de042dSApple OSS Distributions 		ret = EDOM;
3357*33de042dSApple OSS Distributions 	} else {
3358*33de042dSApple OSS Distributions 		if (kqr->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3359*33de042dSApple OSS Distributions 			workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(kqr);
3360*33de042dSApple OSS Distributions 			/*
3361*33de042dSApple OSS Distributions 			 * For requests outside-of-QoS, we fully initialize the thread
3362*33de042dSApple OSS Distributions 			 * request here followed by preadopting the scheduling properties
3363*33de042dSApple OSS Distributions 			 * on the newly created bound thread.
3364*33de042dSApple OSS Distributions 			 */
3365*33de042dSApple OSS Distributions 			thread_qos_t qos = thread_workq_qos_for_pri(trp.trp_pri);
3366*33de042dSApple OSS Distributions 			if (qos == THREAD_QOS_UNSPECIFIED) {
3367*33de042dSApple OSS Distributions 				qos = WORKQ_THREAD_QOS_ABOVEUI;
3368*33de042dSApple OSS Distributions 			}
3369*33de042dSApple OSS Distributions 			kqr->tr_qos = qos;
3370*33de042dSApple OSS Distributions 		}
3371*33de042dSApple OSS Distributions 		kqr->tr_count = 1;
3372*33de042dSApple OSS Distributions 
3373*33de042dSApple OSS Distributions 		/* workq_lock dropped and retaken around thread creation below. */
3374*33de042dSApple OSS Distributions 		ret = workq_add_new_idle_thread(p, wq,
3375*33de042dSApple OSS Distributions 		    workq_bound_thread_initialize_and_unpark_continue,
3376*33de042dSApple OSS Distributions 		    true, &new_thread);
3377*33de042dSApple OSS Distributions 		if (ret == KERN_SUCCESS) {
3378*33de042dSApple OSS Distributions 			struct uthread *uth = get_bsdthread_info(new_thread);
3379*33de042dSApple OSS Distributions 			if (kqr->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3380*33de042dSApple OSS Distributions 				workq_thread_reset_pri(wq, uth, kqr, /*unpark*/ true);
3381*33de042dSApple OSS Distributions 			}
3382*33de042dSApple OSS Distributions 			/*
3383*33de042dSApple OSS Distributions 			 * The newly created thread goes through a full bind to the kqwl
3384*33de042dSApple OSS Distributions 			 * right upon creation.
3385*33de042dSApple OSS Distributions 			 * It then falls back to soft bind/unbind upon wakeup/park.
3386*33de042dSApple OSS Distributions 			 */
3387*33de042dSApple OSS Distributions 			kqueue_threadreq_bind_prepost(p, kqr, uth);
3388*33de042dSApple OSS Distributions 			uth->uu_workq_flags |= UT_WORKQ_PERMANENT_BIND;
3389*33de042dSApple OSS Distributions 		}
3390*33de042dSApple OSS Distributions 	}
3391*33de042dSApple OSS Distributions 
3392*33de042dSApple OSS Distributions 	workq_unlock(wq);
3393*33de042dSApple OSS Distributions 
3394*33de042dSApple OSS Distributions 	if (ret == KERN_SUCCESS) {
3395*33de042dSApple OSS Distributions 		kqueue_threadreq_bind_commit(p, new_thread);
3396*33de042dSApple OSS Distributions 	}
3397*33de042dSApple OSS Distributions 	return ret;
3398*33de042dSApple OSS Distributions }
3399*33de042dSApple OSS Distributions 
3400*33de042dSApple OSS Distributions /*
3401*33de042dSApple OSS Distributions  * Called with kqlock held. It does not need to take the process wide
3402*33de042dSApple OSS Distributions  * global workq lock -> making it faster.
3403*33de042dSApple OSS Distributions  */
3404*33de042dSApple OSS Distributions void
workq_kern_bound_thread_wakeup(struct workq_threadreq_s * kqr)3405*33de042dSApple OSS Distributions workq_kern_bound_thread_wakeup(struct workq_threadreq_s *kqr)
3406*33de042dSApple OSS Distributions {
3407*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(kqr->tr_thread);
3408*33de042dSApple OSS Distributions 	workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(kqr);
3409*33de042dSApple OSS Distributions 
3410*33de042dSApple OSS Distributions 	/*
3411*33de042dSApple OSS Distributions 	 * See "Locking model for accessing uu_workq_flags" for more information
3412*33de042dSApple OSS Distributions 	 * on how access to uu_workq_flags for the bound thread is synchronized.
3413*33de042dSApple OSS Distributions 	 */
3414*33de042dSApple OSS Distributions 	assert((uth->uu_workq_flags & (UT_WORKQ_RUNNING | UT_WORKQ_DYING)) == 0);
3415*33de042dSApple OSS Distributions 
3416*33de042dSApple OSS Distributions 	if (trp.trp_flags & TRP_RELEASED) {
3417*33de042dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
3418*33de042dSApple OSS Distributions 	} else {
3419*33de042dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_RUNNING;
3420*33de042dSApple OSS Distributions 	}
3421*33de042dSApple OSS Distributions 
3422*33de042dSApple OSS Distributions 	workq_thread_wakeup(uth);
3423*33de042dSApple OSS Distributions }
3424*33de042dSApple OSS Distributions 
3425*33de042dSApple OSS Distributions /*
3426*33de042dSApple OSS Distributions  * Called with kqlock held. Dropped before parking.
3427*33de042dSApple OSS Distributions  * It does not need to take process wide global workqueue
3428*33de042dSApple OSS Distributions  * lock -> making it faster.
3429*33de042dSApple OSS Distributions  */
3430*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
3431*33de042dSApple OSS Distributions void
workq_kern_bound_thread_park(struct workq_threadreq_s * kqr)3432*33de042dSApple OSS Distributions workq_kern_bound_thread_park(struct workq_threadreq_s *kqr)
3433*33de042dSApple OSS Distributions {
3434*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(kqr->tr_thread);
3435*33de042dSApple OSS Distributions 	assert(uth == current_uthread());
3436*33de042dSApple OSS Distributions 
3437*33de042dSApple OSS Distributions 	/*
3438*33de042dSApple OSS Distributions 	 * See "Locking model for accessing uu_workq_flags" for more information
3439*33de042dSApple OSS Distributions 	 * on how access to uu_workq_flags for the bound thread is synchronized.
3440*33de042dSApple OSS Distributions 	 */
3441*33de042dSApple OSS Distributions 	uth->uu_workq_flags &= ~(UT_WORKQ_RUNNING);
3442*33de042dSApple OSS Distributions 
3443*33de042dSApple OSS Distributions 	thread_disarm_workqueue_quantum(get_machthread(uth));
3444*33de042dSApple OSS Distributions 
3445*33de042dSApple OSS Distributions 	/*
3446*33de042dSApple OSS Distributions 	 * TODO (pavhad) We could do the reusable userspace stack performance
3447*33de042dSApple OSS Distributions 	 * optimization here.
3448*33de042dSApple OSS Distributions 	 */
3449*33de042dSApple OSS Distributions 
3450*33de042dSApple OSS Distributions 	kqworkloop_bound_thread_park_prepost(kqr);
3451*33de042dSApple OSS Distributions 	/* KQ_SLEEP bit is set and kqlock is dropped. */
3452*33de042dSApple OSS Distributions 
3453*33de042dSApple OSS Distributions 	__assert_only kern_return_t kr;
3454*33de042dSApple OSS Distributions 	kr = thread_set_voucher_name(MACH_PORT_NULL);
3455*33de042dSApple OSS Distributions 	assert(kr == KERN_SUCCESS);
3456*33de042dSApple OSS Distributions 
3457*33de042dSApple OSS Distributions 	kqworkloop_bound_thread_park_commit(kqr,
3458*33de042dSApple OSS Distributions 	    workq_parked_wait_event(uth), workq_bound_thread_unpark_continue);
3459*33de042dSApple OSS Distributions 
3460*33de042dSApple OSS Distributions 	__builtin_unreachable();
3461*33de042dSApple OSS Distributions }
3462*33de042dSApple OSS Distributions 
3463*33de042dSApple OSS Distributions /*
3464*33de042dSApple OSS Distributions  * To terminate the permenantly bound workqueue thread. It unbinds itself
3465*33de042dSApple OSS Distributions  * with the kqwl during uthread_cleanup -> kqueue_threadreq_unbind.
3466*33de042dSApple OSS Distributions  * It is also when it will release its reference on the kqwl.
3467*33de042dSApple OSS Distributions  */
3468*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
3469*33de042dSApple OSS Distributions void
workq_kern_bound_thread_terminate(struct workq_threadreq_s * kqr)3470*33de042dSApple OSS Distributions workq_kern_bound_thread_terminate(struct workq_threadreq_s *kqr)
3471*33de042dSApple OSS Distributions {
3472*33de042dSApple OSS Distributions 	proc_t p = current_proc();
3473*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(kqr->tr_thread);
3474*33de042dSApple OSS Distributions 	uint16_t uu_workq_flags_orig;
3475*33de042dSApple OSS Distributions 
3476*33de042dSApple OSS Distributions 	assert(uth == current_uthread());
3477*33de042dSApple OSS Distributions 
3478*33de042dSApple OSS Distributions 	/*
3479*33de042dSApple OSS Distributions 	 * See "Locking model for accessing uu_workq_flags" for more information
3480*33de042dSApple OSS Distributions 	 * on how access to uu_workq_flags for the bound thread is synchronized.
3481*33de042dSApple OSS Distributions 	 */
3482*33de042dSApple OSS Distributions 	kqworkloop_bound_thread_terminate(kqr, &uu_workq_flags_orig);
3483*33de042dSApple OSS Distributions 
3484*33de042dSApple OSS Distributions 	if (uu_workq_flags_orig & UT_WORKQ_WORK_INTERVAL_JOINED) {
3485*33de042dSApple OSS Distributions 		__assert_only kern_return_t kr;
3486*33de042dSApple OSS Distributions 		kr = kern_work_interval_join(get_machthread(uth), MACH_PORT_NULL);
3487*33de042dSApple OSS Distributions 		/* The bound thread un-joins the work interval and drops its +1 ref. */
3488*33de042dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
3489*33de042dSApple OSS Distributions 	}
3490*33de042dSApple OSS Distributions 
3491*33de042dSApple OSS Distributions 	/*
3492*33de042dSApple OSS Distributions 	 * Drop the voucher now that we are on our way to termination.
3493*33de042dSApple OSS Distributions 	 */
3494*33de042dSApple OSS Distributions 	__assert_only kern_return_t kr;
3495*33de042dSApple OSS Distributions 	kr = thread_set_voucher_name(MACH_PORT_NULL);
3496*33de042dSApple OSS Distributions 	assert(kr == KERN_SUCCESS);
3497*33de042dSApple OSS Distributions 
3498*33de042dSApple OSS Distributions 	uint32_t upcall_flags = WQ_FLAG_THREAD_NEWSPI;
3499*33de042dSApple OSS Distributions 	upcall_flags |= uth->uu_save.uus_workq_park_data.qos |
3500*33de042dSApple OSS Distributions 	    WQ_FLAG_THREAD_PRIO_QOS;
3501*33de042dSApple OSS Distributions 
3502*33de042dSApple OSS Distributions 	thread_t th = get_machthread(uth);
3503*33de042dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
3504*33de042dSApple OSS Distributions 
3505*33de042dSApple OSS Distributions 	if ((uu_workq_flags_orig & UT_WORKQ_NEW) == 0) {
3506*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_REUSE;
3507*33de042dSApple OSS Distributions 	}
3508*33de042dSApple OSS Distributions 
3509*33de042dSApple OSS Distributions 	pthread_functions->workq_setup_thread(p, th, vmap, uth->uu_workq_stackaddr,
3510*33de042dSApple OSS Distributions 	    uth->uu_workq_thport, 0, WQ_SETUP_EXIT_THREAD, upcall_flags);
3511*33de042dSApple OSS Distributions 	__builtin_unreachable();
3512*33de042dSApple OSS Distributions }
3513*33de042dSApple OSS Distributions 
3514*33de042dSApple OSS Distributions void
workq_kern_threadreq_redrive(struct proc * p,workq_kern_threadreq_flags_t flags)3515*33de042dSApple OSS Distributions workq_kern_threadreq_redrive(struct proc *p, workq_kern_threadreq_flags_t flags)
3516*33de042dSApple OSS Distributions {
3517*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3518*33de042dSApple OSS Distributions 
3519*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
3520*33de042dSApple OSS Distributions 	workq_schedule_creator(p, wq, flags);
3521*33de042dSApple OSS Distributions 	workq_unlock(wq);
3522*33de042dSApple OSS Distributions }
3523*33de042dSApple OSS Distributions 
3524*33de042dSApple OSS Distributions /*
3525*33de042dSApple OSS Distributions  * Always called at AST by the thread on itself
3526*33de042dSApple OSS Distributions  *
3527*33de042dSApple OSS Distributions  * Upon quantum expiry, the workqueue subsystem evaluates its state and decides
3528*33de042dSApple OSS Distributions  * on what the thread should do next. The TSD value is always set by the thread
3529*33de042dSApple OSS Distributions  * on itself in the kernel and cleared either by userspace when it acks the TSD
3530*33de042dSApple OSS Distributions  * value and takes action, or by the thread in the kernel when the quantum
3531*33de042dSApple OSS Distributions  * expires again.
3532*33de042dSApple OSS Distributions  */
3533*33de042dSApple OSS Distributions void
workq_kern_quantum_expiry_reevaluate(proc_t proc,thread_t thread)3534*33de042dSApple OSS Distributions workq_kern_quantum_expiry_reevaluate(proc_t proc, thread_t thread)
3535*33de042dSApple OSS Distributions {
3536*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
3537*33de042dSApple OSS Distributions 
3538*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_DYING) {
3539*33de042dSApple OSS Distributions 		return;
3540*33de042dSApple OSS Distributions 	}
3541*33de042dSApple OSS Distributions 
3542*33de042dSApple OSS Distributions 	if (!thread_supports_cooperative_workqueue(thread)) {
3543*33de042dSApple OSS Distributions 		panic("Quantum expired for thread that doesn't support cooperative workqueue");
3544*33de042dSApple OSS Distributions 	}
3545*33de042dSApple OSS Distributions 
3546*33de042dSApple OSS Distributions 	thread_qos_t qos = uth->uu_workq_pri.qos_bucket;
3547*33de042dSApple OSS Distributions 	if (qos == THREAD_QOS_UNSPECIFIED) {
3548*33de042dSApple OSS Distributions 		panic("Thread should not have workq bucket of QoS UN");
3549*33de042dSApple OSS Distributions 	}
3550*33de042dSApple OSS Distributions 
3551*33de042dSApple OSS Distributions 	assert(thread_has_expired_workqueue_quantum(thread, false));
3552*33de042dSApple OSS Distributions 
3553*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(proc);
3554*33de042dSApple OSS Distributions 	assert(wq != NULL);
3555*33de042dSApple OSS Distributions 
3556*33de042dSApple OSS Distributions 	/*
3557*33de042dSApple OSS Distributions 	 * For starters, we're just going to evaluate and see if we need to narrow
3558*33de042dSApple OSS Distributions 	 * the pool and tell this thread to park if needed. In the future, we'll
3559*33de042dSApple OSS Distributions 	 * evaluate and convey other workqueue state information like needing to
3560*33de042dSApple OSS Distributions 	 * pump kevents, etc.
3561*33de042dSApple OSS Distributions 	 */
3562*33de042dSApple OSS Distributions 	uint64_t flags = 0;
3563*33de042dSApple OSS Distributions 
3564*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
3565*33de042dSApple OSS Distributions 
3566*33de042dSApple OSS Distributions 	if (workq_thread_is_cooperative(uth)) {
3567*33de042dSApple OSS Distributions 		if (!workq_cooperative_allowance(wq, qos, uth, false)) {
3568*33de042dSApple OSS Distributions 			flags |= PTHREAD_WQ_QUANTUM_EXPIRY_NARROW;
3569*33de042dSApple OSS Distributions 		} else {
3570*33de042dSApple OSS Distributions 			/* In the future, when we have kevent hookups for the cooperative
3571*33de042dSApple OSS Distributions 			 * pool, we need fancier logic for what userspace should do. But
3572*33de042dSApple OSS Distributions 			 * right now, only userspace thread requests exist - so we'll just
3573*33de042dSApple OSS Distributions 			 * tell userspace to shuffle work items */
3574*33de042dSApple OSS Distributions 			flags |= PTHREAD_WQ_QUANTUM_EXPIRY_SHUFFLE;
3575*33de042dSApple OSS Distributions 		}
3576*33de042dSApple OSS Distributions 	} else if (workq_thread_is_nonovercommit(uth)) {
3577*33de042dSApple OSS Distributions 		if (!workq_constrained_allowance(wq, qos, uth, false, false)) {
3578*33de042dSApple OSS Distributions 			flags |= PTHREAD_WQ_QUANTUM_EXPIRY_NARROW;
3579*33de042dSApple OSS Distributions 		}
3580*33de042dSApple OSS Distributions 	}
3581*33de042dSApple OSS Distributions 	workq_unlock(wq);
3582*33de042dSApple OSS Distributions 
3583*33de042dSApple OSS Distributions 	WQ_TRACE(TRACE_wq_quantum_expiry_reevaluate, flags, 0, 0, 0);
3584*33de042dSApple OSS Distributions 
3585*33de042dSApple OSS Distributions 	kevent_set_workq_quantum_expiry_user_tsd(proc, thread, flags);
3586*33de042dSApple OSS Distributions 
3587*33de042dSApple OSS Distributions 	/* We have conveyed to userspace about what it needs to do upon quantum
3588*33de042dSApple OSS Distributions 	 * expiry, now rearm the workqueue quantum again */
3589*33de042dSApple OSS Distributions 	thread_arm_workqueue_quantum(get_machthread(uth));
3590*33de042dSApple OSS Distributions }
3591*33de042dSApple OSS Distributions 
3592*33de042dSApple OSS Distributions void
workq_schedule_creator_turnstile_redrive(struct workqueue * wq,bool locked)3593*33de042dSApple OSS Distributions workq_schedule_creator_turnstile_redrive(struct workqueue *wq, bool locked)
3594*33de042dSApple OSS Distributions {
3595*33de042dSApple OSS Distributions 	if (locked) {
3596*33de042dSApple OSS Distributions 		workq_schedule_creator(NULL, wq, WORKQ_THREADREQ_NONE);
3597*33de042dSApple OSS Distributions 	} else {
3598*33de042dSApple OSS Distributions 		workq_schedule_immediate_thread_creation(wq);
3599*33de042dSApple OSS Distributions 	}
3600*33de042dSApple OSS Distributions }
3601*33de042dSApple OSS Distributions 
3602*33de042dSApple OSS Distributions static int
workq_thread_return(struct proc * p,struct workq_kernreturn_args * uap,struct workqueue * wq)3603*33de042dSApple OSS Distributions workq_thread_return(struct proc *p, struct workq_kernreturn_args *uap,
3604*33de042dSApple OSS Distributions     struct workqueue *wq)
3605*33de042dSApple OSS Distributions {
3606*33de042dSApple OSS Distributions 	thread_t th = current_thread();
3607*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
3608*33de042dSApple OSS Distributions 	workq_threadreq_t kqr = uth->uu_kqr_bound;
3609*33de042dSApple OSS Distributions 	workq_threadreq_param_t trp = { };
3610*33de042dSApple OSS Distributions 	int nevents = uap->affinity, error;
3611*33de042dSApple OSS Distributions 	user_addr_t eventlist = uap->item;
3612*33de042dSApple OSS Distributions 
3613*33de042dSApple OSS Distributions 	if (((thread_get_tag(th) & THREAD_TAG_WORKQUEUE) == 0) ||
3614*33de042dSApple OSS Distributions 	    (uth->uu_workq_flags & UT_WORKQ_DYING)) {
3615*33de042dSApple OSS Distributions 		return EINVAL;
3616*33de042dSApple OSS Distributions 	}
3617*33de042dSApple OSS Distributions 
3618*33de042dSApple OSS Distributions 	if (eventlist && nevents && kqr == NULL) {
3619*33de042dSApple OSS Distributions 		return EINVAL;
3620*33de042dSApple OSS Distributions 	}
3621*33de042dSApple OSS Distributions 
3622*33de042dSApple OSS Distributions 	/*
3623*33de042dSApple OSS Distributions 	 * Reset signal mask on the workqueue thread to default state,
3624*33de042dSApple OSS Distributions 	 * but do not touch any signals that are marked for preservation.
3625*33de042dSApple OSS Distributions 	 */
3626*33de042dSApple OSS Distributions 	sigset_t resettable = uth->uu_sigmask & ~p->p_workq_allow_sigmask;
3627*33de042dSApple OSS Distributions 	if (resettable != (sigset_t)~workq_threadmask) {
3628*33de042dSApple OSS Distributions 		proc_lock(p);
3629*33de042dSApple OSS Distributions 		uth->uu_sigmask |= ~workq_threadmask & ~p->p_workq_allow_sigmask;
3630*33de042dSApple OSS Distributions 		proc_unlock(p);
3631*33de042dSApple OSS Distributions 	}
3632*33de042dSApple OSS Distributions 
3633*33de042dSApple OSS Distributions 	if (kqr && kqr->tr_flags & WORKQ_TR_FLAG_WL_PARAMS) {
3634*33de042dSApple OSS Distributions 		/*
3635*33de042dSApple OSS Distributions 		 * Ensure we store the threadreq param before unbinding
3636*33de042dSApple OSS Distributions 		 * the kqr from this thread.
3637*33de042dSApple OSS Distributions 		 */
3638*33de042dSApple OSS Distributions 		trp = kqueue_threadreq_workloop_param(kqr);
3639*33de042dSApple OSS Distributions 	}
3640*33de042dSApple OSS Distributions 
3641*33de042dSApple OSS Distributions 	if (kqr && kqr->tr_flags & WORKQ_TR_FLAG_PERMANENT_BIND) {
3642*33de042dSApple OSS Distributions 		goto handle_stack_events;
3643*33de042dSApple OSS Distributions 	}
3644*33de042dSApple OSS Distributions 
3645*33de042dSApple OSS Distributions 	/*
3646*33de042dSApple OSS Distributions 	 * Freeze the base pri while we decide the fate of this thread.
3647*33de042dSApple OSS Distributions 	 *
3648*33de042dSApple OSS Distributions 	 * Either:
3649*33de042dSApple OSS Distributions 	 * - we return to user and kevent_cleanup will have unfrozen the base pri,
3650*33de042dSApple OSS Distributions 	 * - or we proceed to workq_select_threadreq_or_park_and_unlock() who will.
3651*33de042dSApple OSS Distributions 	 */
3652*33de042dSApple OSS Distributions 	thread_freeze_base_pri(th);
3653*33de042dSApple OSS Distributions 
3654*33de042dSApple OSS Distributions handle_stack_events:
3655*33de042dSApple OSS Distributions 
3656*33de042dSApple OSS Distributions 	if (kqr) {
3657*33de042dSApple OSS Distributions 		uint32_t upcall_flags = WQ_FLAG_THREAD_NEWSPI | WQ_FLAG_THREAD_REUSE;
3658*33de042dSApple OSS Distributions 		if (kqr->tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
3659*33de042dSApple OSS Distributions 			upcall_flags |= WQ_FLAG_THREAD_WORKLOOP | WQ_FLAG_THREAD_KEVENT;
3660*33de042dSApple OSS Distributions 		} else {
3661*33de042dSApple OSS Distributions 			upcall_flags |= WQ_FLAG_THREAD_KEVENT;
3662*33de042dSApple OSS Distributions 		}
3663*33de042dSApple OSS Distributions 		if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER) {
3664*33de042dSApple OSS Distributions 			upcall_flags |= WQ_FLAG_THREAD_EVENT_MANAGER;
3665*33de042dSApple OSS Distributions 		} else {
3666*33de042dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth)) {
3667*33de042dSApple OSS Distributions 				upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
3668*33de042dSApple OSS Distributions 			}
3669*33de042dSApple OSS Distributions 			if (uth->uu_workq_flags & UT_WORKQ_OUTSIDE_QOS) {
3670*33de042dSApple OSS Distributions 				upcall_flags |= WQ_FLAG_THREAD_OUTSIDEQOS;
3671*33de042dSApple OSS Distributions 			} else {
3672*33de042dSApple OSS Distributions 				upcall_flags |= uth->uu_workq_pri.qos_req |
3673*33de042dSApple OSS Distributions 				    WQ_FLAG_THREAD_PRIO_QOS;
3674*33de042dSApple OSS Distributions 			}
3675*33de042dSApple OSS Distributions 		}
3676*33de042dSApple OSS Distributions 		error = pthread_functions->workq_handle_stack_events(p, th,
3677*33de042dSApple OSS Distributions 		    get_task_map(proc_task(p)), uth->uu_workq_stackaddr,
3678*33de042dSApple OSS Distributions 		    uth->uu_workq_thport, eventlist, nevents, upcall_flags);
3679*33de042dSApple OSS Distributions 		if (error) {
3680*33de042dSApple OSS Distributions 			assert(uth->uu_kqr_bound == kqr);
3681*33de042dSApple OSS Distributions 			return error;
3682*33de042dSApple OSS Distributions 		}
3683*33de042dSApple OSS Distributions 
3684*33de042dSApple OSS Distributions 		// pthread is supposed to pass KEVENT_FLAG_PARKING here
3685*33de042dSApple OSS Distributions 		// which should cause the above call to either:
3686*33de042dSApple OSS Distributions 		// - not return
3687*33de042dSApple OSS Distributions 		// - return an error
3688*33de042dSApple OSS Distributions 		// - return 0 and have unbound properly
3689*33de042dSApple OSS Distributions 		assert(uth->uu_kqr_bound == NULL);
3690*33de042dSApple OSS Distributions 	}
3691*33de042dSApple OSS Distributions 
3692*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_runthread | DBG_FUNC_END, wq, uap->options, 0, 0);
3693*33de042dSApple OSS Distributions 
3694*33de042dSApple OSS Distributions 	thread_sched_call(th, NULL);
3695*33de042dSApple OSS Distributions 	thread_will_park_or_terminate(th);
3696*33de042dSApple OSS Distributions #if CONFIG_WORKLOOP_DEBUG
3697*33de042dSApple OSS Distributions 	UU_KEVENT_HISTORY_WRITE_ENTRY(uth, { .uu_error = -1, });
3698*33de042dSApple OSS Distributions #endif
3699*33de042dSApple OSS Distributions 
3700*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
3701*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_END, wq, 0, 0, 0);
3702*33de042dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.workloop_params = trp.trp_value;
3703*33de042dSApple OSS Distributions 	workq_select_threadreq_or_park_and_unlock(p, wq, uth,
3704*33de042dSApple OSS Distributions 	    WQ_SETUP_CLEAR_VOUCHER);
3705*33de042dSApple OSS Distributions 	__builtin_unreachable();
3706*33de042dSApple OSS Distributions }
3707*33de042dSApple OSS Distributions 
3708*33de042dSApple OSS Distributions /**
3709*33de042dSApple OSS Distributions  * Multiplexed call to interact with the workqueue mechanism
3710*33de042dSApple OSS Distributions  */
3711*33de042dSApple OSS Distributions int
workq_kernreturn(struct proc * p,struct workq_kernreturn_args * uap,int32_t * retval)3712*33de042dSApple OSS Distributions workq_kernreturn(struct proc *p, struct workq_kernreturn_args *uap, int32_t *retval)
3713*33de042dSApple OSS Distributions {
3714*33de042dSApple OSS Distributions 	int options = uap->options;
3715*33de042dSApple OSS Distributions 	int arg2 = uap->affinity;
3716*33de042dSApple OSS Distributions 	int arg3 = uap->prio;
3717*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
3718*33de042dSApple OSS Distributions 	int error = 0;
3719*33de042dSApple OSS Distributions 
3720*33de042dSApple OSS Distributions 	if ((p->p_lflag & P_LREGISTER) == 0) {
3721*33de042dSApple OSS Distributions 		return EINVAL;
3722*33de042dSApple OSS Distributions 	}
3723*33de042dSApple OSS Distributions 
3724*33de042dSApple OSS Distributions 	switch (options) {
3725*33de042dSApple OSS Distributions 	case WQOPS_QUEUE_NEWSPISUPP: {
3726*33de042dSApple OSS Distributions 		/*
3727*33de042dSApple OSS Distributions 		 * arg2 = offset of serialno into dispatch queue
3728*33de042dSApple OSS Distributions 		 * arg3 = kevent support
3729*33de042dSApple OSS Distributions 		 */
3730*33de042dSApple OSS Distributions 		int offset = arg2;
3731*33de042dSApple OSS Distributions 		if (arg3 & 0x01) {
3732*33de042dSApple OSS Distributions 			// If we get here, then userspace has indicated support for kevent delivery.
3733*33de042dSApple OSS Distributions 		}
3734*33de042dSApple OSS Distributions 
3735*33de042dSApple OSS Distributions 		p->p_dispatchqueue_serialno_offset = (uint64_t)offset;
3736*33de042dSApple OSS Distributions 		break;
3737*33de042dSApple OSS Distributions 	}
3738*33de042dSApple OSS Distributions 	case WQOPS_QUEUE_REQTHREADS: {
3739*33de042dSApple OSS Distributions 		/*
3740*33de042dSApple OSS Distributions 		 * arg2 = number of threads to start
3741*33de042dSApple OSS Distributions 		 * arg3 = priority
3742*33de042dSApple OSS Distributions 		 */
3743*33de042dSApple OSS Distributions 		error = workq_reqthreads(p, arg2, arg3, false);
3744*33de042dSApple OSS Distributions 		break;
3745*33de042dSApple OSS Distributions 	}
3746*33de042dSApple OSS Distributions 	/* For requesting threads for the cooperative pool */
3747*33de042dSApple OSS Distributions 	case WQOPS_QUEUE_REQTHREADS2: {
3748*33de042dSApple OSS Distributions 		/*
3749*33de042dSApple OSS Distributions 		 * arg2 = number of threads to start
3750*33de042dSApple OSS Distributions 		 * arg3 = priority
3751*33de042dSApple OSS Distributions 		 */
3752*33de042dSApple OSS Distributions 		error = workq_reqthreads(p, arg2, arg3, true);
3753*33de042dSApple OSS Distributions 		break;
3754*33de042dSApple OSS Distributions 	}
3755*33de042dSApple OSS Distributions 	case WQOPS_SET_EVENT_MANAGER_PRIORITY: {
3756*33de042dSApple OSS Distributions 		/*
3757*33de042dSApple OSS Distributions 		 * arg2 = priority for the manager thread
3758*33de042dSApple OSS Distributions 		 *
3759*33de042dSApple OSS Distributions 		 * if _PTHREAD_PRIORITY_SCHED_PRI_FLAG is set,
3760*33de042dSApple OSS Distributions 		 * the low bits of the value contains a scheduling priority
3761*33de042dSApple OSS Distributions 		 * instead of a QOS value
3762*33de042dSApple OSS Distributions 		 */
3763*33de042dSApple OSS Distributions 		pthread_priority_t pri = arg2;
3764*33de042dSApple OSS Distributions 
3765*33de042dSApple OSS Distributions 		if (wq == NULL) {
3766*33de042dSApple OSS Distributions 			error = EINVAL;
3767*33de042dSApple OSS Distributions 			break;
3768*33de042dSApple OSS Distributions 		}
3769*33de042dSApple OSS Distributions 
3770*33de042dSApple OSS Distributions 		/*
3771*33de042dSApple OSS Distributions 		 * Normalize the incoming priority so that it is ordered numerically.
3772*33de042dSApple OSS Distributions 		 */
3773*33de042dSApple OSS Distributions 		if (_pthread_priority_has_sched_pri(pri)) {
3774*33de042dSApple OSS Distributions 			pri &= (_PTHREAD_PRIORITY_SCHED_PRI_MASK |
3775*33de042dSApple OSS Distributions 			    _PTHREAD_PRIORITY_SCHED_PRI_FLAG);
3776*33de042dSApple OSS Distributions 		} else {
3777*33de042dSApple OSS Distributions 			thread_qos_t qos = _pthread_priority_thread_qos(pri);
3778*33de042dSApple OSS Distributions 			int relpri = _pthread_priority_relpri(pri);
3779*33de042dSApple OSS Distributions 			if (relpri > 0 || relpri < THREAD_QOS_MIN_TIER_IMPORTANCE ||
3780*33de042dSApple OSS Distributions 			    qos == THREAD_QOS_UNSPECIFIED) {
3781*33de042dSApple OSS Distributions 				error = EINVAL;
3782*33de042dSApple OSS Distributions 				break;
3783*33de042dSApple OSS Distributions 			}
3784*33de042dSApple OSS Distributions 			pri &= ~_PTHREAD_PRIORITY_FLAGS_MASK;
3785*33de042dSApple OSS Distributions 		}
3786*33de042dSApple OSS Distributions 
3787*33de042dSApple OSS Distributions 		/*
3788*33de042dSApple OSS Distributions 		 * If userspace passes a scheduling priority, that wins over any QoS.
3789*33de042dSApple OSS Distributions 		 * Userspace should takes care not to lower the priority this way.
3790*33de042dSApple OSS Distributions 		 */
3791*33de042dSApple OSS Distributions 		workq_lock_spin(wq);
3792*33de042dSApple OSS Distributions 		if (wq->wq_event_manager_priority < (uint32_t)pri) {
3793*33de042dSApple OSS Distributions 			wq->wq_event_manager_priority = (uint32_t)pri;
3794*33de042dSApple OSS Distributions 		}
3795*33de042dSApple OSS Distributions 		workq_unlock(wq);
3796*33de042dSApple OSS Distributions 		break;
3797*33de042dSApple OSS Distributions 	}
3798*33de042dSApple OSS Distributions 	case WQOPS_THREAD_KEVENT_RETURN:
3799*33de042dSApple OSS Distributions 	case WQOPS_THREAD_WORKLOOP_RETURN:
3800*33de042dSApple OSS Distributions 	case WQOPS_THREAD_RETURN: {
3801*33de042dSApple OSS Distributions 		error = workq_thread_return(p, uap, wq);
3802*33de042dSApple OSS Distributions 		break;
3803*33de042dSApple OSS Distributions 	}
3804*33de042dSApple OSS Distributions 
3805*33de042dSApple OSS Distributions 	case WQOPS_SHOULD_NARROW: {
3806*33de042dSApple OSS Distributions 		/*
3807*33de042dSApple OSS Distributions 		 * arg2 = priority to test
3808*33de042dSApple OSS Distributions 		 * arg3 = unused
3809*33de042dSApple OSS Distributions 		 */
3810*33de042dSApple OSS Distributions 		thread_t th = current_thread();
3811*33de042dSApple OSS Distributions 		struct uthread *uth = get_bsdthread_info(th);
3812*33de042dSApple OSS Distributions 		if (((thread_get_tag(th) & THREAD_TAG_WORKQUEUE) == 0) ||
3813*33de042dSApple OSS Distributions 		    (uth->uu_workq_flags & (UT_WORKQ_DYING | UT_WORKQ_OVERCOMMIT))) {
3814*33de042dSApple OSS Distributions 			error = EINVAL;
3815*33de042dSApple OSS Distributions 			break;
3816*33de042dSApple OSS Distributions 		}
3817*33de042dSApple OSS Distributions 
3818*33de042dSApple OSS Distributions 		thread_qos_t qos = _pthread_priority_thread_qos(arg2);
3819*33de042dSApple OSS Distributions 		if (qos == THREAD_QOS_UNSPECIFIED) {
3820*33de042dSApple OSS Distributions 			error = EINVAL;
3821*33de042dSApple OSS Distributions 			break;
3822*33de042dSApple OSS Distributions 		}
3823*33de042dSApple OSS Distributions 		workq_lock_spin(wq);
3824*33de042dSApple OSS Distributions 		bool should_narrow = !workq_constrained_allowance(wq, qos, uth, false, false);
3825*33de042dSApple OSS Distributions 		workq_unlock(wq);
3826*33de042dSApple OSS Distributions 
3827*33de042dSApple OSS Distributions 		*retval = should_narrow;
3828*33de042dSApple OSS Distributions 		break;
3829*33de042dSApple OSS Distributions 	}
3830*33de042dSApple OSS Distributions 	case WQOPS_SETUP_DISPATCH: {
3831*33de042dSApple OSS Distributions 		/*
3832*33de042dSApple OSS Distributions 		 * item = pointer to workq_dispatch_config structure
3833*33de042dSApple OSS Distributions 		 * arg2 = sizeof(item)
3834*33de042dSApple OSS Distributions 		 */
3835*33de042dSApple OSS Distributions 		struct workq_dispatch_config cfg;
3836*33de042dSApple OSS Distributions 		bzero(&cfg, sizeof(cfg));
3837*33de042dSApple OSS Distributions 
3838*33de042dSApple OSS Distributions 		error = copyin(uap->item, &cfg, MIN(sizeof(cfg), (unsigned long) arg2));
3839*33de042dSApple OSS Distributions 		if (error) {
3840*33de042dSApple OSS Distributions 			break;
3841*33de042dSApple OSS Distributions 		}
3842*33de042dSApple OSS Distributions 
3843*33de042dSApple OSS Distributions 		if (cfg.wdc_flags & ~WORKQ_DISPATCH_SUPPORTED_FLAGS ||
3844*33de042dSApple OSS Distributions 		    cfg.wdc_version < WORKQ_DISPATCH_MIN_SUPPORTED_VERSION) {
3845*33de042dSApple OSS Distributions 			error = ENOTSUP;
3846*33de042dSApple OSS Distributions 			break;
3847*33de042dSApple OSS Distributions 		}
3848*33de042dSApple OSS Distributions 
3849*33de042dSApple OSS Distributions 		/* Load fields from version 1 */
3850*33de042dSApple OSS Distributions 		p->p_dispatchqueue_serialno_offset = cfg.wdc_queue_serialno_offs;
3851*33de042dSApple OSS Distributions 
3852*33de042dSApple OSS Distributions 		/* Load fields from version 2 */
3853*33de042dSApple OSS Distributions 		if (cfg.wdc_version >= 2) {
3854*33de042dSApple OSS Distributions 			p->p_dispatchqueue_label_offset = cfg.wdc_queue_label_offs;
3855*33de042dSApple OSS Distributions 		}
3856*33de042dSApple OSS Distributions 
3857*33de042dSApple OSS Distributions 		break;
3858*33de042dSApple OSS Distributions 	}
3859*33de042dSApple OSS Distributions 	default:
3860*33de042dSApple OSS Distributions 		error = EINVAL;
3861*33de042dSApple OSS Distributions 		break;
3862*33de042dSApple OSS Distributions 	}
3863*33de042dSApple OSS Distributions 
3864*33de042dSApple OSS Distributions 	return error;
3865*33de042dSApple OSS Distributions }
3866*33de042dSApple OSS Distributions 
3867*33de042dSApple OSS Distributions /*
3868*33de042dSApple OSS Distributions  * We have no work to do, park ourselves on the idle list.
3869*33de042dSApple OSS Distributions  *
3870*33de042dSApple OSS Distributions  * Consumes the workqueue lock and does not return.
3871*33de042dSApple OSS Distributions  */
3872*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
3873*33de042dSApple OSS Distributions static void
workq_park_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)3874*33de042dSApple OSS Distributions workq_park_and_unlock(proc_t p, struct workqueue *wq, struct uthread *uth,
3875*33de042dSApple OSS Distributions     uint32_t setup_flags)
3876*33de042dSApple OSS Distributions {
3877*33de042dSApple OSS Distributions 	assert(uth == current_uthread());
3878*33de042dSApple OSS Distributions 	assert(uth->uu_kqr_bound == NULL);
3879*33de042dSApple OSS Distributions 	workq_push_idle_thread(p, wq, uth, setup_flags); // may not return
3880*33de042dSApple OSS Distributions 
3881*33de042dSApple OSS Distributions 	workq_thread_reset_cpupercent(NULL, uth);
3882*33de042dSApple OSS Distributions 
3883*33de042dSApple OSS Distributions #if CONFIG_PREADOPT_TG
3884*33de042dSApple OSS Distributions 	/* Clear the preadoption thread group on the thread.
3885*33de042dSApple OSS Distributions 	 *
3886*33de042dSApple OSS Distributions 	 * Case 1:
3887*33de042dSApple OSS Distributions 	 *		Creator thread which never picked up a thread request. We set a
3888*33de042dSApple OSS Distributions 	 *		preadoption thread group on creator threads but if it never picked
3889*33de042dSApple OSS Distributions 	 *		up a thread request and didn't go to userspace, then the thread will
3890*33de042dSApple OSS Distributions 	 *		park with a preadoption thread group but no explicitly adopted
3891*33de042dSApple OSS Distributions 	 *		voucher or work interval.
3892*33de042dSApple OSS Distributions 	 *
3893*33de042dSApple OSS Distributions 	 *		We drop the preadoption thread group here before proceeding to park.
3894*33de042dSApple OSS Distributions 	 *		Note - we may get preempted when we drop the workq lock below.
3895*33de042dSApple OSS Distributions 	 *
3896*33de042dSApple OSS Distributions 	 * Case 2:
3897*33de042dSApple OSS Distributions 	 *		Thread picked up a thread request and bound to it and returned back
3898*33de042dSApple OSS Distributions 	 *		from userspace and is parking. At this point, preadoption thread
3899*33de042dSApple OSS Distributions 	 *		group should be NULL since the thread has unbound from the thread
3900*33de042dSApple OSS Distributions 	 *		request. So this operation should be a no-op.
3901*33de042dSApple OSS Distributions 	 */
3902*33de042dSApple OSS Distributions 	thread_set_preadopt_thread_group(get_machthread(uth), NULL);
3903*33de042dSApple OSS Distributions #endif
3904*33de042dSApple OSS Distributions 
3905*33de042dSApple OSS Distributions 	if ((uth->uu_workq_flags & UT_WORKQ_IDLE_CLEANUP) &&
3906*33de042dSApple OSS Distributions 	    !(uth->uu_workq_flags & UT_WORKQ_DYING)) {
3907*33de042dSApple OSS Distributions 		workq_unlock(wq);
3908*33de042dSApple OSS Distributions 
3909*33de042dSApple OSS Distributions 		/*
3910*33de042dSApple OSS Distributions 		 * workq_push_idle_thread() will unset `has_stack`
3911*33de042dSApple OSS Distributions 		 * if it wants us to free the stack before parking.
3912*33de042dSApple OSS Distributions 		 */
3913*33de042dSApple OSS Distributions 		if (!uth->uu_save.uus_workq_park_data.has_stack) {
3914*33de042dSApple OSS Distributions 			pthread_functions->workq_markfree_threadstack(p,
3915*33de042dSApple OSS Distributions 			    get_machthread(uth), get_task_map(proc_task(p)),
3916*33de042dSApple OSS Distributions 			    uth->uu_workq_stackaddr);
3917*33de042dSApple OSS Distributions 		}
3918*33de042dSApple OSS Distributions 
3919*33de042dSApple OSS Distributions 		/*
3920*33de042dSApple OSS Distributions 		 * When we remove the voucher from the thread, we may lose our importance
3921*33de042dSApple OSS Distributions 		 * causing us to get preempted, so we do this after putting the thread on
3922*33de042dSApple OSS Distributions 		 * the idle list.  Then, when we get our importance back we'll be able to
3923*33de042dSApple OSS Distributions 		 * use this thread from e.g. the kevent call out to deliver a boosting
3924*33de042dSApple OSS Distributions 		 * message.
3925*33de042dSApple OSS Distributions 		 *
3926*33de042dSApple OSS Distributions 		 * Note that setting the voucher to NULL will not clear the preadoption
3927*33de042dSApple OSS Distributions 		 * thread since this thread could have become the creator again and
3928*33de042dSApple OSS Distributions 		 * perhaps acquired a preadoption thread group.
3929*33de042dSApple OSS Distributions 		 */
3930*33de042dSApple OSS Distributions 		__assert_only kern_return_t kr;
3931*33de042dSApple OSS Distributions 		kr = thread_set_voucher_name(MACH_PORT_NULL);
3932*33de042dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
3933*33de042dSApple OSS Distributions 
3934*33de042dSApple OSS Distributions 		workq_lock_spin(wq);
3935*33de042dSApple OSS Distributions 		uth->uu_workq_flags &= ~UT_WORKQ_IDLE_CLEANUP;
3936*33de042dSApple OSS Distributions 		setup_flags &= ~WQ_SETUP_CLEAR_VOUCHER;
3937*33de042dSApple OSS Distributions 	}
3938*33de042dSApple OSS Distributions 
3939*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_END, wq, 0, 0, 0);
3940*33de042dSApple OSS Distributions 
3941*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_RUNNING) {
3942*33de042dSApple OSS Distributions 		/*
3943*33de042dSApple OSS Distributions 		 * While we'd dropped the lock to unset our voucher, someone came
3944*33de042dSApple OSS Distributions 		 * around and made us runnable.  But because we weren't waiting on the
3945*33de042dSApple OSS Distributions 		 * event their thread_wakeup() was ineffectual.  To correct for that,
3946*33de042dSApple OSS Distributions 		 * we just run the continuation ourselves.
3947*33de042dSApple OSS Distributions 		 */
3948*33de042dSApple OSS Distributions 		workq_unpark_select_threadreq_or_park_and_unlock(p, wq, uth, setup_flags);
3949*33de042dSApple OSS Distributions 		__builtin_unreachable();
3950*33de042dSApple OSS Distributions 	}
3951*33de042dSApple OSS Distributions 
3952*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_DYING) {
3953*33de042dSApple OSS Distributions 		workq_unpark_for_death_and_unlock(p, wq, uth,
3954*33de042dSApple OSS Distributions 		    WORKQ_UNPARK_FOR_DEATH_WAS_IDLE, setup_flags);
3955*33de042dSApple OSS Distributions 		__builtin_unreachable();
3956*33de042dSApple OSS Distributions 	}
3957*33de042dSApple OSS Distributions 
3958*33de042dSApple OSS Distributions 	/* Disarm the workqueue quantum since the thread is now idle */
3959*33de042dSApple OSS Distributions 	thread_disarm_workqueue_quantum(get_machthread(uth));
3960*33de042dSApple OSS Distributions 
3961*33de042dSApple OSS Distributions 	thread_set_pending_block_hint(get_machthread(uth), kThreadWaitParkedWorkQueue);
3962*33de042dSApple OSS Distributions 	assert_wait(workq_parked_wait_event(uth), THREAD_INTERRUPTIBLE);
3963*33de042dSApple OSS Distributions 	workq_unlock(wq);
3964*33de042dSApple OSS Distributions 	thread_block(workq_unpark_continue);
3965*33de042dSApple OSS Distributions 	__builtin_unreachable();
3966*33de042dSApple OSS Distributions }
3967*33de042dSApple OSS Distributions 
3968*33de042dSApple OSS Distributions static inline bool
workq_may_start_event_mgr_thread(struct workqueue * wq,struct uthread * uth)3969*33de042dSApple OSS Distributions workq_may_start_event_mgr_thread(struct workqueue *wq, struct uthread *uth)
3970*33de042dSApple OSS Distributions {
3971*33de042dSApple OSS Distributions 	/*
3972*33de042dSApple OSS Distributions 	 * There's an event manager request and either:
3973*33de042dSApple OSS Distributions 	 * - no event manager currently running
3974*33de042dSApple OSS Distributions 	 * - we are re-using the event manager
3975*33de042dSApple OSS Distributions 	 */
3976*33de042dSApple OSS Distributions 	return wq->wq_thscheduled_count[_wq_bucket(WORKQ_THREAD_QOS_MANAGER)] == 0 ||
3977*33de042dSApple OSS Distributions 	       (uth && uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER);
3978*33de042dSApple OSS Distributions }
3979*33de042dSApple OSS Distributions 
3980*33de042dSApple OSS Distributions /* Called with workq lock held. */
3981*33de042dSApple OSS Distributions static uint32_t
workq_constrained_allowance(struct workqueue * wq,thread_qos_t at_qos,struct uthread * uth,bool may_start_timer,bool record_failed_allowance)3982*33de042dSApple OSS Distributions workq_constrained_allowance(struct workqueue *wq, thread_qos_t at_qos,
3983*33de042dSApple OSS Distributions     struct uthread *uth, bool may_start_timer, bool record_failed_allowance)
3984*33de042dSApple OSS Distributions {
3985*33de042dSApple OSS Distributions 	assert(at_qos != WORKQ_THREAD_QOS_MANAGER);
3986*33de042dSApple OSS Distributions 	uint32_t allowance_passed = 0;
3987*33de042dSApple OSS Distributions 	uint32_t count = 0;
3988*33de042dSApple OSS Distributions 
3989*33de042dSApple OSS Distributions 	uint32_t max_count = wq->wq_constrained_threads_scheduled;
3990*33de042dSApple OSS Distributions 	if (uth && workq_thread_is_nonovercommit(uth)) {
3991*33de042dSApple OSS Distributions 		/*
3992*33de042dSApple OSS Distributions 		 * don't count the current thread as scheduled
3993*33de042dSApple OSS Distributions 		 */
3994*33de042dSApple OSS Distributions 		assert(max_count > 0);
3995*33de042dSApple OSS Distributions 		max_count--;
3996*33de042dSApple OSS Distributions 	}
3997*33de042dSApple OSS Distributions 	if (max_count >= wq_max_constrained_threads) {
3998*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_constrained_admission | DBG_FUNC_NONE, wq, 1,
3999*33de042dSApple OSS Distributions 		    wq->wq_constrained_threads_scheduled,
4000*33de042dSApple OSS Distributions 		    wq_max_constrained_threads);
4001*33de042dSApple OSS Distributions 		/*
4002*33de042dSApple OSS Distributions 		 * we need 1 or more constrained threads to return to the kernel before
4003*33de042dSApple OSS Distributions 		 * we can dispatch additional work
4004*33de042dSApple OSS Distributions 		 */
4005*33de042dSApple OSS Distributions 		allowance_passed = 0;
4006*33de042dSApple OSS Distributions 		goto out;
4007*33de042dSApple OSS Distributions 	}
4008*33de042dSApple OSS Distributions 	max_count -= wq_max_constrained_threads;
4009*33de042dSApple OSS Distributions 
4010*33de042dSApple OSS Distributions 	/*
4011*33de042dSApple OSS Distributions 	 * Compute a metric for many how many threads are active.  We find the
4012*33de042dSApple OSS Distributions 	 * highest priority request outstanding and then add up the number of active
4013*33de042dSApple OSS Distributions 	 * threads in that and all higher-priority buckets.  We'll also add any
4014*33de042dSApple OSS Distributions 	 * "busy" threads which are not currently active but blocked recently enough
4015*33de042dSApple OSS Distributions 	 * that we can't be sure that they won't be unblocked soon and start
4016*33de042dSApple OSS Distributions 	 * being active again.
4017*33de042dSApple OSS Distributions 	 *
4018*33de042dSApple OSS Distributions 	 * We'll then compare this metric to our max concurrency to decide whether
4019*33de042dSApple OSS Distributions 	 * to add a new thread.
4020*33de042dSApple OSS Distributions 	 */
4021*33de042dSApple OSS Distributions 
4022*33de042dSApple OSS Distributions 	uint32_t busycount, thactive_count;
4023*33de042dSApple OSS Distributions 
4024*33de042dSApple OSS Distributions 	thactive_count = _wq_thactive_aggregate_downto_qos(wq, _wq_thactive(wq),
4025*33de042dSApple OSS Distributions 	    at_qos, &busycount, NULL);
4026*33de042dSApple OSS Distributions 
4027*33de042dSApple OSS Distributions 	if (uth && uth->uu_workq_pri.qos_bucket != WORKQ_THREAD_QOS_MANAGER &&
4028*33de042dSApple OSS Distributions 	    at_qos <= uth->uu_workq_pri.qos_bucket) {
4029*33de042dSApple OSS Distributions 		/*
4030*33de042dSApple OSS Distributions 		 * Don't count this thread as currently active, but only if it's not
4031*33de042dSApple OSS Distributions 		 * a manager thread, as _wq_thactive_aggregate_downto_qos ignores active
4032*33de042dSApple OSS Distributions 		 * managers.
4033*33de042dSApple OSS Distributions 		 */
4034*33de042dSApple OSS Distributions 		assert(thactive_count > 0);
4035*33de042dSApple OSS Distributions 		thactive_count--;
4036*33de042dSApple OSS Distributions 	}
4037*33de042dSApple OSS Distributions 
4038*33de042dSApple OSS Distributions 	count = wq_max_parallelism[_wq_bucket(at_qos)];
4039*33de042dSApple OSS Distributions 	if (count > thactive_count + busycount) {
4040*33de042dSApple OSS Distributions 		count -= thactive_count + busycount;
4041*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_constrained_admission | DBG_FUNC_NONE, wq, 2,
4042*33de042dSApple OSS Distributions 		    thactive_count, busycount);
4043*33de042dSApple OSS Distributions 		allowance_passed = MIN(count, max_count);
4044*33de042dSApple OSS Distributions 		goto out;
4045*33de042dSApple OSS Distributions 	} else {
4046*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_constrained_admission | DBG_FUNC_NONE, wq, 3,
4047*33de042dSApple OSS Distributions 		    thactive_count, busycount);
4048*33de042dSApple OSS Distributions 		allowance_passed = 0;
4049*33de042dSApple OSS Distributions 	}
4050*33de042dSApple OSS Distributions 
4051*33de042dSApple OSS Distributions 	if (may_start_timer) {
4052*33de042dSApple OSS Distributions 		/*
4053*33de042dSApple OSS Distributions 		 * If this is called from the add timer, we won't have another timer
4054*33de042dSApple OSS Distributions 		 * fire when the thread exits the "busy" state, so rearm the timer.
4055*33de042dSApple OSS Distributions 		 */
4056*33de042dSApple OSS Distributions 		workq_schedule_delayed_thread_creation(wq, 0);
4057*33de042dSApple OSS Distributions 	}
4058*33de042dSApple OSS Distributions 
4059*33de042dSApple OSS Distributions out:
4060*33de042dSApple OSS Distributions 	if (record_failed_allowance) {
4061*33de042dSApple OSS Distributions 		wq->wq_exceeded_active_constrained_thread_limit = !allowance_passed;
4062*33de042dSApple OSS Distributions 	}
4063*33de042dSApple OSS Distributions 	return allowance_passed;
4064*33de042dSApple OSS Distributions }
4065*33de042dSApple OSS Distributions 
4066*33de042dSApple OSS Distributions static bool
workq_threadreq_admissible(struct workqueue * wq,struct uthread * uth,workq_threadreq_t req)4067*33de042dSApple OSS Distributions workq_threadreq_admissible(struct workqueue *wq, struct uthread *uth,
4068*33de042dSApple OSS Distributions     workq_threadreq_t req)
4069*33de042dSApple OSS Distributions {
4070*33de042dSApple OSS Distributions 	if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
4071*33de042dSApple OSS Distributions 		return workq_may_start_event_mgr_thread(wq, uth);
4072*33de042dSApple OSS Distributions 	}
4073*33de042dSApple OSS Distributions 	if (workq_threadreq_is_cooperative(req)) {
4074*33de042dSApple OSS Distributions 		return workq_cooperative_allowance(wq, req->tr_qos, uth, true);
4075*33de042dSApple OSS Distributions 	}
4076*33de042dSApple OSS Distributions 	if (workq_threadreq_is_nonovercommit(req)) {
4077*33de042dSApple OSS Distributions 		return workq_constrained_allowance(wq, req->tr_qos, uth, true, true);
4078*33de042dSApple OSS Distributions 	}
4079*33de042dSApple OSS Distributions 
4080*33de042dSApple OSS Distributions 	return true;
4081*33de042dSApple OSS Distributions }
4082*33de042dSApple OSS Distributions 
4083*33de042dSApple OSS Distributions /*
4084*33de042dSApple OSS Distributions  * Called from the context of selecting thread requests for threads returning
4085*33de042dSApple OSS Distributions  * from userspace or creator thread
4086*33de042dSApple OSS Distributions  */
4087*33de042dSApple OSS Distributions static workq_threadreq_t
workq_cooperative_queue_best_req(struct workqueue * wq,struct uthread * uth)4088*33de042dSApple OSS Distributions workq_cooperative_queue_best_req(struct workqueue *wq, struct uthread *uth)
4089*33de042dSApple OSS Distributions {
4090*33de042dSApple OSS Distributions 	workq_lock_held(wq);
4091*33de042dSApple OSS Distributions 
4092*33de042dSApple OSS Distributions 	/*
4093*33de042dSApple OSS Distributions 	 * If the current thread is cooperative, we need to exclude it as part of
4094*33de042dSApple OSS Distributions 	 * cooperative schedule count since this thread is looking for a new
4095*33de042dSApple OSS Distributions 	 * request. Change in the schedule count for cooperative pool therefore
4096*33de042dSApple OSS Distributions 	 * requires us to reeevaluate the next best request for it.
4097*33de042dSApple OSS Distributions 	 */
4098*33de042dSApple OSS Distributions 	if (uth && workq_thread_is_cooperative(uth)) {
4099*33de042dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_dec(wq, uth->uu_workq_pri.qos_req);
4100*33de042dSApple OSS Distributions 
4101*33de042dSApple OSS Distributions 		(void) _wq_cooperative_queue_refresh_best_req_qos(wq);
4102*33de042dSApple OSS Distributions 
4103*33de042dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_inc(wq, uth->uu_workq_pri.qos_req);
4104*33de042dSApple OSS Distributions 	} else {
4105*33de042dSApple OSS Distributions 		/*
4106*33de042dSApple OSS Distributions 		 * The old value that was already precomputed should be safe to use -
4107*33de042dSApple OSS Distributions 		 * add an assert that asserts that the best req QoS doesn't change in
4108*33de042dSApple OSS Distributions 		 * this case
4109*33de042dSApple OSS Distributions 		 */
4110*33de042dSApple OSS Distributions 		assert(_wq_cooperative_queue_refresh_best_req_qos(wq) == false);
4111*33de042dSApple OSS Distributions 	}
4112*33de042dSApple OSS Distributions 
4113*33de042dSApple OSS Distributions 	thread_qos_t qos = wq->wq_cooperative_queue_best_req_qos;
4114*33de042dSApple OSS Distributions 
4115*33de042dSApple OSS Distributions 	/* There are no eligible requests in the cooperative pool */
4116*33de042dSApple OSS Distributions 	if (qos == THREAD_QOS_UNSPECIFIED) {
4117*33de042dSApple OSS Distributions 		return NULL;
4118*33de042dSApple OSS Distributions 	}
4119*33de042dSApple OSS Distributions 	assert(qos != WORKQ_THREAD_QOS_ABOVEUI);
4120*33de042dSApple OSS Distributions 	assert(qos != WORKQ_THREAD_QOS_MANAGER);
4121*33de042dSApple OSS Distributions 
4122*33de042dSApple OSS Distributions 	uint8_t bucket = _wq_bucket(qos);
4123*33de042dSApple OSS Distributions 	assert(!STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket]));
4124*33de042dSApple OSS Distributions 
4125*33de042dSApple OSS Distributions 	return STAILQ_FIRST(&wq->wq_cooperative_queue[bucket]);
4126*33de042dSApple OSS Distributions }
4127*33de042dSApple OSS Distributions 
4128*33de042dSApple OSS Distributions static workq_threadreq_t
workq_threadreq_select_for_creator(struct workqueue * wq)4129*33de042dSApple OSS Distributions workq_threadreq_select_for_creator(struct workqueue *wq)
4130*33de042dSApple OSS Distributions {
4131*33de042dSApple OSS Distributions 	workq_threadreq_t req_qos, req_pri, req_tmp, req_mgr;
4132*33de042dSApple OSS Distributions 	thread_qos_t qos = THREAD_QOS_UNSPECIFIED;
4133*33de042dSApple OSS Distributions 	uint8_t pri = 0;
4134*33de042dSApple OSS Distributions 
4135*33de042dSApple OSS Distributions 	/*
4136*33de042dSApple OSS Distributions 	 * Compute the best priority request, and ignore the turnstile for now
4137*33de042dSApple OSS Distributions 	 */
4138*33de042dSApple OSS Distributions 
4139*33de042dSApple OSS Distributions 	req_pri = priority_queue_max(&wq->wq_special_queue,
4140*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4141*33de042dSApple OSS Distributions 	if (req_pri) {
4142*33de042dSApple OSS Distributions 		pri = (uint8_t)priority_queue_entry_sched_pri(&wq->wq_special_queue,
4143*33de042dSApple OSS Distributions 		    &req_pri->tr_entry);
4144*33de042dSApple OSS Distributions 	}
4145*33de042dSApple OSS Distributions 
4146*33de042dSApple OSS Distributions 	/*
4147*33de042dSApple OSS Distributions 	 * Handle the manager thread request. The special queue might yield
4148*33de042dSApple OSS Distributions 	 * a higher priority, but the manager always beats the QoS world.
4149*33de042dSApple OSS Distributions 	 */
4150*33de042dSApple OSS Distributions 
4151*33de042dSApple OSS Distributions 	req_mgr = wq->wq_event_manager_threadreq;
4152*33de042dSApple OSS Distributions 	if (req_mgr && workq_may_start_event_mgr_thread(wq, NULL)) {
4153*33de042dSApple OSS Distributions 		uint32_t mgr_pri = wq->wq_event_manager_priority;
4154*33de042dSApple OSS Distributions 
4155*33de042dSApple OSS Distributions 		if (mgr_pri & _PTHREAD_PRIORITY_SCHED_PRI_FLAG) {
4156*33de042dSApple OSS Distributions 			mgr_pri &= _PTHREAD_PRIORITY_SCHED_PRI_MASK;
4157*33de042dSApple OSS Distributions 		} else {
4158*33de042dSApple OSS Distributions 			mgr_pri = thread_workq_pri_for_qos(
4159*33de042dSApple OSS Distributions 				_pthread_priority_thread_qos(mgr_pri));
4160*33de042dSApple OSS Distributions 		}
4161*33de042dSApple OSS Distributions 
4162*33de042dSApple OSS Distributions 		return mgr_pri >= pri ? req_mgr : req_pri;
4163*33de042dSApple OSS Distributions 	}
4164*33de042dSApple OSS Distributions 
4165*33de042dSApple OSS Distributions 	/*
4166*33de042dSApple OSS Distributions 	 * Compute the best QoS Request, and check whether it beats the "pri" one
4167*33de042dSApple OSS Distributions 	 *
4168*33de042dSApple OSS Distributions 	 * Start by comparing the overcommit and the cooperative pool
4169*33de042dSApple OSS Distributions 	 */
4170*33de042dSApple OSS Distributions 	req_qos = priority_queue_max(&wq->wq_overcommit_queue,
4171*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4172*33de042dSApple OSS Distributions 	if (req_qos) {
4173*33de042dSApple OSS Distributions 		qos = req_qos->tr_qos;
4174*33de042dSApple OSS Distributions 	}
4175*33de042dSApple OSS Distributions 
4176*33de042dSApple OSS Distributions 	req_tmp = workq_cooperative_queue_best_req(wq, NULL);
4177*33de042dSApple OSS Distributions 	if (req_tmp && qos <= req_tmp->tr_qos) {
4178*33de042dSApple OSS Distributions 		/*
4179*33de042dSApple OSS Distributions 		 * Cooperative TR is better between overcommit and cooperative.  Note
4180*33de042dSApple OSS Distributions 		 * that if qos is same between overcommit and cooperative, we choose
4181*33de042dSApple OSS Distributions 		 * cooperative.
4182*33de042dSApple OSS Distributions 		 *
4183*33de042dSApple OSS Distributions 		 * Pick cooperative pool if it passes the admissions check
4184*33de042dSApple OSS Distributions 		 */
4185*33de042dSApple OSS Distributions 		if (workq_cooperative_allowance(wq, req_tmp->tr_qos, NULL, true)) {
4186*33de042dSApple OSS Distributions 			req_qos = req_tmp;
4187*33de042dSApple OSS Distributions 			qos = req_qos->tr_qos;
4188*33de042dSApple OSS Distributions 		}
4189*33de042dSApple OSS Distributions 	}
4190*33de042dSApple OSS Distributions 
4191*33de042dSApple OSS Distributions 	/*
4192*33de042dSApple OSS Distributions 	 * Compare the best QoS so far - either from overcommit or from cooperative
4193*33de042dSApple OSS Distributions 	 * pool - and compare it with the constrained pool
4194*33de042dSApple OSS Distributions 	 */
4195*33de042dSApple OSS Distributions 	req_tmp = priority_queue_max(&wq->wq_constrained_queue,
4196*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4197*33de042dSApple OSS Distributions 
4198*33de042dSApple OSS Distributions 	if (req_tmp && qos < req_tmp->tr_qos) {
4199*33de042dSApple OSS Distributions 		/*
4200*33de042dSApple OSS Distributions 		 * Constrained pool is best in QoS between overcommit, cooperative
4201*33de042dSApple OSS Distributions 		 * and constrained. Now check how it fairs against the priority case
4202*33de042dSApple OSS Distributions 		 * and constrained. Now check how it fares against the priority case
4203*33de042dSApple OSS Distributions 		if (pri && pri >= thread_workq_pri_for_qos(req_tmp->tr_qos)) {
4204*33de042dSApple OSS Distributions 			return req_pri;
4205*33de042dSApple OSS Distributions 		}
4206*33de042dSApple OSS Distributions 
4207*33de042dSApple OSS Distributions 		if (workq_constrained_allowance(wq, req_tmp->tr_qos, NULL, true, true)) {
4208*33de042dSApple OSS Distributions 			/*
4209*33de042dSApple OSS Distributions 			 * If the constrained thread request is the best one and passes
4210*33de042dSApple OSS Distributions 			 * the admission check, pick it.
4211*33de042dSApple OSS Distributions 			 */
4212*33de042dSApple OSS Distributions 			return req_tmp;
4213*33de042dSApple OSS Distributions 		}
4214*33de042dSApple OSS Distributions 	}
4215*33de042dSApple OSS Distributions 
4216*33de042dSApple OSS Distributions 	/*
4217*33de042dSApple OSS Distributions 	 * Compare the best of the QoS world with the priority
4218*33de042dSApple OSS Distributions 	 */
4219*33de042dSApple OSS Distributions 	if (pri && (!qos || pri >= thread_workq_pri_for_qos(qos))) {
4220*33de042dSApple OSS Distributions 		return req_pri;
4221*33de042dSApple OSS Distributions 	}
4222*33de042dSApple OSS Distributions 
4223*33de042dSApple OSS Distributions 	if (req_qos) {
4224*33de042dSApple OSS Distributions 		return req_qos;
4225*33de042dSApple OSS Distributions 	}
4226*33de042dSApple OSS Distributions 
4227*33de042dSApple OSS Distributions 	/*
4228*33de042dSApple OSS Distributions 	 * If we had no eligible request but we have a turnstile push,
4229*33de042dSApple OSS Distributions 	 * it must be a non overcommit thread request that failed
4230*33de042dSApple OSS Distributions 	 * the admission check.
4231*33de042dSApple OSS Distributions 	 *
4232*33de042dSApple OSS Distributions 	 * Just fake a BG thread request so that if the push stops the creator
4233*33de042dSApple OSS Distributions 	 * priority just drops to 4.
4234*33de042dSApple OSS Distributions 	 */
4235*33de042dSApple OSS Distributions 	if (turnstile_workq_proprietor_of_max_turnstile(wq->wq_turnstile, NULL)) {
4236*33de042dSApple OSS Distributions 		static struct workq_threadreq_s workq_sync_push_fake_req = {
4237*33de042dSApple OSS Distributions 			.tr_qos = THREAD_QOS_BACKGROUND,
4238*33de042dSApple OSS Distributions 		};
4239*33de042dSApple OSS Distributions 
4240*33de042dSApple OSS Distributions 		return &workq_sync_push_fake_req;
4241*33de042dSApple OSS Distributions 	}
4242*33de042dSApple OSS Distributions 
4243*33de042dSApple OSS Distributions 	return NULL;
4244*33de042dSApple OSS Distributions }
4245*33de042dSApple OSS Distributions 
4246*33de042dSApple OSS Distributions /*
4247*33de042dSApple OSS Distributions  * Returns true if this caused a change in the schedule counts of the
4248*33de042dSApple OSS Distributions  * cooperative pool
4249*33de042dSApple OSS Distributions  */
4250*33de042dSApple OSS Distributions static bool
workq_adjust_cooperative_constrained_schedule_counts(struct workqueue * wq,struct uthread * uth,thread_qos_t old_thread_qos,workq_tr_flags_t tr_flags)4251*33de042dSApple OSS Distributions workq_adjust_cooperative_constrained_schedule_counts(struct workqueue *wq,
4252*33de042dSApple OSS Distributions     struct uthread *uth, thread_qos_t old_thread_qos, workq_tr_flags_t tr_flags)
4253*33de042dSApple OSS Distributions {
4254*33de042dSApple OSS Distributions 	workq_lock_held(wq);
4255*33de042dSApple OSS Distributions 
4256*33de042dSApple OSS Distributions 	/*
4257*33de042dSApple OSS Distributions 	 * Row: thread type
4258*33de042dSApple OSS Distributions 	 * Column: Request type
4259*33de042dSApple OSS Distributions 	 *
4260*33de042dSApple OSS Distributions 	 *					overcommit		non-overcommit		cooperative
4261*33de042dSApple OSS Distributions 	 * overcommit			X				case 1				case 2
4262*33de042dSApple OSS Distributions 	 * cooperative		case 3				case 4				case 5
4263*33de042dSApple OSS Distributions 	 * non-overcommit	case 6					X				case 7
4264*33de042dSApple OSS Distributions 	 *
4265*33de042dSApple OSS Distributions 	 * Move the thread to the right bucket depending on what state it currently
4266*33de042dSApple OSS Distributions 	 * has and what state the thread req it picks, is going to have.
4267*33de042dSApple OSS Distributions 	 *
4268*33de042dSApple OSS Distributions 	 * Note that the creator thread is an overcommit thread.
4269*33de042dSApple OSS Distributions 	 */
4270*33de042dSApple OSS Distributions 	thread_qos_t new_thread_qos = uth->uu_workq_pri.qos_req;
4271*33de042dSApple OSS Distributions 
4272*33de042dSApple OSS Distributions 	/*
4273*33de042dSApple OSS Distributions 	 * Anytime a cooperative bucket's schedule count changes, we need to
4274*33de042dSApple OSS Distributions 	 * potentially refresh the next best QoS for that pool when we determine
4275*33de042dSApple OSS Distributions 	 * the next request for the creator
4276*33de042dSApple OSS Distributions 	 */
4277*33de042dSApple OSS Distributions 	bool cooperative_pool_sched_count_changed = false;
4278*33de042dSApple OSS Distributions 
4279*33de042dSApple OSS Distributions 	if (workq_thread_is_overcommit(uth)) {
4280*33de042dSApple OSS Distributions 		if (workq_tr_is_nonovercommit(tr_flags)) {
4281*33de042dSApple OSS Distributions 			// Case 1: thread is overcommit, req is non-overcommit
4282*33de042dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled++;
4283*33de042dSApple OSS Distributions 		} else if (workq_tr_is_cooperative(tr_flags)) {
4284*33de042dSApple OSS Distributions 			// Case 2: thread is overcommit, req is cooperative
4285*33de042dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_inc(wq, new_thread_qos);
4286*33de042dSApple OSS Distributions 			cooperative_pool_sched_count_changed = true;
4287*33de042dSApple OSS Distributions 		}
4288*33de042dSApple OSS Distributions 	} else if (workq_thread_is_cooperative(uth)) {
4289*33de042dSApple OSS Distributions 		if (workq_tr_is_overcommit(tr_flags)) {
4290*33de042dSApple OSS Distributions 			// Case 3: thread is cooperative, req is overcommit
4291*33de042dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_dec(wq, old_thread_qos);
4292*33de042dSApple OSS Distributions 		} else if (workq_tr_is_nonovercommit(tr_flags)) {
4293*33de042dSApple OSS Distributions 			// Case 4: thread is cooperative, req is non-overcommit
4294*33de042dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_dec(wq, old_thread_qos);
4295*33de042dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled++;
4296*33de042dSApple OSS Distributions 		} else {
4297*33de042dSApple OSS Distributions 			// Case 5: thread is cooperative, req is also cooperative
4298*33de042dSApple OSS Distributions 			assert(workq_tr_is_cooperative(tr_flags));
4299*33de042dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_dec(wq, old_thread_qos);
4300*33de042dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_inc(wq, new_thread_qos);
4301*33de042dSApple OSS Distributions 		}
4302*33de042dSApple OSS Distributions 		cooperative_pool_sched_count_changed = true;
4303*33de042dSApple OSS Distributions 	} else {
4304*33de042dSApple OSS Distributions 		if (workq_tr_is_overcommit(tr_flags)) {
4305*33de042dSApple OSS Distributions 			// Case 6: Thread is non-overcommit, req is overcommit
4306*33de042dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled--;
4307*33de042dSApple OSS Distributions 		} else if (workq_tr_is_cooperative(tr_flags)) {
4308*33de042dSApple OSS Distributions 			// Case 7: Thread is non-overcommit, req is cooperative
4309*33de042dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled--;
4310*33de042dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_inc(wq, new_thread_qos);
4311*33de042dSApple OSS Distributions 			cooperative_pool_sched_count_changed = true;
4312*33de042dSApple OSS Distributions 		}
4313*33de042dSApple OSS Distributions 	}
4314*33de042dSApple OSS Distributions 
4315*33de042dSApple OSS Distributions 	return cooperative_pool_sched_count_changed;
4316*33de042dSApple OSS Distributions }
4317*33de042dSApple OSS Distributions 
4318*33de042dSApple OSS Distributions static workq_threadreq_t
workq_threadreq_select(struct workqueue * wq,struct uthread * uth)4319*33de042dSApple OSS Distributions workq_threadreq_select(struct workqueue *wq, struct uthread *uth)
4320*33de042dSApple OSS Distributions {
4321*33de042dSApple OSS Distributions 	workq_threadreq_t req_qos, req_pri, req_tmp, req_mgr;
4322*33de042dSApple OSS Distributions 	uintptr_t proprietor;
4323*33de042dSApple OSS Distributions 	thread_qos_t qos = THREAD_QOS_UNSPECIFIED;
4324*33de042dSApple OSS Distributions 	uint8_t pri = 0;
4325*33de042dSApple OSS Distributions 
4326*33de042dSApple OSS Distributions 	if (uth == wq->wq_creator) {
4327*33de042dSApple OSS Distributions 		uth = NULL;
4328*33de042dSApple OSS Distributions 	}
4329*33de042dSApple OSS Distributions 
4330*33de042dSApple OSS Distributions 	/*
4331*33de042dSApple OSS Distributions 	 * Compute the best priority request (special or turnstile)
4332*33de042dSApple OSS Distributions 	 */
4333*33de042dSApple OSS Distributions 
4334*33de042dSApple OSS Distributions 	pri = (uint8_t)turnstile_workq_proprietor_of_max_turnstile(wq->wq_turnstile,
4335*33de042dSApple OSS Distributions 	    &proprietor);
4336*33de042dSApple OSS Distributions 	if (pri) {
4337*33de042dSApple OSS Distributions 		struct kqworkloop *kqwl = (struct kqworkloop *)proprietor;
4338*33de042dSApple OSS Distributions 		req_pri = &kqwl->kqwl_request;
4339*33de042dSApple OSS Distributions 		if (req_pri->tr_state != WORKQ_TR_STATE_QUEUED) {
4340*33de042dSApple OSS Distributions 			panic("Invalid thread request (%p) state %d",
4341*33de042dSApple OSS Distributions 			    req_pri, req_pri->tr_state);
4342*33de042dSApple OSS Distributions 		}
4343*33de042dSApple OSS Distributions 	} else {
4344*33de042dSApple OSS Distributions 		req_pri = NULL;
4345*33de042dSApple OSS Distributions 	}
4346*33de042dSApple OSS Distributions 
4347*33de042dSApple OSS Distributions 	req_tmp = priority_queue_max(&wq->wq_special_queue,
4348*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4349*33de042dSApple OSS Distributions 	if (req_tmp && pri < priority_queue_entry_sched_pri(&wq->wq_special_queue,
4350*33de042dSApple OSS Distributions 	    &req_tmp->tr_entry)) {
4351*33de042dSApple OSS Distributions 		req_pri = req_tmp;
4352*33de042dSApple OSS Distributions 		pri = (uint8_t)priority_queue_entry_sched_pri(&wq->wq_special_queue,
4353*33de042dSApple OSS Distributions 		    &req_tmp->tr_entry);
4354*33de042dSApple OSS Distributions 	}
4355*33de042dSApple OSS Distributions 
4356*33de042dSApple OSS Distributions 	/*
4357*33de042dSApple OSS Distributions 	 * Handle the manager thread request. The special queue might yield
4358*33de042dSApple OSS Distributions 	 * a higher priority, but the manager always beats the QoS world.
4359*33de042dSApple OSS Distributions 	 */
4360*33de042dSApple OSS Distributions 
4361*33de042dSApple OSS Distributions 	req_mgr = wq->wq_event_manager_threadreq;
4362*33de042dSApple OSS Distributions 	if (req_mgr && workq_may_start_event_mgr_thread(wq, uth)) {
4363*33de042dSApple OSS Distributions 		uint32_t mgr_pri = wq->wq_event_manager_priority;
4364*33de042dSApple OSS Distributions 
4365*33de042dSApple OSS Distributions 		if (mgr_pri & _PTHREAD_PRIORITY_SCHED_PRI_FLAG) {
4366*33de042dSApple OSS Distributions 			mgr_pri &= _PTHREAD_PRIORITY_SCHED_PRI_MASK;
4367*33de042dSApple OSS Distributions 		} else {
4368*33de042dSApple OSS Distributions 			mgr_pri = thread_workq_pri_for_qos(
4369*33de042dSApple OSS Distributions 				_pthread_priority_thread_qos(mgr_pri));
4370*33de042dSApple OSS Distributions 		}
4371*33de042dSApple OSS Distributions 
4372*33de042dSApple OSS Distributions 		return mgr_pri >= pri ? req_mgr : req_pri;
4373*33de042dSApple OSS Distributions 	}
4374*33de042dSApple OSS Distributions 
4375*33de042dSApple OSS Distributions 	/*
4376*33de042dSApple OSS Distributions 	 * Compute the best QoS Request, and check whether it beats the "pri" one
4377*33de042dSApple OSS Distributions 	 */
4378*33de042dSApple OSS Distributions 
4379*33de042dSApple OSS Distributions 	req_qos = priority_queue_max(&wq->wq_overcommit_queue,
4380*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4381*33de042dSApple OSS Distributions 	if (req_qos) {
4382*33de042dSApple OSS Distributions 		qos = req_qos->tr_qos;
4383*33de042dSApple OSS Distributions 	}
4384*33de042dSApple OSS Distributions 
4385*33de042dSApple OSS Distributions 	req_tmp = workq_cooperative_queue_best_req(wq, uth);
4386*33de042dSApple OSS Distributions 	if (req_tmp && qos <= req_tmp->tr_qos) {
4387*33de042dSApple OSS Distributions 		/*
4388*33de042dSApple OSS Distributions 		 * Cooperative TR is better between overcommit and cooperative.  Note
4389*33de042dSApple OSS Distributions 		 * that if qos is same between overcommit and cooperative, we choose
4390*33de042dSApple OSS Distributions 		 * cooperative.
4391*33de042dSApple OSS Distributions 		 *
4392*33de042dSApple OSS Distributions 		 * Pick cooperative pool if it passes the admissions check
4393*33de042dSApple OSS Distributions 		 */
4394*33de042dSApple OSS Distributions 		if (workq_cooperative_allowance(wq, req_tmp->tr_qos, uth, true)) {
4395*33de042dSApple OSS Distributions 			req_qos = req_tmp;
4396*33de042dSApple OSS Distributions 			qos = req_qos->tr_qos;
4397*33de042dSApple OSS Distributions 		}
4398*33de042dSApple OSS Distributions 	}
4399*33de042dSApple OSS Distributions 
4400*33de042dSApple OSS Distributions 	/*
4401*33de042dSApple OSS Distributions 	 * Compare the best QoS so far - either from overcommit or from cooperative
4402*33de042dSApple OSS Distributions 	 * pool - and compare it with the constrained pool
4403*33de042dSApple OSS Distributions 	 */
4404*33de042dSApple OSS Distributions 	req_tmp = priority_queue_max(&wq->wq_constrained_queue,
4405*33de042dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4406*33de042dSApple OSS Distributions 
4407*33de042dSApple OSS Distributions 	if (req_tmp && qos < req_tmp->tr_qos) {
4408*33de042dSApple OSS Distributions 		/*
4409*33de042dSApple OSS Distributions 		 * Constrained pool is best in QoS between overcommit, cooperative
4410*33de042dSApple OSS Distributions 		 * and constrained. Now check how it fairs against the priority case
4411*33de042dSApple OSS Distributions 		 */
4412*33de042dSApple OSS Distributions 		if (pri && pri >= thread_workq_pri_for_qos(req_tmp->tr_qos)) {
4413*33de042dSApple OSS Distributions 			return req_pri;
4414*33de042dSApple OSS Distributions 		}
4415*33de042dSApple OSS Distributions 
4416*33de042dSApple OSS Distributions 		if (workq_constrained_allowance(wq, req_tmp->tr_qos, uth, true, true)) {
4417*33de042dSApple OSS Distributions 			/*
4418*33de042dSApple OSS Distributions 			 * If the constrained thread request is the best one and passes
4419*33de042dSApple OSS Distributions 			 * the admission check, pick it.
4420*33de042dSApple OSS Distributions 			 */
4421*33de042dSApple OSS Distributions 			return req_tmp;
4422*33de042dSApple OSS Distributions 		}
4423*33de042dSApple OSS Distributions 	}
4424*33de042dSApple OSS Distributions 
4425*33de042dSApple OSS Distributions 	if (req_pri && (!qos || pri >= thread_workq_pri_for_qos(qos))) {
4426*33de042dSApple OSS Distributions 		return req_pri;
4427*33de042dSApple OSS Distributions 	}
4428*33de042dSApple OSS Distributions 
4429*33de042dSApple OSS Distributions 	return req_qos;
4430*33de042dSApple OSS Distributions }
4431*33de042dSApple OSS Distributions 
4432*33de042dSApple OSS Distributions /*
4433*33de042dSApple OSS Distributions  * The creator is an anonymous thread that is counted as scheduled,
4434*33de042dSApple OSS Distributions  * but otherwise without its scheduler callback set or tracked as active
4435*33de042dSApple OSS Distributions  * that is used to make other threads.
4436*33de042dSApple OSS Distributions  *
4437*33de042dSApple OSS Distributions  * When more requests are added or an existing one is hurried along,
4438*33de042dSApple OSS Distributions  * a creator is elected and setup, or the existing one overridden accordingly.
4439*33de042dSApple OSS Distributions  *
4440*33de042dSApple OSS Distributions  * While this creator is in flight, because no request has been dequeued,
4441*33de042dSApple OSS Distributions  * already running threads have a chance at stealing thread requests avoiding
4442*33de042dSApple OSS Distributions  * useless context switches, and the creator once scheduled may not find any
4443*33de042dSApple OSS Distributions  * work to do and will then just park again.
4444*33de042dSApple OSS Distributions  *
4445*33de042dSApple OSS Distributions  * The creator serves the dual purpose of informing the scheduler of work that
4446*33de042dSApple OSS Distributions  * hasn't be materialized as threads yet, and also as a natural pacing mechanism
4447*33de042dSApple OSS Distributions  * for thread creation.
4448*33de042dSApple OSS Distributions  *
4449*33de042dSApple OSS Distributions  * By being anonymous (and not bound to anything) it means that thread requests
4450*33de042dSApple OSS Distributions  * can be stolen from this creator by threads already on core yielding more
4451*33de042dSApple OSS Distributions  * efficient scheduling and reduced context switches.
4452*33de042dSApple OSS Distributions  */
4453*33de042dSApple OSS Distributions static void
workq_schedule_creator(proc_t p,struct workqueue * wq,workq_kern_threadreq_flags_t flags)4454*33de042dSApple OSS Distributions workq_schedule_creator(proc_t p, struct workqueue *wq,
4455*33de042dSApple OSS Distributions     workq_kern_threadreq_flags_t flags)
4456*33de042dSApple OSS Distributions {
4457*33de042dSApple OSS Distributions 	workq_threadreq_t req;
4458*33de042dSApple OSS Distributions 	struct uthread *uth;
4459*33de042dSApple OSS Distributions 	bool needs_wakeup;
4460*33de042dSApple OSS Distributions 
4461*33de042dSApple OSS Distributions 	workq_lock_held(wq);
4462*33de042dSApple OSS Distributions 	assert(p || (flags & WORKQ_THREADREQ_CAN_CREATE_THREADS) == 0);
4463*33de042dSApple OSS Distributions 
4464*33de042dSApple OSS Distributions again:
4465*33de042dSApple OSS Distributions 	uth = wq->wq_creator;
4466*33de042dSApple OSS Distributions 
4467*33de042dSApple OSS Distributions 	if (!wq->wq_reqcount) {
4468*33de042dSApple OSS Distributions 		/*
4469*33de042dSApple OSS Distributions 		 * There is no thread request left.
4470*33de042dSApple OSS Distributions 		 *
4471*33de042dSApple OSS Distributions 		 * If there is a creator, leave everything in place, so that it cleans
4472*33de042dSApple OSS Distributions 		 * up itself in workq_push_idle_thread().
4473*33de042dSApple OSS Distributions 		 *
4474*33de042dSApple OSS Distributions 		 * Else, make sure the turnstile state is reset to no inheritor.
4475*33de042dSApple OSS Distributions 		 */
4476*33de042dSApple OSS Distributions 		if (uth == NULL) {
4477*33de042dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
4478*33de042dSApple OSS Distributions 		}
4479*33de042dSApple OSS Distributions 		return;
4480*33de042dSApple OSS Distributions 	}
4481*33de042dSApple OSS Distributions 
4482*33de042dSApple OSS Distributions 	req = workq_threadreq_select_for_creator(wq);
4483*33de042dSApple OSS Distributions 	if (req == NULL) {
4484*33de042dSApple OSS Distributions 		/*
4485*33de042dSApple OSS Distributions 		 * There isn't a thread request that passes the admission check.
4486*33de042dSApple OSS Distributions 		 *
4487*33de042dSApple OSS Distributions 		 * If there is a creator, do not touch anything, the creator will sort
4488*33de042dSApple OSS Distributions 		 * it out when it runs.
4489*33de042dSApple OSS Distributions 		 *
4490*33de042dSApple OSS Distributions 		 * Else, set the inheritor to "WORKQ" so that the turnstile propagation
4491*33de042dSApple OSS Distributions 		 * code calls us if anything changes.
4492*33de042dSApple OSS Distributions 		 */
4493*33de042dSApple OSS Distributions 		if (uth == NULL) {
4494*33de042dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, wq, TURNSTILE_INHERITOR_WORKQ);
4495*33de042dSApple OSS Distributions 		}
4496*33de042dSApple OSS Distributions 		return;
4497*33de042dSApple OSS Distributions 	}
4498*33de042dSApple OSS Distributions 
4499*33de042dSApple OSS Distributions 
4500*33de042dSApple OSS Distributions 	if (uth) {
4501*33de042dSApple OSS Distributions 		/*
4502*33de042dSApple OSS Distributions 		 * We need to maybe override the creator we already have
4503*33de042dSApple OSS Distributions 		 */
4504*33de042dSApple OSS Distributions 		if (workq_thread_needs_priority_change(req, uth)) {
4505*33de042dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_creator_select | DBG_FUNC_NONE,
4506*33de042dSApple OSS Distributions 			    wq, 1, uthread_tid(uth), req->tr_qos);
4507*33de042dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
4508*33de042dSApple OSS Distributions 		}
4509*33de042dSApple OSS Distributions 		assert(wq->wq_inheritor == get_machthread(uth));
4510*33de042dSApple OSS Distributions 	} else if (wq->wq_thidlecount) {
4511*33de042dSApple OSS Distributions 		/*
4512*33de042dSApple OSS Distributions 		 * We need to unpark a creator thread
4513*33de042dSApple OSS Distributions 		 */
4514*33de042dSApple OSS Distributions 		wq->wq_creator = uth = workq_pop_idle_thread(wq, UT_WORKQ_OVERCOMMIT,
4515*33de042dSApple OSS Distributions 		    &needs_wakeup);
4516*33de042dSApple OSS Distributions 		/* Always reset the priorities on the newly chosen creator */
4517*33de042dSApple OSS Distributions 		workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
4518*33de042dSApple OSS Distributions 		workq_turnstile_update_inheritor(wq, get_machthread(uth),
4519*33de042dSApple OSS Distributions 		    TURNSTILE_INHERITOR_THREAD);
4520*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_select | DBG_FUNC_NONE,
4521*33de042dSApple OSS Distributions 		    wq, 2, uthread_tid(uth), req->tr_qos);
4522*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.fulfilled_snapshot = wq->wq_fulfilled;
4523*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.yields = 0;
4524*33de042dSApple OSS Distributions 		if (needs_wakeup) {
4525*33de042dSApple OSS Distributions 			workq_thread_wakeup(uth);
4526*33de042dSApple OSS Distributions 		}
4527*33de042dSApple OSS Distributions 	} else {
4528*33de042dSApple OSS Distributions 		/*
4529*33de042dSApple OSS Distributions 		 * We need to allocate a thread...
4530*33de042dSApple OSS Distributions 		 */
4531*33de042dSApple OSS Distributions 		if (__improbable(wq->wq_nthreads >= wq_max_threads)) {
4532*33de042dSApple OSS Distributions 			/* out of threads, just go away */
4533*33de042dSApple OSS Distributions 			flags = WORKQ_THREADREQ_NONE;
4534*33de042dSApple OSS Distributions 		} else if (flags & WORKQ_THREADREQ_SET_AST_ON_FAILURE) {
4535*33de042dSApple OSS Distributions 			act_set_astkevent(current_thread(), AST_KEVENT_REDRIVE_THREADREQ);
4536*33de042dSApple OSS Distributions 		} else if (!(flags & WORKQ_THREADREQ_CAN_CREATE_THREADS)) {
4537*33de042dSApple OSS Distributions 			/* This can drop the workqueue lock, and take it again */
4538*33de042dSApple OSS Distributions 			workq_schedule_immediate_thread_creation(wq);
4539*33de042dSApple OSS Distributions 		} else if ((workq_add_new_idle_thread(p, wq,
4540*33de042dSApple OSS Distributions 		    workq_unpark_continue, false, NULL) == KERN_SUCCESS)) {
4541*33de042dSApple OSS Distributions 			goto again;
4542*33de042dSApple OSS Distributions 		} else {
4543*33de042dSApple OSS Distributions 			workq_schedule_delayed_thread_creation(wq, 0);
4544*33de042dSApple OSS Distributions 		}
4545*33de042dSApple OSS Distributions 
4546*33de042dSApple OSS Distributions 		/*
4547*33de042dSApple OSS Distributions 		 * If the current thread is the inheritor:
4548*33de042dSApple OSS Distributions 		 *
4549*33de042dSApple OSS Distributions 		 * If we set the AST, then the thread will stay the inheritor until
4550*33de042dSApple OSS Distributions 		 * either the AST calls workq_kern_threadreq_redrive(), or it parks
4551*33de042dSApple OSS Distributions 		 * and calls workq_push_idle_thread().
4552*33de042dSApple OSS Distributions 		 *
4553*33de042dSApple OSS Distributions 		 * Else, the responsibility of the thread creation is with a thread-call
4554*33de042dSApple OSS Distributions 		 * and we need to clear the inheritor.
4555*33de042dSApple OSS Distributions 		 */
4556*33de042dSApple OSS Distributions 		if ((flags & WORKQ_THREADREQ_SET_AST_ON_FAILURE) == 0 &&
4557*33de042dSApple OSS Distributions 		    wq->wq_inheritor == current_thread()) {
4558*33de042dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
4559*33de042dSApple OSS Distributions 		}
4560*33de042dSApple OSS Distributions 	}
4561*33de042dSApple OSS Distributions }
4562*33de042dSApple OSS Distributions 
4563*33de042dSApple OSS Distributions /**
4564*33de042dSApple OSS Distributions  * Same as workq_unpark_select_threadreq_or_park_and_unlock,
4565*33de042dSApple OSS Distributions  * but do not allow early binds.
4566*33de042dSApple OSS Distributions  *
4567*33de042dSApple OSS Distributions  * Called with the base pri frozen, will unfreeze it.
4568*33de042dSApple OSS Distributions  */
4569*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
4570*33de042dSApple OSS Distributions static void
workq_select_threadreq_or_park_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)4571*33de042dSApple OSS Distributions workq_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
4572*33de042dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags)
4573*33de042dSApple OSS Distributions {
4574*33de042dSApple OSS Distributions 	workq_threadreq_t req = NULL;
4575*33de042dSApple OSS Distributions 	bool is_creator = (wq->wq_creator == uth);
4576*33de042dSApple OSS Distributions 	bool schedule_creator = false;
4577*33de042dSApple OSS Distributions 
4578*33de042dSApple OSS Distributions 	if (__improbable(_wq_exiting(wq))) {
4579*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 0, 0, 0);
4580*33de042dSApple OSS Distributions 		goto park;
4581*33de042dSApple OSS Distributions 	}
4582*33de042dSApple OSS Distributions 
4583*33de042dSApple OSS Distributions 	if (wq->wq_reqcount == 0) {
4584*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 1, 0, 0);
4585*33de042dSApple OSS Distributions 		goto park;
4586*33de042dSApple OSS Distributions 	}
4587*33de042dSApple OSS Distributions 
4588*33de042dSApple OSS Distributions 	req = workq_threadreq_select(wq, uth);
4589*33de042dSApple OSS Distributions 	if (__improbable(req == NULL)) {
4590*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 2, 0, 0);
4591*33de042dSApple OSS Distributions 		goto park;
4592*33de042dSApple OSS Distributions 	}
4593*33de042dSApple OSS Distributions 
4594*33de042dSApple OSS Distributions 	struct uu_workq_policy old_pri = uth->uu_workq_pri;
4595*33de042dSApple OSS Distributions 	uint8_t tr_flags = req->tr_flags;
4596*33de042dSApple OSS Distributions 	struct turnstile *req_ts = kqueue_threadreq_get_turnstile(req);
4597*33de042dSApple OSS Distributions 
4598*33de042dSApple OSS Distributions 	/*
4599*33de042dSApple OSS Distributions 	 * Attempt to setup ourselves as the new thing to run, moving all priority
4600*33de042dSApple OSS Distributions 	 * pushes to ourselves.
4601*33de042dSApple OSS Distributions 	 *
4602*33de042dSApple OSS Distributions 	 * If the current thread is the creator, then the fact that we are presently
4603*33de042dSApple OSS Distributions 	 * running is proof that we'll do something useful, so keep going.
4604*33de042dSApple OSS Distributions 	 *
4605*33de042dSApple OSS Distributions 	 * For other cases, peek at the AST to know whether the scheduler wants
4606*33de042dSApple OSS Distributions 	 * to preempt us, if yes, park instead, and move the thread request
4607*33de042dSApple OSS Distributions 	 * turnstile back to the workqueue.
4608*33de042dSApple OSS Distributions 	 */
4609*33de042dSApple OSS Distributions 	if (req_ts) {
4610*33de042dSApple OSS Distributions 		workq_perform_turnstile_operation_locked(wq, ^{
4611*33de042dSApple OSS Distributions 			turnstile_update_inheritor(req_ts, get_machthread(uth),
4612*33de042dSApple OSS Distributions 			TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_THREAD);
4613*33de042dSApple OSS Distributions 			turnstile_update_inheritor_complete(req_ts,
4614*33de042dSApple OSS Distributions 			TURNSTILE_INTERLOCK_HELD);
4615*33de042dSApple OSS Distributions 		});
4616*33de042dSApple OSS Distributions 	}
4617*33de042dSApple OSS Distributions 
4618*33de042dSApple OSS Distributions 	/* accounting changes of aggregate thscheduled_count and thactive which has
4619*33de042dSApple OSS Distributions 	 * to be paired with the workq_thread_reset_pri below so that we have
4620*33de042dSApple OSS Distributions 	 * uth->uu_workq_pri match with thactive.
4621*33de042dSApple OSS Distributions 	 *
4622*33de042dSApple OSS Distributions 	 * This is undone when the thread parks */
4623*33de042dSApple OSS Distributions 	if (is_creator) {
4624*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_select, wq, 4, 0,
4625*33de042dSApple OSS Distributions 		    uth->uu_save.uus_workq_park_data.yields);
4626*33de042dSApple OSS Distributions 		wq->wq_creator = NULL;
4627*33de042dSApple OSS Distributions 		_wq_thactive_inc(wq, req->tr_qos);
4628*33de042dSApple OSS Distributions 		wq->wq_thscheduled_count[_wq_bucket(req->tr_qos)]++;
4629*33de042dSApple OSS Distributions 	} else if (old_pri.qos_bucket != req->tr_qos) {
4630*33de042dSApple OSS Distributions 		_wq_thactive_move(wq, old_pri.qos_bucket, req->tr_qos);
4631*33de042dSApple OSS Distributions 	}
4632*33de042dSApple OSS Distributions 	workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
4633*33de042dSApple OSS Distributions 
4634*33de042dSApple OSS Distributions 	/*
4635*33de042dSApple OSS Distributions 	 * Make relevant accounting changes for pool specific counts.
4636*33de042dSApple OSS Distributions 	 *
4637*33de042dSApple OSS Distributions 	 * The schedule counts changing can affect what the next best request
4638*33de042dSApple OSS Distributions 	 * for cooperative thread pool is if this request is dequeued.
4639*33de042dSApple OSS Distributions 	 */
4640*33de042dSApple OSS Distributions 	bool cooperative_sched_count_changed =
4641*33de042dSApple OSS Distributions 	    workq_adjust_cooperative_constrained_schedule_counts(wq, uth,
4642*33de042dSApple OSS Distributions 	    old_pri.qos_req, tr_flags);
4643*33de042dSApple OSS Distributions 
4644*33de042dSApple OSS Distributions 	if (workq_tr_is_overcommit(tr_flags)) {
4645*33de042dSApple OSS Distributions 		workq_thread_set_type(uth, UT_WORKQ_OVERCOMMIT);
4646*33de042dSApple OSS Distributions 	} else if (workq_tr_is_cooperative(tr_flags)) {
4647*33de042dSApple OSS Distributions 		workq_thread_set_type(uth, UT_WORKQ_COOPERATIVE);
4648*33de042dSApple OSS Distributions 	} else {
4649*33de042dSApple OSS Distributions 		workq_thread_set_type(uth, 0);
4650*33de042dSApple OSS Distributions 	}
4651*33de042dSApple OSS Distributions 
4652*33de042dSApple OSS Distributions 	if (__improbable(thread_unfreeze_base_pri(get_machthread(uth)) && !is_creator)) {
4653*33de042dSApple OSS Distributions 		if (req_ts) {
4654*33de042dSApple OSS Distributions 			workq_perform_turnstile_operation_locked(wq, ^{
4655*33de042dSApple OSS Distributions 				turnstile_update_inheritor(req_ts, wq->wq_turnstile,
4656*33de042dSApple OSS Distributions 				TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_TURNSTILE);
4657*33de042dSApple OSS Distributions 				turnstile_update_inheritor_complete(req_ts,
4658*33de042dSApple OSS Distributions 				TURNSTILE_INTERLOCK_HELD);
4659*33de042dSApple OSS Distributions 			});
4660*33de042dSApple OSS Distributions 		}
4661*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 3, 0, 0);
4662*33de042dSApple OSS Distributions 
4663*33de042dSApple OSS Distributions 		/*
4664*33de042dSApple OSS Distributions 		 * If a cooperative thread was the one which picked up the manager
4665*33de042dSApple OSS Distributions 		 * thread request, we need to reevaluate the cooperative pool before
4666*33de042dSApple OSS Distributions 		 * it goes and parks.
4667*33de042dSApple OSS Distributions 		 *
4668*33de042dSApple OSS Distributions 		 * For every other type of thread request that it picks up, the logic in
4669*33de042dSApple OSS Distributions 		 * workq_threadreq_select should have done this refresh.
4670*33de042dSApple OSS Distributions 		 * See workq_push_idle_thread.
4671*33de042dSApple OSS Distributions 		 */
4672*33de042dSApple OSS Distributions 		if (cooperative_sched_count_changed) {
4673*33de042dSApple OSS Distributions 			if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
4674*33de042dSApple OSS Distributions 				_wq_cooperative_queue_refresh_best_req_qos(wq);
4675*33de042dSApple OSS Distributions 			}
4676*33de042dSApple OSS Distributions 		}
4677*33de042dSApple OSS Distributions 		goto park_thawed;
4678*33de042dSApple OSS Distributions 	}
4679*33de042dSApple OSS Distributions 
4680*33de042dSApple OSS Distributions 	/*
4681*33de042dSApple OSS Distributions 	 * We passed all checks, dequeue the request, bind to it, and set it up
4682*33de042dSApple OSS Distributions 	 * to return to user.
4683*33de042dSApple OSS Distributions 	 */
4684*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_START, wq,
4685*33de042dSApple OSS Distributions 	    workq_trace_req_id(req), tr_flags, 0);
4686*33de042dSApple OSS Distributions 	wq->wq_fulfilled++;
4687*33de042dSApple OSS Distributions 	schedule_creator = workq_threadreq_dequeue(wq, req,
4688*33de042dSApple OSS Distributions 	    cooperative_sched_count_changed);
4689*33de042dSApple OSS Distributions 
4690*33de042dSApple OSS Distributions 	workq_thread_reset_cpupercent(req, uth);
4691*33de042dSApple OSS Distributions 
4692*33de042dSApple OSS Distributions 	if (tr_flags & (WORKQ_TR_FLAG_KEVENT | WORKQ_TR_FLAG_WORKLOOP)) {
4693*33de042dSApple OSS Distributions 		kqueue_threadreq_bind_prepost(p, req, uth);
4694*33de042dSApple OSS Distributions 		req = NULL;
4695*33de042dSApple OSS Distributions 	} else if (req->tr_count > 0) {
4696*33de042dSApple OSS Distributions 		req = NULL;
4697*33de042dSApple OSS Distributions 	}
4698*33de042dSApple OSS Distributions 
4699*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_NEW) {
4700*33de042dSApple OSS Distributions 		uth->uu_workq_flags ^= UT_WORKQ_NEW;
4701*33de042dSApple OSS Distributions 		setup_flags |= WQ_SETUP_FIRST_USE;
4702*33de042dSApple OSS Distributions 	}
4703*33de042dSApple OSS Distributions 
4704*33de042dSApple OSS Distributions 	/* If one of the following is true, call workq_schedule_creator (which also
4705*33de042dSApple OSS Distributions 	 * adjusts priority of existing creator):
4706*33de042dSApple OSS Distributions 	 *
4707*33de042dSApple OSS Distributions 	 *	  - We are the creator currently so the wq may need a new creator
4708*33de042dSApple OSS Distributions 	 *	  - The request we're binding to is the highest priority one, existing
4709*33de042dSApple OSS Distributions 	 *	  creator's priority might need to be adjusted to reflect the next
4710*33de042dSApple OSS Distributions 	 *	  highest TR
4711*33de042dSApple OSS Distributions 	 */
4712*33de042dSApple OSS Distributions 	if (is_creator || schedule_creator) {
4713*33de042dSApple OSS Distributions 		/* This can drop the workqueue lock, and take it again */
4714*33de042dSApple OSS Distributions 		workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
4715*33de042dSApple OSS Distributions 	}
4716*33de042dSApple OSS Distributions 
4717*33de042dSApple OSS Distributions 	workq_unlock(wq);
4718*33de042dSApple OSS Distributions 
4719*33de042dSApple OSS Distributions 	if (req) {
4720*33de042dSApple OSS Distributions 		zfree(workq_zone_threadreq, req);
4721*33de042dSApple OSS Distributions 	}
4722*33de042dSApple OSS Distributions 
4723*33de042dSApple OSS Distributions 	/*
4724*33de042dSApple OSS Distributions 	 * Run Thread, Run!
4725*33de042dSApple OSS Distributions 	 */
4726*33de042dSApple OSS Distributions 	uint32_t upcall_flags = WQ_FLAG_THREAD_NEWSPI;
4727*33de042dSApple OSS Distributions 	if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER) {
4728*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_EVENT_MANAGER;
4729*33de042dSApple OSS Distributions 	} else if (workq_tr_is_overcommit(tr_flags)) {
4730*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
4731*33de042dSApple OSS Distributions 	} else if (workq_tr_is_cooperative(tr_flags)) {
4732*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_COOPERATIVE;
4733*33de042dSApple OSS Distributions 	}
4734*33de042dSApple OSS Distributions 	if (tr_flags & WORKQ_TR_FLAG_KEVENT) {
4735*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_KEVENT;
4736*33de042dSApple OSS Distributions 		assert((upcall_flags & WQ_FLAG_THREAD_COOPERATIVE) == 0);
4737*33de042dSApple OSS Distributions 	}
4738*33de042dSApple OSS Distributions 
4739*33de042dSApple OSS Distributions 	if (tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
4740*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_WORKLOOP | WQ_FLAG_THREAD_KEVENT;
4741*33de042dSApple OSS Distributions 	}
4742*33de042dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.upcall_flags = upcall_flags;
4743*33de042dSApple OSS Distributions 
4744*33de042dSApple OSS Distributions 	if (tr_flags & (WORKQ_TR_FLAG_KEVENT | WORKQ_TR_FLAG_WORKLOOP)) {
4745*33de042dSApple OSS Distributions 		kqueue_threadreq_bind_commit(p, get_machthread(uth));
4746*33de042dSApple OSS Distributions 	} else {
4747*33de042dSApple OSS Distributions #if CONFIG_PREADOPT_TG
4748*33de042dSApple OSS Distributions 		/*
4749*33de042dSApple OSS Distributions 		 * The thread may have a preadopt thread group on it already because it
4750*33de042dSApple OSS Distributions 		 * got tagged with it as a creator thread. So we need to make sure to
4751*33de042dSApple OSS Distributions 		 * clear that since we don't have preadoption for anonymous thread
4752*33de042dSApple OSS Distributions 		 * requests
4753*33de042dSApple OSS Distributions 		 */
4754*33de042dSApple OSS Distributions 		thread_set_preadopt_thread_group(get_machthread(uth), NULL);
4755*33de042dSApple OSS Distributions #endif
4756*33de042dSApple OSS Distributions 	}
4757*33de042dSApple OSS Distributions 
4758*33de042dSApple OSS Distributions 	workq_setup_and_run(p, uth, setup_flags);
4759*33de042dSApple OSS Distributions 	__builtin_unreachable();
4760*33de042dSApple OSS Distributions 
4761*33de042dSApple OSS Distributions park:
4762*33de042dSApple OSS Distributions 	thread_unfreeze_base_pri(get_machthread(uth));
4763*33de042dSApple OSS Distributions park_thawed:
4764*33de042dSApple OSS Distributions 	workq_park_and_unlock(p, wq, uth, setup_flags);
4765*33de042dSApple OSS Distributions }
4766*33de042dSApple OSS Distributions 
4767*33de042dSApple OSS Distributions /**
4768*33de042dSApple OSS Distributions  * Runs a thread request on a thread
4769*33de042dSApple OSS Distributions  *
4770*33de042dSApple OSS Distributions  * - if thread is THREAD_NULL, will find a thread and run the request there.
4771*33de042dSApple OSS Distributions  *   Otherwise, the thread must be the current thread.
4772*33de042dSApple OSS Distributions  *
4773*33de042dSApple OSS Distributions  * - if req is NULL, will find the highest priority request and run that.  If
4774*33de042dSApple OSS Distributions  *   it is not NULL, it must be a threadreq object in state NEW.  If it can not
4775*33de042dSApple OSS Distributions  *   be run immediately, it will be enqueued and moved to state QUEUED.
4776*33de042dSApple OSS Distributions  *
4777*33de042dSApple OSS Distributions  *   Either way, the thread request object serviced will be moved to state
4778*33de042dSApple OSS Distributions  *   BINDING and attached to the uthread.
4779*33de042dSApple OSS Distributions  *
4780*33de042dSApple OSS Distributions  * Should be called with the workqueue lock held.  Will drop it.
4781*33de042dSApple OSS Distributions  * Should be called with the base pri not frozen.
4782*33de042dSApple OSS Distributions  */
4783*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
4784*33de042dSApple OSS Distributions static void
workq_unpark_select_threadreq_or_park_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)4785*33de042dSApple OSS Distributions workq_unpark_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
4786*33de042dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags)
4787*33de042dSApple OSS Distributions {
4788*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_EARLY_BOUND) {
4789*33de042dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_NEW) {
4790*33de042dSApple OSS Distributions 			setup_flags |= WQ_SETUP_FIRST_USE;
4791*33de042dSApple OSS Distributions 		}
4792*33de042dSApple OSS Distributions 		uth->uu_workq_flags &= ~(UT_WORKQ_NEW | UT_WORKQ_EARLY_BOUND);
4793*33de042dSApple OSS Distributions 		/*
4794*33de042dSApple OSS Distributions 		 * This pointer is possibly freed and only used for tracing purposes.
4795*33de042dSApple OSS Distributions 		 */
4796*33de042dSApple OSS Distributions 		workq_threadreq_t req = uth->uu_save.uus_workq_park_data.thread_request;
4797*33de042dSApple OSS Distributions 		workq_unlock(wq);
4798*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_START, wq,
4799*33de042dSApple OSS Distributions 		    VM_KERNEL_ADDRHIDE(req), 0, 0);
4800*33de042dSApple OSS Distributions 		(void)req;
4801*33de042dSApple OSS Distributions 
4802*33de042dSApple OSS Distributions 		workq_setup_and_run(p, uth, setup_flags);
4803*33de042dSApple OSS Distributions 		__builtin_unreachable();
4804*33de042dSApple OSS Distributions 	}
4805*33de042dSApple OSS Distributions 
4806*33de042dSApple OSS Distributions 	thread_freeze_base_pri(get_machthread(uth));
4807*33de042dSApple OSS Distributions 	workq_select_threadreq_or_park_and_unlock(p, wq, uth, setup_flags);
4808*33de042dSApple OSS Distributions }
4809*33de042dSApple OSS Distributions 
4810*33de042dSApple OSS Distributions static bool
workq_creator_should_yield(struct workqueue * wq,struct uthread * uth)4811*33de042dSApple OSS Distributions workq_creator_should_yield(struct workqueue *wq, struct uthread *uth)
4812*33de042dSApple OSS Distributions {
4813*33de042dSApple OSS Distributions 	thread_qos_t qos = workq_pri_override(uth->uu_workq_pri);
4814*33de042dSApple OSS Distributions 
4815*33de042dSApple OSS Distributions 	if (qos >= THREAD_QOS_USER_INTERACTIVE) {
4816*33de042dSApple OSS Distributions 		return false;
4817*33de042dSApple OSS Distributions 	}
4818*33de042dSApple OSS Distributions 
4819*33de042dSApple OSS Distributions 	uint32_t snapshot = uth->uu_save.uus_workq_park_data.fulfilled_snapshot;
4820*33de042dSApple OSS Distributions 	if (wq->wq_fulfilled == snapshot) {
4821*33de042dSApple OSS Distributions 		return false;
4822*33de042dSApple OSS Distributions 	}
4823*33de042dSApple OSS Distributions 
4824*33de042dSApple OSS Distributions 	uint32_t cnt = 0, conc = wq_max_parallelism[_wq_bucket(qos)];
4825*33de042dSApple OSS Distributions 	if (wq->wq_fulfilled - snapshot > conc) {
4826*33de042dSApple OSS Distributions 		/* we fulfilled more than NCPU requests since being dispatched */
4827*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_yield, wq, 1,
4828*33de042dSApple OSS Distributions 		    wq->wq_fulfilled, snapshot);
4829*33de042dSApple OSS Distributions 		return true;
4830*33de042dSApple OSS Distributions 	}
4831*33de042dSApple OSS Distributions 
4832*33de042dSApple OSS Distributions 	for (uint8_t i = _wq_bucket(qos); i < WORKQ_NUM_QOS_BUCKETS; i++) {
4833*33de042dSApple OSS Distributions 		cnt += wq->wq_thscheduled_count[i];
4834*33de042dSApple OSS Distributions 	}
4835*33de042dSApple OSS Distributions 	if (conc <= cnt) {
4836*33de042dSApple OSS Distributions 		/* We fulfilled requests and have more than NCPU scheduled threads */
4837*33de042dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_yield, wq, 2,
4838*33de042dSApple OSS Distributions 		    wq->wq_fulfilled, snapshot);
4839*33de042dSApple OSS Distributions 		return true;
4840*33de042dSApple OSS Distributions 	}
4841*33de042dSApple OSS Distributions 
4842*33de042dSApple OSS Distributions 	return false;
4843*33de042dSApple OSS Distributions }
4844*33de042dSApple OSS Distributions 
4845*33de042dSApple OSS Distributions /**
4846*33de042dSApple OSS Distributions  * parked idle thread wakes up
4847*33de042dSApple OSS Distributions  */
4848*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
4849*33de042dSApple OSS Distributions static void
workq_unpark_continue(void * parameter __unused,wait_result_t wr __unused)4850*33de042dSApple OSS Distributions workq_unpark_continue(void *parameter __unused, wait_result_t wr __unused)
4851*33de042dSApple OSS Distributions {
4852*33de042dSApple OSS Distributions 	thread_t th = current_thread();
4853*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
4854*33de042dSApple OSS Distributions 	proc_t p = current_proc();
4855*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
4856*33de042dSApple OSS Distributions 
4857*33de042dSApple OSS Distributions 	workq_lock_spin(wq);
4858*33de042dSApple OSS Distributions 
4859*33de042dSApple OSS Distributions 	if (wq->wq_creator == uth && workq_creator_should_yield(wq, uth)) {
4860*33de042dSApple OSS Distributions 		/*
4861*33de042dSApple OSS Distributions 		 * If the number of threads we have out are able to keep up with the
4862*33de042dSApple OSS Distributions 		 * demand, then we should avoid sending this creator thread to
4863*33de042dSApple OSS Distributions 		 * userspace.
4864*33de042dSApple OSS Distributions 		 */
4865*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.fulfilled_snapshot = wq->wq_fulfilled;
4866*33de042dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.yields++;
4867*33de042dSApple OSS Distributions 		workq_unlock(wq);
4868*33de042dSApple OSS Distributions 		thread_yield_with_continuation(workq_unpark_continue, NULL);
4869*33de042dSApple OSS Distributions 		__builtin_unreachable();
4870*33de042dSApple OSS Distributions 	}
4871*33de042dSApple OSS Distributions 
4872*33de042dSApple OSS Distributions 	if (__probable(uth->uu_workq_flags & UT_WORKQ_RUNNING)) {
4873*33de042dSApple OSS Distributions 		workq_unpark_select_threadreq_or_park_and_unlock(p, wq, uth, WQ_SETUP_NONE);
4874*33de042dSApple OSS Distributions 		__builtin_unreachable();
4875*33de042dSApple OSS Distributions 	}
4876*33de042dSApple OSS Distributions 
4877*33de042dSApple OSS Distributions 	if (__probable(wr == THREAD_AWAKENED)) {
4878*33de042dSApple OSS Distributions 		/*
4879*33de042dSApple OSS Distributions 		 * We were set running, but for the purposes of dying.
4880*33de042dSApple OSS Distributions 		 */
4881*33de042dSApple OSS Distributions 		assert(uth->uu_workq_flags & UT_WORKQ_DYING);
4882*33de042dSApple OSS Distributions 		assert((uth->uu_workq_flags & UT_WORKQ_NEW) == 0);
4883*33de042dSApple OSS Distributions 	} else {
4884*33de042dSApple OSS Distributions 		/*
4885*33de042dSApple OSS Distributions 		 * workaround for <rdar://problem/38647347>,
4886*33de042dSApple OSS Distributions 		 * in case we do hit userspace, make sure calling
4887*33de042dSApple OSS Distributions 		 * workq_thread_terminate() does the right thing here,
4888*33de042dSApple OSS Distributions 		 * and if we never call it, that workq_exit() will too because it sees
4889*33de042dSApple OSS Distributions 		 * this thread on the runlist.
4890*33de042dSApple OSS Distributions 		 */
4891*33de042dSApple OSS Distributions 		assert(wr == THREAD_INTERRUPTED);
4892*33de042dSApple OSS Distributions 		wq->wq_thdying_count++;
4893*33de042dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
4894*33de042dSApple OSS Distributions 	}
4895*33de042dSApple OSS Distributions 
4896*33de042dSApple OSS Distributions 	workq_unpark_for_death_and_unlock(p, wq, uth,
4897*33de042dSApple OSS Distributions 	    WORKQ_UNPARK_FOR_DEATH_WAS_IDLE, WQ_SETUP_NONE);
4898*33de042dSApple OSS Distributions 	__builtin_unreachable();
4899*33de042dSApple OSS Distributions }
4900*33de042dSApple OSS Distributions 
4901*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
4902*33de042dSApple OSS Distributions static void
workq_setup_and_run(proc_t p,struct uthread * uth,int setup_flags)4903*33de042dSApple OSS Distributions workq_setup_and_run(proc_t p, struct uthread *uth, int setup_flags)
4904*33de042dSApple OSS Distributions {
4905*33de042dSApple OSS Distributions 	thread_t th = get_machthread(uth);
4906*33de042dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
4907*33de042dSApple OSS Distributions 
4908*33de042dSApple OSS Distributions 	if (setup_flags & WQ_SETUP_CLEAR_VOUCHER) {
4909*33de042dSApple OSS Distributions 		/*
4910*33de042dSApple OSS Distributions 		 * For preemption reasons, we want to reset the voucher as late as
4911*33de042dSApple OSS Distributions 		 * possible, so we do it in two places:
4912*33de042dSApple OSS Distributions 		 *   - Just before parking (i.e. in workq_park_and_unlock())
4913*33de042dSApple OSS Distributions 		 *   - Prior to doing the setup for the next workitem (i.e. here)
4914*33de042dSApple OSS Distributions 		 *
4915*33de042dSApple OSS Distributions 		 * Those two places are sufficient to ensure we always reset it before
4916*33de042dSApple OSS Distributions 		 * it goes back out to user space, but be careful to not break that
4917*33de042dSApple OSS Distributions 		 * guarantee.
4918*33de042dSApple OSS Distributions 		 *
4919*33de042dSApple OSS Distributions 		 * Note that setting the voucher to NULL will not clear the preadoption
4920*33de042dSApple OSS Distributions 		 * thread group on this thread
4921*33de042dSApple OSS Distributions 		 */
4922*33de042dSApple OSS Distributions 		__assert_only kern_return_t kr;
4923*33de042dSApple OSS Distributions 		kr = thread_set_voucher_name(MACH_PORT_NULL);
4924*33de042dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
4925*33de042dSApple OSS Distributions 	}
4926*33de042dSApple OSS Distributions 
4927*33de042dSApple OSS Distributions 	uint32_t upcall_flags = uth->uu_save.uus_workq_park_data.upcall_flags;
4928*33de042dSApple OSS Distributions 	if (!(setup_flags & WQ_SETUP_FIRST_USE)) {
4929*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_REUSE;
4930*33de042dSApple OSS Distributions 	}
4931*33de042dSApple OSS Distributions 
4932*33de042dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_OUTSIDE_QOS) {
4933*33de042dSApple OSS Distributions 		/*
4934*33de042dSApple OSS Distributions 		 * For threads that have an outside-of-QoS thread priority, indicate
4935*33de042dSApple OSS Distributions 		 * to userspace that setting QoS should only affect the TSD and not
4936*33de042dSApple OSS Distributions 		 * change QOS in the kernel.
4937*33de042dSApple OSS Distributions 		 */
4938*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OUTSIDEQOS;
4939*33de042dSApple OSS Distributions 	} else {
4940*33de042dSApple OSS Distributions 		/*
4941*33de042dSApple OSS Distributions 		 * Put the QoS class value into the lower bits of the reuse_thread
4942*33de042dSApple OSS Distributions 		 * register, this is where the thread priority used to be stored
4943*33de042dSApple OSS Distributions 		 * anyway.
4944*33de042dSApple OSS Distributions 		 */
4945*33de042dSApple OSS Distributions 		upcall_flags |= uth->uu_save.uus_workq_park_data.qos |
4946*33de042dSApple OSS Distributions 		    WQ_FLAG_THREAD_PRIO_QOS;
4947*33de042dSApple OSS Distributions 	}
4948*33de042dSApple OSS Distributions 
4949*33de042dSApple OSS Distributions 	if (uth->uu_workq_thport == MACH_PORT_NULL) {
4950*33de042dSApple OSS Distributions 		/* convert_thread_to_port_pinned() consumes a reference */
4951*33de042dSApple OSS Distributions 		thread_reference(th);
4952*33de042dSApple OSS Distributions 		/* Convert to immovable/pinned thread port, but port is not pinned yet */
4953*33de042dSApple OSS Distributions 		ipc_port_t port = convert_thread_to_port_pinned(th);
4954*33de042dSApple OSS Distributions 		/* Atomically, pin and copy out the port */
4955*33de042dSApple OSS Distributions 		uth->uu_workq_thport = ipc_port_copyout_send_pinned(port, get_task_ipcspace(proc_task(p)));
4956*33de042dSApple OSS Distributions 	}
4957*33de042dSApple OSS Distributions 
4958*33de042dSApple OSS Distributions 	/* Thread has been set up to run, arm its next workqueue quantum or disarm
4959*33de042dSApple OSS Distributions 	 * if it is no longer supporting that */
4960*33de042dSApple OSS Distributions 	if (thread_supports_cooperative_workqueue(th)) {
4961*33de042dSApple OSS Distributions 		thread_arm_workqueue_quantum(th);
4962*33de042dSApple OSS Distributions 	} else {
4963*33de042dSApple OSS Distributions 		thread_disarm_workqueue_quantum(th);
4964*33de042dSApple OSS Distributions 	}
4965*33de042dSApple OSS Distributions 
4966*33de042dSApple OSS Distributions 	/*
4967*33de042dSApple OSS Distributions 	 * Call out to pthread, this sets up the thread, pulls in kevent structs
4968*33de042dSApple OSS Distributions 	 * onto the stack, sets up the thread state and then returns to userspace.
4969*33de042dSApple OSS Distributions 	 */
4970*33de042dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_runthread | DBG_FUNC_START,
4971*33de042dSApple OSS Distributions 	    proc_get_wqptr_fast(p), 0, 0, 0);
4972*33de042dSApple OSS Distributions 
4973*33de042dSApple OSS Distributions 	if (workq_thread_is_cooperative(uth) || workq_thread_is_permanently_bound(uth)) {
4974*33de042dSApple OSS Distributions 		thread_sched_call(th, NULL);
4975*33de042dSApple OSS Distributions 	} else {
4976*33de042dSApple OSS Distributions 		thread_sched_call(th, workq_sched_callback);
4977*33de042dSApple OSS Distributions 	}
4978*33de042dSApple OSS Distributions 
4979*33de042dSApple OSS Distributions 	pthread_functions->workq_setup_thread(p, th, vmap, uth->uu_workq_stackaddr,
4980*33de042dSApple OSS Distributions 	    uth->uu_workq_thport, 0, setup_flags, upcall_flags);
4981*33de042dSApple OSS Distributions 
4982*33de042dSApple OSS Distributions 	__builtin_unreachable();
4983*33de042dSApple OSS Distributions }
4984*33de042dSApple OSS Distributions 
4985*33de042dSApple OSS Distributions /**
4986*33de042dSApple OSS Distributions  * A wrapper around workq_setup_and_run for permanently bound thread.
4987*33de042dSApple OSS Distributions  */
4988*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
4989*33de042dSApple OSS Distributions static void
workq_bound_thread_setup_and_run(struct uthread * uth,int setup_flags)4990*33de042dSApple OSS Distributions workq_bound_thread_setup_and_run(struct uthread *uth, int setup_flags)
4991*33de042dSApple OSS Distributions {
4992*33de042dSApple OSS Distributions 	struct workq_threadreq_s * kqr = uth->uu_kqr_bound;
4993*33de042dSApple OSS Distributions 
4994*33de042dSApple OSS Distributions 	uint32_t upcall_flags = (WQ_FLAG_THREAD_NEWSPI |
4995*33de042dSApple OSS Distributions 	    WQ_FLAG_THREAD_WORKLOOP | WQ_FLAG_THREAD_KEVENT);
4996*33de042dSApple OSS Distributions 	if (workq_tr_is_overcommit(kqr->tr_flags)) {
4997*33de042dSApple OSS Distributions 		workq_thread_set_type(uth, UT_WORKQ_OVERCOMMIT);
4998*33de042dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
4999*33de042dSApple OSS Distributions 	}
5000*33de042dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.upcall_flags = upcall_flags;
5001*33de042dSApple OSS Distributions 	workq_setup_and_run(current_proc(), uth, setup_flags);
5002*33de042dSApple OSS Distributions 	__builtin_unreachable();
5003*33de042dSApple OSS Distributions }
5004*33de042dSApple OSS Distributions 
5005*33de042dSApple OSS Distributions /**
5006*33de042dSApple OSS Distributions  * A parked bound thread wakes up for the first time.
5007*33de042dSApple OSS Distributions  */
5008*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
5009*33de042dSApple OSS Distributions static void
workq_bound_thread_initialize_and_unpark_continue(void * parameter __unused,wait_result_t wr)5010*33de042dSApple OSS Distributions workq_bound_thread_initialize_and_unpark_continue(void *parameter __unused,
5011*33de042dSApple OSS Distributions     wait_result_t wr)
5012*33de042dSApple OSS Distributions {
5013*33de042dSApple OSS Distributions 	/*
5014*33de042dSApple OSS Distributions 	 * Locking model for accessing uu_workq_flags :
5015*33de042dSApple OSS Distributions 	 *
5016*33de042dSApple OSS Distributions 	 * The concurrent access to uu_workq_flags is synchronized with workq lock
5017*33de042dSApple OSS Distributions 	 * until a thread gets permanently bound to a kqwl. Post that, kqlock
5018*33de042dSApple OSS Distributions 	 * is used for subsequent synchronizations. This gives us a significant
5019*33de042dSApple OSS Distributions 	 * benefit by avoiding having to take a process wide workq lock on every
5020*33de042dSApple OSS Distributions 	 * wakeup of the bound thread.
5021*33de042dSApple OSS Distributions 	 * This flip in locking model is tracked with UT_WORKQ_PERMANENT_BIND flag.
5022*33de042dSApple OSS Distributions 	 *
5023*33de042dSApple OSS Distributions 	 * There is one more optimization we can perform for when the thread is
5024*33de042dSApple OSS Distributions 	 * awakened for running (i.e THREAD_AWAKENED) until it parks.
5025*33de042dSApple OSS Distributions 	 * During this window, we know KQ_SLEEP bit is reset so there should not
5026*33de042dSApple OSS Distributions 	 * be any concurrent attempts to modify uu_workq_flags by
5027*33de042dSApple OSS Distributions 	 * kqworkloop_bound_thread_wakeup because the thread is already "awake".
5028*33de042dSApple OSS Distributions 	 * So we can safely access uu_workq_flags within this window without having
5029*33de042dSApple OSS Distributions 	 * to take kqlock. This KQ_SLEEP is later set by the bound thread under
5030*33de042dSApple OSS Distributions 	 * kqlock on its way to parking.
5031*33de042dSApple OSS Distributions 	 */
5032*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(current_thread());
5033*33de042dSApple OSS Distributions 
5034*33de042dSApple OSS Distributions 	if (__probable(wr == THREAD_AWAKENED)) {
5035*33de042dSApple OSS Distributions 		/* At most one flag. */
5036*33de042dSApple OSS Distributions 		assert((uth->uu_workq_flags & (UT_WORKQ_RUNNING | UT_WORKQ_DYING))
5037*33de042dSApple OSS Distributions 		    != (UT_WORKQ_RUNNING | UT_WORKQ_DYING));
5038*33de042dSApple OSS Distributions 
5039*33de042dSApple OSS Distributions 		assert(workq_thread_is_permanently_bound(uth));
5040*33de042dSApple OSS Distributions 
5041*33de042dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_RUNNING) {
5042*33de042dSApple OSS Distributions 			assert(uth->uu_workq_flags & UT_WORKQ_NEW);
5043*33de042dSApple OSS Distributions 			uth->uu_workq_flags &= ~UT_WORKQ_NEW;
5044*33de042dSApple OSS Distributions 
5045*33de042dSApple OSS Distributions 			struct workq_threadreq_s * kqr = uth->uu_kqr_bound;
5046*33de042dSApple OSS Distributions 			if (kqr->tr_work_interval) {
5047*33de042dSApple OSS Distributions 				kern_return_t kr;
5048*33de042dSApple OSS Distributions 				kr = kern_work_interval_explicit_join(get_machthread(uth),
5049*33de042dSApple OSS Distributions 				    kqr->tr_work_interval);
5050*33de042dSApple OSS Distributions 				/*
5051*33de042dSApple OSS Distributions 				 * The work interval functions require being called on the
5052*33de042dSApple OSS Distributions 				 * current thread. If we fail here, we record the fact and
5053*33de042dSApple OSS Distributions 				 * continue.
5054*33de042dSApple OSS Distributions 				 * In the future, we can preflight checking that this join will
5055*33de042dSApple OSS Distributions 				 * always be successful when the paired kqwl is configured; but,
5056*33de042dSApple OSS Distributions 				 * for now, this should be a rare case (e.g. if you have passed
5057*33de042dSApple OSS Distributions 				 * invalid arguments to the join).
5058*33de042dSApple OSS Distributions 				 */
5059*33de042dSApple OSS Distributions 				if (kr == KERN_SUCCESS) {
5060*33de042dSApple OSS Distributions 					uth->uu_workq_flags |= UT_WORKQ_WORK_INTERVAL_JOINED;
5061*33de042dSApple OSS Distributions 					/* Thread and kqwl both have +1 ref on the work interval. */
5062*33de042dSApple OSS Distributions 				} else {
5063*33de042dSApple OSS Distributions 					uth->uu_workq_flags |= UT_WORKQ_WORK_INTERVAL_FAILED;
5064*33de042dSApple OSS Distributions 				}
5065*33de042dSApple OSS Distributions 			}
5066*33de042dSApple OSS Distributions 			workq_thread_reset_cpupercent(kqr, uth);
5067*33de042dSApple OSS Distributions 			workq_bound_thread_setup_and_run(uth, WQ_SETUP_FIRST_USE);
5068*33de042dSApple OSS Distributions 			__builtin_unreachable();
5069*33de042dSApple OSS Distributions 		} else {
5070*33de042dSApple OSS Distributions 			/*
5071*33de042dSApple OSS Distributions 			 * The permanently bound kqworkloop is getting destroyed so we
5072*33de042dSApple OSS Distributions 			 * are woken up to cleanly unbind ourselves from it and terminate.
5073*33de042dSApple OSS Distributions 			 * See KQ_WORKLOOP_DESTROY -> workq_kern_bound_thread_wakeup.
5074*33de042dSApple OSS Distributions 			 *
5075*33de042dSApple OSS Distributions 			 * The actual full unbind happens from
5076*33de042dSApple OSS Distributions 			 * uthread_cleanup -> kqueue_threadreq_unbind.
5077*33de042dSApple OSS Distributions 			 */
5078*33de042dSApple OSS Distributions 			assert(uth->uu_workq_flags & UT_WORKQ_DYING);
5079*33de042dSApple OSS Distributions 		}
5080*33de042dSApple OSS Distributions 	} else {
5081*33de042dSApple OSS Distributions 		/*
5082*33de042dSApple OSS Distributions 		 * The process is getting terminated so we are woken up to die.
5083*33de042dSApple OSS Distributions 		 * E.g. SIGKILL'd.
5084*33de042dSApple OSS Distributions 		 */
5085*33de042dSApple OSS Distributions 		assert(wr == THREAD_INTERRUPTED);
5086*33de042dSApple OSS Distributions 		/*
5087*33de042dSApple OSS Distributions 		 * It is possible we started running as the process is aborted
5088*33de042dSApple OSS Distributions 		 * due to termination; but, workq_kern_threadreq_permanent_bind
5089*33de042dSApple OSS Distributions 		 * has not had a chance to bind us to the kqwl yet.
5090*33de042dSApple OSS Distributions 		 *
5091*33de042dSApple OSS Distributions 		 * We synchronize with it using workq lock.
5092*33de042dSApple OSS Distributions 		 */
5093*33de042dSApple OSS Distributions 		proc_t p = current_proc();
5094*33de042dSApple OSS Distributions 		struct workqueue *wq = proc_get_wqptr_fast(p);
5095*33de042dSApple OSS Distributions 		workq_lock_spin(wq);
5096*33de042dSApple OSS Distributions 		assert(workq_thread_is_permanently_bound(uth));
5097*33de042dSApple OSS Distributions 		workq_unlock(wq);
5098*33de042dSApple OSS Distributions 
5099*33de042dSApple OSS Distributions 		/*
5100*33de042dSApple OSS Distributions 		 * We do the bind commit ourselves if workq_kern_threadreq_permanent_bind
5101*33de042dSApple OSS Distributions 		 * has not done it for us yet so our state is aligned with what the
5102*33de042dSApple OSS Distributions 		 * termination path below expects.
5103*33de042dSApple OSS Distributions 		 */
5104*33de042dSApple OSS Distributions 		kqueue_threadreq_bind_commit(p, get_machthread(uth));
5105*33de042dSApple OSS Distributions 	}
5106*33de042dSApple OSS Distributions 	workq_kern_bound_thread_terminate(uth->uu_kqr_bound);
5107*33de042dSApple OSS Distributions 	__builtin_unreachable();
5108*33de042dSApple OSS Distributions }
5109*33de042dSApple OSS Distributions 
5110*33de042dSApple OSS Distributions /**
5111*33de042dSApple OSS Distributions  * A parked bound thread wakes up. Not the first time.
5112*33de042dSApple OSS Distributions  */
5113*33de042dSApple OSS Distributions __attribute__((noreturn, noinline))
5114*33de042dSApple OSS Distributions static void
workq_bound_thread_unpark_continue(void * parameter __unused,wait_result_t wr)5115*33de042dSApple OSS Distributions workq_bound_thread_unpark_continue(void *parameter __unused, wait_result_t wr)
5116*33de042dSApple OSS Distributions {
5117*33de042dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(current_thread());
5118*33de042dSApple OSS Distributions 	assert(workq_thread_is_permanently_bound(uth));
5119*33de042dSApple OSS Distributions 
5120*33de042dSApple OSS Distributions 	if (__probable(wr == THREAD_AWAKENED)) {
5121*33de042dSApple OSS Distributions 		/* At most one flag. */
5122*33de042dSApple OSS Distributions 		assert((uth->uu_workq_flags & (UT_WORKQ_RUNNING | UT_WORKQ_DYING))
5123*33de042dSApple OSS Distributions 		    != (UT_WORKQ_RUNNING | UT_WORKQ_DYING));
5124*33de042dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_RUNNING) {
5125*33de042dSApple OSS Distributions 			workq_bound_thread_setup_and_run(uth, WQ_SETUP_NONE);
5126*33de042dSApple OSS Distributions 		} else {
5127*33de042dSApple OSS Distributions 			assert(uth->uu_workq_flags & UT_WORKQ_DYING);
5128*33de042dSApple OSS Distributions 		}
5129*33de042dSApple OSS Distributions 	} else {
5130*33de042dSApple OSS Distributions 		assert(wr == THREAD_INTERRUPTED);
5131*33de042dSApple OSS Distributions 	}
5132*33de042dSApple OSS Distributions 	workq_kern_bound_thread_terminate(uth->uu_kqr_bound);
5133*33de042dSApple OSS Distributions 	__builtin_unreachable();
5134*33de042dSApple OSS Distributions }
5135*33de042dSApple OSS Distributions 
5136*33de042dSApple OSS Distributions #pragma mark misc
5137*33de042dSApple OSS Distributions 
5138*33de042dSApple OSS Distributions int
fill_procworkqueue(proc_t p,struct proc_workqueueinfo * pwqinfo)5139*33de042dSApple OSS Distributions fill_procworkqueue(proc_t p, struct proc_workqueueinfo * pwqinfo)
5140*33de042dSApple OSS Distributions {
5141*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
5142*33de042dSApple OSS Distributions 	int error = 0;
5143*33de042dSApple OSS Distributions 	int     activecount;
5144*33de042dSApple OSS Distributions 
5145*33de042dSApple OSS Distributions 	if (wq == NULL) {
5146*33de042dSApple OSS Distributions 		return EINVAL;
5147*33de042dSApple OSS Distributions 	}
5148*33de042dSApple OSS Distributions 
5149*33de042dSApple OSS Distributions 	/*
5150*33de042dSApple OSS Distributions 	 * This is sometimes called from interrupt context by the kperf sampler.
5151*33de042dSApple OSS Distributions 	 * In that case, it's not safe to spin trying to take the lock since we
5152*33de042dSApple OSS Distributions 	 * might already hold it.  So, we just try-lock it and error out if it's
5153*33de042dSApple OSS Distributions 	 * already held.  Since this is just a debugging aid, and all our callers
5154*33de042dSApple OSS Distributions 	 * are able to handle an error, that's fine.
5155*33de042dSApple OSS Distributions 	 */
5156*33de042dSApple OSS Distributions 	bool locked = workq_lock_try(wq);
5157*33de042dSApple OSS Distributions 	if (!locked) {
5158*33de042dSApple OSS Distributions 		return EBUSY;
5159*33de042dSApple OSS Distributions 	}
5160*33de042dSApple OSS Distributions 
5161*33de042dSApple OSS Distributions 	wq_thactive_t act = _wq_thactive(wq);
5162*33de042dSApple OSS Distributions 	activecount = _wq_thactive_aggregate_downto_qos(wq, act,
5163*33de042dSApple OSS Distributions 	    WORKQ_THREAD_QOS_MIN, NULL, NULL);
5164*33de042dSApple OSS Distributions 	if (act & _wq_thactive_offset_for_qos(WORKQ_THREAD_QOS_MANAGER)) {
5165*33de042dSApple OSS Distributions 		activecount++;
5166*33de042dSApple OSS Distributions 	}
5167*33de042dSApple OSS Distributions 	pwqinfo->pwq_nthreads = wq->wq_nthreads;
5168*33de042dSApple OSS Distributions 	pwqinfo->pwq_runthreads = activecount;
5169*33de042dSApple OSS Distributions 	pwqinfo->pwq_blockedthreads = wq->wq_threads_scheduled - activecount;
5170*33de042dSApple OSS Distributions 	pwqinfo->pwq_state = 0;
5171*33de042dSApple OSS Distributions 
5172*33de042dSApple OSS Distributions 	if (wq->wq_constrained_threads_scheduled >= wq_max_constrained_threads) {
5173*33de042dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT;
5174*33de042dSApple OSS Distributions 	}
5175*33de042dSApple OSS Distributions 
5176*33de042dSApple OSS Distributions 	if (wq->wq_nthreads >= wq_max_threads) {
5177*33de042dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_TOTAL_THREAD_LIMIT;
5178*33de042dSApple OSS Distributions 	}
5179*33de042dSApple OSS Distributions 
5180*33de042dSApple OSS Distributions 	uint64_t total_cooperative_threads;
5181*33de042dSApple OSS Distributions 	total_cooperative_threads = workq_num_cooperative_threads_scheduled_total(wq);
5182*33de042dSApple OSS Distributions 	if ((total_cooperative_threads == wq_cooperative_queue_max_size(wq)) &&
5183*33de042dSApple OSS Distributions 	    workq_has_cooperative_thread_requests(wq)) {
5184*33de042dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_COOPERATIVE_THREAD_LIMIT;
5185*33de042dSApple OSS Distributions 	}
5186*33de042dSApple OSS Distributions 
5187*33de042dSApple OSS Distributions 	if (wq->wq_exceeded_active_constrained_thread_limit) {
5188*33de042dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_ACTIVE_CONSTRAINED_THREAD_LIMIT;
5189*33de042dSApple OSS Distributions 	}
5190*33de042dSApple OSS Distributions 
5191*33de042dSApple OSS Distributions 	workq_unlock(wq);
5192*33de042dSApple OSS Distributions 	return error;
5193*33de042dSApple OSS Distributions }
5194*33de042dSApple OSS Distributions 
5195*33de042dSApple OSS Distributions boolean_t
workqueue_get_pwq_exceeded(void * v,boolean_t * exceeded_total,boolean_t * exceeded_constrained)5196*33de042dSApple OSS Distributions workqueue_get_pwq_exceeded(void *v, boolean_t *exceeded_total,
5197*33de042dSApple OSS Distributions     boolean_t *exceeded_constrained)
5198*33de042dSApple OSS Distributions {
5199*33de042dSApple OSS Distributions 	proc_t p = v;
5200*33de042dSApple OSS Distributions 	struct proc_workqueueinfo pwqinfo;
5201*33de042dSApple OSS Distributions 	int err;
5202*33de042dSApple OSS Distributions 
5203*33de042dSApple OSS Distributions 	assert(p != NULL);
5204*33de042dSApple OSS Distributions 	assert(exceeded_total != NULL);
5205*33de042dSApple OSS Distributions 	assert(exceeded_constrained != NULL);
5206*33de042dSApple OSS Distributions 
5207*33de042dSApple OSS Distributions 	err = fill_procworkqueue(p, &pwqinfo);
5208*33de042dSApple OSS Distributions 	if (err) {
5209*33de042dSApple OSS Distributions 		return FALSE;
5210*33de042dSApple OSS Distributions 	}
5211*33de042dSApple OSS Distributions 	if (!(pwqinfo.pwq_state & WQ_FLAGS_AVAILABLE)) {
5212*33de042dSApple OSS Distributions 		return FALSE;
5213*33de042dSApple OSS Distributions 	}
5214*33de042dSApple OSS Distributions 
5215*33de042dSApple OSS Distributions 	*exceeded_total = (pwqinfo.pwq_state & WQ_EXCEEDED_TOTAL_THREAD_LIMIT);
5216*33de042dSApple OSS Distributions 	*exceeded_constrained = (pwqinfo.pwq_state & WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT);
5217*33de042dSApple OSS Distributions 
5218*33de042dSApple OSS Distributions 	return TRUE;
5219*33de042dSApple OSS Distributions }
5220*33de042dSApple OSS Distributions 
5221*33de042dSApple OSS Distributions uint64_t
workqueue_get_task_ss_flags_from_pwq_state_kdp(void * v)5222*33de042dSApple OSS Distributions workqueue_get_task_ss_flags_from_pwq_state_kdp(void * v)
5223*33de042dSApple OSS Distributions {
5224*33de042dSApple OSS Distributions 	static_assert((WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT << 17) ==
5225*33de042dSApple OSS Distributions 	    kTaskWqExceededConstrainedThreadLimit);
5226*33de042dSApple OSS Distributions 	static_assert((WQ_EXCEEDED_TOTAL_THREAD_LIMIT << 17) ==
5227*33de042dSApple OSS Distributions 	    kTaskWqExceededTotalThreadLimit);
5228*33de042dSApple OSS Distributions 	static_assert((WQ_FLAGS_AVAILABLE << 17) == kTaskWqFlagsAvailable);
5229*33de042dSApple OSS Distributions 	static_assert(((uint64_t)WQ_EXCEEDED_COOPERATIVE_THREAD_LIMIT << 34) ==
5230*33de042dSApple OSS Distributions 	    (uint64_t)kTaskWqExceededCooperativeThreadLimit);
5231*33de042dSApple OSS Distributions 	static_assert(((uint64_t)WQ_EXCEEDED_ACTIVE_CONSTRAINED_THREAD_LIMIT << 34) ==
5232*33de042dSApple OSS Distributions 	    (uint64_t)kTaskWqExceededActiveConstrainedThreadLimit);
5233*33de042dSApple OSS Distributions 	static_assert((WQ_FLAGS_AVAILABLE | WQ_EXCEEDED_TOTAL_THREAD_LIMIT |
5234*33de042dSApple OSS Distributions 	    WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT |
5235*33de042dSApple OSS Distributions 	    WQ_EXCEEDED_COOPERATIVE_THREAD_LIMIT |
5236*33de042dSApple OSS Distributions 	    WQ_EXCEEDED_ACTIVE_CONSTRAINED_THREAD_LIMIT) == 0x1F);
5237*33de042dSApple OSS Distributions 
5238*33de042dSApple OSS Distributions 	if (v == NULL) {
5239*33de042dSApple OSS Distributions 		return 0;
5240*33de042dSApple OSS Distributions 	}
5241*33de042dSApple OSS Distributions 
5242*33de042dSApple OSS Distributions 	proc_t p = v;
5243*33de042dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
5244*33de042dSApple OSS Distributions 
5245*33de042dSApple OSS Distributions 	if (wq == NULL || workq_lock_is_acquired_kdp(wq)) {
5246*33de042dSApple OSS Distributions 		return 0;
5247*33de042dSApple OSS Distributions 	}
5248*33de042dSApple OSS Distributions 
5249*33de042dSApple OSS Distributions 	uint64_t ss_flags = kTaskWqFlagsAvailable;
5250*33de042dSApple OSS Distributions 
5251*33de042dSApple OSS Distributions 	if (wq->wq_constrained_threads_scheduled >= wq_max_constrained_threads) {
5252*33de042dSApple OSS Distributions 		ss_flags |= kTaskWqExceededConstrainedThreadLimit;
5253*33de042dSApple OSS Distributions 	}
5254*33de042dSApple OSS Distributions 
5255*33de042dSApple OSS Distributions 	if (wq->wq_nthreads >= wq_max_threads) {
5256*33de042dSApple OSS Distributions 		ss_flags |= kTaskWqExceededTotalThreadLimit;
5257*33de042dSApple OSS Distributions 	}
5258*33de042dSApple OSS Distributions 
5259*33de042dSApple OSS Distributions 	uint64_t total_cooperative_threads;
5260*33de042dSApple OSS Distributions 	total_cooperative_threads = workq_num_cooperative_threads_scheduled_to_qos_internal(wq,
5261*33de042dSApple OSS Distributions 	    WORKQ_THREAD_QOS_MIN);
5262*33de042dSApple OSS Distributions 	if ((total_cooperative_threads == wq_cooperative_queue_max_size(wq)) &&
5263*33de042dSApple OSS Distributions 	    workq_has_cooperative_thread_requests(wq)) {
5264*33de042dSApple OSS Distributions 		ss_flags |= kTaskWqExceededCooperativeThreadLimit;
5265*33de042dSApple OSS Distributions 	}
5266*33de042dSApple OSS Distributions 
5267*33de042dSApple OSS Distributions 	if (wq->wq_exceeded_active_constrained_thread_limit) {
5268*33de042dSApple OSS Distributions 		ss_flags |= kTaskWqExceededActiveConstrainedThreadLimit;
5269*33de042dSApple OSS Distributions 	}
5270*33de042dSApple OSS Distributions 
5271*33de042dSApple OSS Distributions 	return ss_flags;
5272*33de042dSApple OSS Distributions }
5273*33de042dSApple OSS Distributions 
5274*33de042dSApple OSS Distributions void
workq_init(void)5275*33de042dSApple OSS Distributions workq_init(void)
5276*33de042dSApple OSS Distributions {
5277*33de042dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(wq_stalled_window.usecs,
5278*33de042dSApple OSS Distributions 	    NSEC_PER_USEC, &wq_stalled_window.abstime);
5279*33de042dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(wq_reduce_pool_window.usecs,
5280*33de042dSApple OSS Distributions 	    NSEC_PER_USEC, &wq_reduce_pool_window.abstime);
5281*33de042dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(wq_max_timer_interval.usecs,
5282*33de042dSApple OSS Distributions 	    NSEC_PER_USEC, &wq_max_timer_interval.abstime);
5283*33de042dSApple OSS Distributions 
5284*33de042dSApple OSS Distributions 	thread_deallocate_daemon_register_queue(&workq_deallocate_queue,
5285*33de042dSApple OSS Distributions 	    workq_deallocate_queue_invoke);
5286*33de042dSApple OSS Distributions }
5287