xref: /xnu-11215.1.10/bsd/pthread/pthread_workqueue.c (revision 8d741a5de7ff4191bf97d57b9f54c2f6d4a15585)
1*8d741a5dSApple OSS Distributions /*
2*8d741a5dSApple OSS Distributions  * Copyright (c) 2000-2020 Apple Inc. All rights reserved.
3*8d741a5dSApple OSS Distributions  *
4*8d741a5dSApple OSS Distributions  * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5*8d741a5dSApple OSS Distributions  *
6*8d741a5dSApple OSS Distributions  * This file contains Original Code and/or Modifications of Original Code
7*8d741a5dSApple OSS Distributions  * as defined in and that are subject to the Apple Public Source License
8*8d741a5dSApple OSS Distributions  * Version 2.0 (the 'License'). You may not use this file except in
9*8d741a5dSApple OSS Distributions  * compliance with the License. The rights granted to you under the License
10*8d741a5dSApple OSS Distributions  * may not be used to create, or enable the creation or redistribution of,
11*8d741a5dSApple OSS Distributions  * unlawful or unlicensed copies of an Apple operating system, or to
12*8d741a5dSApple OSS Distributions  * circumvent, violate, or enable the circumvention or violation of, any
13*8d741a5dSApple OSS Distributions  * terms of an Apple operating system software license agreement.
14*8d741a5dSApple OSS Distributions  *
15*8d741a5dSApple OSS Distributions  * Please obtain a copy of the License at
16*8d741a5dSApple OSS Distributions  * http://www.opensource.apple.com/apsl/ and read it before using this file.
17*8d741a5dSApple OSS Distributions  *
18*8d741a5dSApple OSS Distributions  * The Original Code and all software distributed under the License are
19*8d741a5dSApple OSS Distributions  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20*8d741a5dSApple OSS Distributions  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21*8d741a5dSApple OSS Distributions  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22*8d741a5dSApple OSS Distributions  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23*8d741a5dSApple OSS Distributions  * Please see the License for the specific language governing rights and
24*8d741a5dSApple OSS Distributions  * limitations under the License.
25*8d741a5dSApple OSS Distributions  *
26*8d741a5dSApple OSS Distributions  * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27*8d741a5dSApple OSS Distributions  */
28*8d741a5dSApple OSS Distributions /* Copyright (c) 1995-2018 Apple, Inc. All Rights Reserved */
29*8d741a5dSApple OSS Distributions 
30*8d741a5dSApple OSS Distributions #include <sys/cdefs.h>
31*8d741a5dSApple OSS Distributions 
32*8d741a5dSApple OSS Distributions #include <kern/assert.h>
33*8d741a5dSApple OSS Distributions #include <kern/ast.h>
34*8d741a5dSApple OSS Distributions #include <kern/clock.h>
35*8d741a5dSApple OSS Distributions #include <kern/cpu_data.h>
36*8d741a5dSApple OSS Distributions #include <kern/kern_types.h>
37*8d741a5dSApple OSS Distributions #include <kern/policy_internal.h>
38*8d741a5dSApple OSS Distributions #include <kern/processor.h>
39*8d741a5dSApple OSS Distributions #include <kern/sched_prim.h>    /* for thread_exception_return */
40*8d741a5dSApple OSS Distributions #include <kern/task.h>
41*8d741a5dSApple OSS Distributions #include <kern/thread.h>
42*8d741a5dSApple OSS Distributions #include <kern/thread_group.h>
43*8d741a5dSApple OSS Distributions #include <kern/zalloc.h>
44*8d741a5dSApple OSS Distributions #include <kern/work_interval.h>
45*8d741a5dSApple OSS Distributions #include <mach/kern_return.h>
46*8d741a5dSApple OSS Distributions #include <mach/mach_param.h>
47*8d741a5dSApple OSS Distributions #include <mach/mach_port.h>
48*8d741a5dSApple OSS Distributions #include <mach/mach_types.h>
49*8d741a5dSApple OSS Distributions #include <mach/mach_vm.h>
50*8d741a5dSApple OSS Distributions #include <mach/sync_policy.h>
51*8d741a5dSApple OSS Distributions #include <mach/task.h>
52*8d741a5dSApple OSS Distributions #include <mach/thread_act.h> /* for thread_resume */
53*8d741a5dSApple OSS Distributions #include <mach/thread_policy.h>
54*8d741a5dSApple OSS Distributions #include <mach/thread_status.h>
55*8d741a5dSApple OSS Distributions #include <mach/vm_prot.h>
56*8d741a5dSApple OSS Distributions #include <mach/vm_statistics.h>
57*8d741a5dSApple OSS Distributions #include <machine/atomic.h>
58*8d741a5dSApple OSS Distributions #include <machine/machine_routines.h>
59*8d741a5dSApple OSS Distributions #include <machine/smp.h>
60*8d741a5dSApple OSS Distributions #include <vm/vm_map.h>
61*8d741a5dSApple OSS Distributions #include <vm/vm_protos.h>
62*8d741a5dSApple OSS Distributions 
63*8d741a5dSApple OSS Distributions #include <sys/eventvar.h>
64*8d741a5dSApple OSS Distributions #include <sys/kdebug.h>
65*8d741a5dSApple OSS Distributions #include <sys/kernel.h>
66*8d741a5dSApple OSS Distributions #include <sys/lock.h>
67*8d741a5dSApple OSS Distributions #include <sys/param.h>
68*8d741a5dSApple OSS Distributions #include <sys/proc_info.h>      /* for fill_procworkqueue */
69*8d741a5dSApple OSS Distributions #include <sys/proc_internal.h>
70*8d741a5dSApple OSS Distributions #include <sys/pthread_shims.h>
71*8d741a5dSApple OSS Distributions #include <sys/resourcevar.h>
72*8d741a5dSApple OSS Distributions #include <sys/signalvar.h>
73*8d741a5dSApple OSS Distributions #include <sys/sysctl.h>
74*8d741a5dSApple OSS Distributions #include <sys/sysproto.h>
75*8d741a5dSApple OSS Distributions #include <sys/systm.h>
76*8d741a5dSApple OSS Distributions #include <sys/ulock.h> /* for ulock_owner_value_to_port_name */
77*8d741a5dSApple OSS Distributions 
78*8d741a5dSApple OSS Distributions #include <pthread/bsdthread_private.h>
79*8d741a5dSApple OSS Distributions #include <pthread/workqueue_syscalls.h>
80*8d741a5dSApple OSS Distributions #include <pthread/workqueue_internal.h>
81*8d741a5dSApple OSS Distributions #include <pthread/workqueue_trace.h>
82*8d741a5dSApple OSS Distributions 
83*8d741a5dSApple OSS Distributions #include <os/log.h>
84*8d741a5dSApple OSS Distributions 
85*8d741a5dSApple OSS Distributions static void workq_unpark_continue(void *uth, wait_result_t wr) __dead2;
86*8d741a5dSApple OSS Distributions 
87*8d741a5dSApple OSS Distributions static void workq_bound_thread_unpark_continue(void *uth, wait_result_t wr) __dead2;
88*8d741a5dSApple OSS Distributions 
89*8d741a5dSApple OSS Distributions static void workq_bound_thread_initialize_and_unpark_continue(void *uth, wait_result_t wr) __dead2;
90*8d741a5dSApple OSS Distributions 
91*8d741a5dSApple OSS Distributions static void workq_bound_thread_setup_and_run(struct uthread *uth, int setup_flags) __dead2;
92*8d741a5dSApple OSS Distributions 
93*8d741a5dSApple OSS Distributions static void workq_schedule_creator(proc_t p, struct workqueue *wq,
94*8d741a5dSApple OSS Distributions     workq_kern_threadreq_flags_t flags);
95*8d741a5dSApple OSS Distributions 
96*8d741a5dSApple OSS Distributions static bool workq_threadreq_admissible(struct workqueue *wq, struct uthread *uth,
97*8d741a5dSApple OSS Distributions     workq_threadreq_t req);
98*8d741a5dSApple OSS Distributions 
99*8d741a5dSApple OSS Distributions static uint32_t workq_constrained_allowance(struct workqueue *wq,
100*8d741a5dSApple OSS Distributions     thread_qos_t at_qos, struct uthread *uth,
101*8d741a5dSApple OSS Distributions     bool may_start_timer, bool record_failed_allowance);
102*8d741a5dSApple OSS Distributions 
103*8d741a5dSApple OSS Distributions static bool _wq_cooperative_queue_refresh_best_req_qos(struct workqueue *wq);
104*8d741a5dSApple OSS Distributions 
105*8d741a5dSApple OSS Distributions static bool workq_thread_is_busy(uint64_t cur_ts,
106*8d741a5dSApple OSS Distributions     _Atomic uint64_t *lastblocked_tsp);
107*8d741a5dSApple OSS Distributions 
108*8d741a5dSApple OSS Distributions static int workq_sysctl_handle_usecs SYSCTL_HANDLER_ARGS;
109*8d741a5dSApple OSS Distributions 
110*8d741a5dSApple OSS Distributions static bool
111*8d741a5dSApple OSS Distributions workq_schedule_delayed_thread_creation(struct workqueue *wq, int flags);
112*8d741a5dSApple OSS Distributions 
113*8d741a5dSApple OSS Distributions static inline void
114*8d741a5dSApple OSS Distributions workq_lock_spin(struct workqueue *wq);
115*8d741a5dSApple OSS Distributions 
116*8d741a5dSApple OSS Distributions static inline void
117*8d741a5dSApple OSS Distributions workq_unlock(struct workqueue *wq);
118*8d741a5dSApple OSS Distributions 
119*8d741a5dSApple OSS Distributions #pragma mark globals
120*8d741a5dSApple OSS Distributions 
121*8d741a5dSApple OSS Distributions struct workq_usec_var {
122*8d741a5dSApple OSS Distributions 	uint32_t usecs;
123*8d741a5dSApple OSS Distributions 	uint64_t abstime;
124*8d741a5dSApple OSS Distributions };
125*8d741a5dSApple OSS Distributions 
126*8d741a5dSApple OSS Distributions #define WORKQ_SYSCTL_USECS(var, init) \
127*8d741a5dSApple OSS Distributions 	        static struct workq_usec_var var = { .usecs = init }; \
128*8d741a5dSApple OSS Distributions 	        SYSCTL_OID(_kern, OID_AUTO, var##_usecs, \
129*8d741a5dSApple OSS Distributions 	                        CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED, &var, 0, \
130*8d741a5dSApple OSS Distributions 	                        workq_sysctl_handle_usecs, "I", "")
131*8d741a5dSApple OSS Distributions 
132*8d741a5dSApple OSS Distributions static LCK_GRP_DECLARE(workq_lck_grp, "workq");
133*8d741a5dSApple OSS Distributions os_refgrp_decl(static, workq_refgrp, "workq", NULL);
134*8d741a5dSApple OSS Distributions 
135*8d741a5dSApple OSS Distributions static ZONE_DEFINE(workq_zone_workqueue, "workq.wq",
136*8d741a5dSApple OSS Distributions     sizeof(struct workqueue), ZC_NONE);
137*8d741a5dSApple OSS Distributions static ZONE_DEFINE(workq_zone_threadreq, "workq.threadreq",
138*8d741a5dSApple OSS Distributions     sizeof(struct workq_threadreq_s), ZC_CACHING);
139*8d741a5dSApple OSS Distributions 
140*8d741a5dSApple OSS Distributions static struct mpsc_daemon_queue workq_deallocate_queue;
141*8d741a5dSApple OSS Distributions 
142*8d741a5dSApple OSS Distributions WORKQ_SYSCTL_USECS(wq_stalled_window, WQ_STALLED_WINDOW_USECS);
143*8d741a5dSApple OSS Distributions WORKQ_SYSCTL_USECS(wq_reduce_pool_window, WQ_REDUCE_POOL_WINDOW_USECS);
144*8d741a5dSApple OSS Distributions WORKQ_SYSCTL_USECS(wq_max_timer_interval, WQ_MAX_TIMER_INTERVAL_USECS);
145*8d741a5dSApple OSS Distributions static uint32_t wq_max_threads              = WORKQUEUE_MAXTHREADS;
146*8d741a5dSApple OSS Distributions static uint32_t wq_max_constrained_threads  = WORKQUEUE_MAXTHREADS / 8;
147*8d741a5dSApple OSS Distributions static uint32_t wq_init_constrained_limit   = 1;
148*8d741a5dSApple OSS Distributions static uint16_t wq_death_max_load;
149*8d741a5dSApple OSS Distributions static uint32_t wq_max_parallelism[WORKQ_NUM_QOS_BUCKETS];
150*8d741a5dSApple OSS Distributions 
151*8d741a5dSApple OSS Distributions /*
152*8d741a5dSApple OSS Distributions  * This is not a hard limit but the max size we want to aim to hit across the
153*8d741a5dSApple OSS Distributions  * entire cooperative pool. We can oversubscribe the pool due to non-cooperative
154*8d741a5dSApple OSS Distributions  * workers and the max we will oversubscribe the pool by, is a total of
155*8d741a5dSApple OSS Distributions  * wq_max_cooperative_threads * WORKQ_NUM_QOS_BUCKETS.
156*8d741a5dSApple OSS Distributions  */
157*8d741a5dSApple OSS Distributions static uint32_t wq_max_cooperative_threads;
158*8d741a5dSApple OSS Distributions 
159*8d741a5dSApple OSS Distributions static inline uint32_t
wq_cooperative_queue_max_size(struct workqueue * wq)160*8d741a5dSApple OSS Distributions wq_cooperative_queue_max_size(struct workqueue *wq)
161*8d741a5dSApple OSS Distributions {
162*8d741a5dSApple OSS Distributions 	return wq->wq_cooperative_queue_has_limited_max_size ? 1 : wq_max_cooperative_threads;
163*8d741a5dSApple OSS Distributions }
164*8d741a5dSApple OSS Distributions 
165*8d741a5dSApple OSS Distributions #pragma mark sysctls
166*8d741a5dSApple OSS Distributions 
167*8d741a5dSApple OSS Distributions static int
168*8d741a5dSApple OSS Distributions workq_sysctl_handle_usecs SYSCTL_HANDLER_ARGS
169*8d741a5dSApple OSS Distributions {
170*8d741a5dSApple OSS Distributions #pragma unused(arg2)
171*8d741a5dSApple OSS Distributions 	struct workq_usec_var *v = arg1;
172*8d741a5dSApple OSS Distributions 	int error = sysctl_handle_int(oidp, &v->usecs, 0, req);
173*8d741a5dSApple OSS Distributions 	if (error || !req->newptr) {
174*8d741a5dSApple OSS Distributions 		return error;
175*8d741a5dSApple OSS Distributions 	}
176*8d741a5dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(v->usecs, NSEC_PER_USEC,
177*8d741a5dSApple OSS Distributions 	    &v->abstime);
178*8d741a5dSApple OSS Distributions 	return 0;
179*8d741a5dSApple OSS Distributions }
180*8d741a5dSApple OSS Distributions 
181*8d741a5dSApple OSS Distributions SYSCTL_INT(_kern, OID_AUTO, wq_max_threads, CTLFLAG_RW | CTLFLAG_LOCKED,
182*8d741a5dSApple OSS Distributions     &wq_max_threads, 0, "");
183*8d741a5dSApple OSS Distributions 
184*8d741a5dSApple OSS Distributions SYSCTL_INT(_kern, OID_AUTO, wq_max_constrained_threads, CTLFLAG_RW | CTLFLAG_LOCKED,
185*8d741a5dSApple OSS Distributions     &wq_max_constrained_threads, 0, "");
186*8d741a5dSApple OSS Distributions 
187*8d741a5dSApple OSS Distributions static int
188*8d741a5dSApple OSS Distributions wq_limit_cooperative_threads_for_proc SYSCTL_HANDLER_ARGS
189*8d741a5dSApple OSS Distributions {
190*8d741a5dSApple OSS Distributions #pragma unused(arg1, arg2, oidp)
191*8d741a5dSApple OSS Distributions 	int input_pool_size = 0;
192*8d741a5dSApple OSS Distributions 	int changed;
193*8d741a5dSApple OSS Distributions 	int error = 0;
194*8d741a5dSApple OSS Distributions 
195*8d741a5dSApple OSS Distributions 	error = sysctl_io_number(req, 0, sizeof(int), &input_pool_size, &changed);
196*8d741a5dSApple OSS Distributions 	if (error || !changed) {
197*8d741a5dSApple OSS Distributions 		return error;
198*8d741a5dSApple OSS Distributions 	}
199*8d741a5dSApple OSS Distributions 
200*8d741a5dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_SIZE_DEFAULT 0
201*8d741a5dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_SIZE_STRICT_PER_QOS -1
202*8d741a5dSApple OSS Distributions /* Not available currently, but sysctl interface is designed to allow these
203*8d741a5dSApple OSS Distributions  * extra parameters:
204*8d741a5dSApple OSS Distributions  *		WQ_COOPERATIVE_POOL_SIZE_STRICT : -2 (across all bucket)
205*8d741a5dSApple OSS Distributions  *		WQ_COOPERATIVE_POOL_SIZE_CUSTOM : [1, 512]
206*8d741a5dSApple OSS Distributions  */
207*8d741a5dSApple OSS Distributions 
208*8d741a5dSApple OSS Distributions 	if (input_pool_size != WQ_COOPERATIVE_POOL_SIZE_DEFAULT
209*8d741a5dSApple OSS Distributions 	    && input_pool_size != WQ_COOPERATIVE_POOL_SIZE_STRICT_PER_QOS) {
210*8d741a5dSApple OSS Distributions 		error = EINVAL;
211*8d741a5dSApple OSS Distributions 		goto out;
212*8d741a5dSApple OSS Distributions 	}
213*8d741a5dSApple OSS Distributions 
214*8d741a5dSApple OSS Distributions 	proc_t p = req->p;
215*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
216*8d741a5dSApple OSS Distributions 
217*8d741a5dSApple OSS Distributions 	if (wq != NULL) {
218*8d741a5dSApple OSS Distributions 		workq_lock_spin(wq);
219*8d741a5dSApple OSS Distributions 		if (wq->wq_reqcount > 0 || wq->wq_nthreads > 0) {
220*8d741a5dSApple OSS Distributions 			// Hackily enforce that the workqueue is still new (no requests or
221*8d741a5dSApple OSS Distributions 			// threads)
222*8d741a5dSApple OSS Distributions 			error = ENOTSUP;
223*8d741a5dSApple OSS Distributions 		} else {
224*8d741a5dSApple OSS Distributions 			wq->wq_cooperative_queue_has_limited_max_size = (input_pool_size == WQ_COOPERATIVE_POOL_SIZE_STRICT_PER_QOS);
225*8d741a5dSApple OSS Distributions 		}
226*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
227*8d741a5dSApple OSS Distributions 	} else {
228*8d741a5dSApple OSS Distributions 		/* This process has no workqueue, calling this syctl makes no sense */
229*8d741a5dSApple OSS Distributions 		return ENOTSUP;
230*8d741a5dSApple OSS Distributions 	}
231*8d741a5dSApple OSS Distributions 
232*8d741a5dSApple OSS Distributions out:
233*8d741a5dSApple OSS Distributions 	return error;
234*8d741a5dSApple OSS Distributions }
235*8d741a5dSApple OSS Distributions 
236*8d741a5dSApple OSS Distributions SYSCTL_PROC(_kern, OID_AUTO, wq_limit_cooperative_threads,
237*8d741a5dSApple OSS Distributions     CTLFLAG_ANYBODY | CTLFLAG_MASKED | CTLFLAG_WR | CTLFLAG_LOCKED | CTLTYPE_INT, 0, 0,
238*8d741a5dSApple OSS Distributions     wq_limit_cooperative_threads_for_proc,
239*8d741a5dSApple OSS Distributions     "I", "Modify the max pool size of the cooperative pool");
240*8d741a5dSApple OSS Distributions 
241*8d741a5dSApple OSS Distributions #pragma mark p_wqptr
242*8d741a5dSApple OSS Distributions 
243*8d741a5dSApple OSS Distributions #define WQPTR_IS_INITING_VALUE ((struct workqueue *)~(uintptr_t)0)
244*8d741a5dSApple OSS Distributions 
245*8d741a5dSApple OSS Distributions static struct workqueue *
proc_get_wqptr_fast(struct proc * p)246*8d741a5dSApple OSS Distributions proc_get_wqptr_fast(struct proc *p)
247*8d741a5dSApple OSS Distributions {
248*8d741a5dSApple OSS Distributions 	return os_atomic_load(&p->p_wqptr, relaxed);
249*8d741a5dSApple OSS Distributions }
250*8d741a5dSApple OSS Distributions 
251*8d741a5dSApple OSS Distributions struct workqueue *
proc_get_wqptr(struct proc * p)252*8d741a5dSApple OSS Distributions proc_get_wqptr(struct proc *p)
253*8d741a5dSApple OSS Distributions {
254*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
255*8d741a5dSApple OSS Distributions 	return wq == WQPTR_IS_INITING_VALUE ? NULL : wq;
256*8d741a5dSApple OSS Distributions }
257*8d741a5dSApple OSS Distributions 
258*8d741a5dSApple OSS Distributions static void
proc_set_wqptr(struct proc * p,struct workqueue * wq)259*8d741a5dSApple OSS Distributions proc_set_wqptr(struct proc *p, struct workqueue *wq)
260*8d741a5dSApple OSS Distributions {
261*8d741a5dSApple OSS Distributions 	wq = os_atomic_xchg(&p->p_wqptr, wq, release);
262*8d741a5dSApple OSS Distributions 	if (wq == WQPTR_IS_INITING_VALUE) {
263*8d741a5dSApple OSS Distributions 		proc_lock(p);
264*8d741a5dSApple OSS Distributions 		thread_wakeup(&p->p_wqptr);
265*8d741a5dSApple OSS Distributions 		proc_unlock(p);
266*8d741a5dSApple OSS Distributions 	}
267*8d741a5dSApple OSS Distributions }
268*8d741a5dSApple OSS Distributions 
269*8d741a5dSApple OSS Distributions static bool
proc_init_wqptr_or_wait(struct proc * p)270*8d741a5dSApple OSS Distributions proc_init_wqptr_or_wait(struct proc *p)
271*8d741a5dSApple OSS Distributions {
272*8d741a5dSApple OSS Distributions 	struct workqueue *wq;
273*8d741a5dSApple OSS Distributions 
274*8d741a5dSApple OSS Distributions 	proc_lock(p);
275*8d741a5dSApple OSS Distributions 	wq = os_atomic_load(&p->p_wqptr, relaxed);
276*8d741a5dSApple OSS Distributions 
277*8d741a5dSApple OSS Distributions 	if (wq == NULL) {
278*8d741a5dSApple OSS Distributions 		os_atomic_store(&p->p_wqptr, WQPTR_IS_INITING_VALUE, relaxed);
279*8d741a5dSApple OSS Distributions 		proc_unlock(p);
280*8d741a5dSApple OSS Distributions 		return true;
281*8d741a5dSApple OSS Distributions 	}
282*8d741a5dSApple OSS Distributions 
283*8d741a5dSApple OSS Distributions 	if (wq == WQPTR_IS_INITING_VALUE) {
284*8d741a5dSApple OSS Distributions 		assert_wait(&p->p_wqptr, THREAD_UNINT);
285*8d741a5dSApple OSS Distributions 		proc_unlock(p);
286*8d741a5dSApple OSS Distributions 		thread_block(THREAD_CONTINUE_NULL);
287*8d741a5dSApple OSS Distributions 	} else {
288*8d741a5dSApple OSS Distributions 		proc_unlock(p);
289*8d741a5dSApple OSS Distributions 	}
290*8d741a5dSApple OSS Distributions 	return false;
291*8d741a5dSApple OSS Distributions }
292*8d741a5dSApple OSS Distributions 
293*8d741a5dSApple OSS Distributions static inline event_t
workq_parked_wait_event(struct uthread * uth)294*8d741a5dSApple OSS Distributions workq_parked_wait_event(struct uthread *uth)
295*8d741a5dSApple OSS Distributions {
296*8d741a5dSApple OSS Distributions 	return (event_t)&uth->uu_workq_stackaddr;
297*8d741a5dSApple OSS Distributions }
298*8d741a5dSApple OSS Distributions 
299*8d741a5dSApple OSS Distributions static inline void
workq_thread_wakeup(struct uthread * uth)300*8d741a5dSApple OSS Distributions workq_thread_wakeup(struct uthread *uth)
301*8d741a5dSApple OSS Distributions {
302*8d741a5dSApple OSS Distributions 	thread_wakeup_thread(workq_parked_wait_event(uth), get_machthread(uth));
303*8d741a5dSApple OSS Distributions }
304*8d741a5dSApple OSS Distributions 
305*8d741a5dSApple OSS Distributions #pragma mark wq_thactive
306*8d741a5dSApple OSS Distributions 
307*8d741a5dSApple OSS Distributions #if defined(__LP64__)
308*8d741a5dSApple OSS Distributions // Layout is:
309*8d741a5dSApple OSS Distributions //   127 - 115 : 13 bits of zeroes
310*8d741a5dSApple OSS Distributions //   114 - 112 : best QoS among all pending constrained requests
311*8d741a5dSApple OSS Distributions //   111 -   0 : MGR, AUI, UI, IN, DF, UT, BG+MT buckets every 16 bits
312*8d741a5dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_WIDTH 16
313*8d741a5dSApple OSS Distributions #define WQ_THACTIVE_QOS_SHIFT    (7 * WQ_THACTIVE_BUCKET_WIDTH)
314*8d741a5dSApple OSS Distributions #else
315*8d741a5dSApple OSS Distributions // Layout is:
316*8d741a5dSApple OSS Distributions //   63 - 61 : best QoS among all pending constrained requests
317*8d741a5dSApple OSS Distributions //   60      : Manager bucket (0 or 1)
318*8d741a5dSApple OSS Distributions //   59 -  0 : AUI, UI, IN, DF, UT, BG+MT buckets every 10 bits
319*8d741a5dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_WIDTH 10
320*8d741a5dSApple OSS Distributions #define WQ_THACTIVE_QOS_SHIFT    (6 * WQ_THACTIVE_BUCKET_WIDTH + 1)
321*8d741a5dSApple OSS Distributions #endif
322*8d741a5dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_MASK  ((1U << WQ_THACTIVE_BUCKET_WIDTH) - 1)
323*8d741a5dSApple OSS Distributions #define WQ_THACTIVE_BUCKET_HALF  (1U << (WQ_THACTIVE_BUCKET_WIDTH - 1))
324*8d741a5dSApple OSS Distributions 
325*8d741a5dSApple OSS Distributions static_assert(sizeof(wq_thactive_t) * CHAR_BIT - WQ_THACTIVE_QOS_SHIFT >= 3,
326*8d741a5dSApple OSS Distributions     "Make sure we have space to encode a QoS");
327*8d741a5dSApple OSS Distributions 
328*8d741a5dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive(struct workqueue * wq)329*8d741a5dSApple OSS Distributions _wq_thactive(struct workqueue *wq)
330*8d741a5dSApple OSS Distributions {
331*8d741a5dSApple OSS Distributions 	return os_atomic_load_wide(&wq->wq_thactive, relaxed);
332*8d741a5dSApple OSS Distributions }
333*8d741a5dSApple OSS Distributions 
334*8d741a5dSApple OSS Distributions static inline uint8_t
_wq_bucket(thread_qos_t qos)335*8d741a5dSApple OSS Distributions _wq_bucket(thread_qos_t qos)
336*8d741a5dSApple OSS Distributions {
337*8d741a5dSApple OSS Distributions 	// Map both BG and MT to the same bucket by over-shifting down and
338*8d741a5dSApple OSS Distributions 	// clamping MT and BG together.
339*8d741a5dSApple OSS Distributions 	switch (qos) {
340*8d741a5dSApple OSS Distributions 	case THREAD_QOS_MAINTENANCE:
341*8d741a5dSApple OSS Distributions 		return 0;
342*8d741a5dSApple OSS Distributions 	default:
343*8d741a5dSApple OSS Distributions 		return qos - 2;
344*8d741a5dSApple OSS Distributions 	}
345*8d741a5dSApple OSS Distributions }
346*8d741a5dSApple OSS Distributions 
347*8d741a5dSApple OSS Distributions #define WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(tha) \
348*8d741a5dSApple OSS Distributions 	        ((thread_qos_t)((tha) >> WQ_THACTIVE_QOS_SHIFT))
349*8d741a5dSApple OSS Distributions 
350*8d741a5dSApple OSS Distributions static inline thread_qos_t
_wq_thactive_best_constrained_req_qos(struct workqueue * wq)351*8d741a5dSApple OSS Distributions _wq_thactive_best_constrained_req_qos(struct workqueue *wq)
352*8d741a5dSApple OSS Distributions {
353*8d741a5dSApple OSS Distributions 	// Avoid expensive atomic operations: the three bits we're loading are in
354*8d741a5dSApple OSS Distributions 	// a single byte, and always updated under the workqueue lock
355*8d741a5dSApple OSS Distributions 	wq_thactive_t v = *(wq_thactive_t *)&wq->wq_thactive;
356*8d741a5dSApple OSS Distributions 	return WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(v);
357*8d741a5dSApple OSS Distributions }
358*8d741a5dSApple OSS Distributions 
359*8d741a5dSApple OSS Distributions static void
_wq_thactive_refresh_best_constrained_req_qos(struct workqueue * wq)360*8d741a5dSApple OSS Distributions _wq_thactive_refresh_best_constrained_req_qos(struct workqueue *wq)
361*8d741a5dSApple OSS Distributions {
362*8d741a5dSApple OSS Distributions 	thread_qos_t old_qos, new_qos;
363*8d741a5dSApple OSS Distributions 	workq_threadreq_t req;
364*8d741a5dSApple OSS Distributions 
365*8d741a5dSApple OSS Distributions 	req = priority_queue_max(&wq->wq_constrained_queue,
366*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
367*8d741a5dSApple OSS Distributions 	new_qos = req ? req->tr_qos : THREAD_QOS_UNSPECIFIED;
368*8d741a5dSApple OSS Distributions 	old_qos = _wq_thactive_best_constrained_req_qos(wq);
369*8d741a5dSApple OSS Distributions 	if (old_qos != new_qos) {
370*8d741a5dSApple OSS Distributions 		long delta = (long)new_qos - (long)old_qos;
371*8d741a5dSApple OSS Distributions 		wq_thactive_t v = (wq_thactive_t)delta << WQ_THACTIVE_QOS_SHIFT;
372*8d741a5dSApple OSS Distributions 		/*
373*8d741a5dSApple OSS Distributions 		 * We can do an atomic add relative to the initial load because updates
374*8d741a5dSApple OSS Distributions 		 * to this qos are always serialized under the workqueue lock.
375*8d741a5dSApple OSS Distributions 		 */
376*8d741a5dSApple OSS Distributions 		v = os_atomic_add(&wq->wq_thactive, v, relaxed);
377*8d741a5dSApple OSS Distributions #ifdef __LP64__
378*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thactive_update, wq, (uint64_t)v,
379*8d741a5dSApple OSS Distributions 		    (uint64_t)(v >> 64), 0);
380*8d741a5dSApple OSS Distributions #else
381*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thactive_update, wq, v, 0, 0);
382*8d741a5dSApple OSS Distributions #endif
383*8d741a5dSApple OSS Distributions 	}
384*8d741a5dSApple OSS Distributions }
385*8d741a5dSApple OSS Distributions 
386*8d741a5dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive_offset_for_qos(thread_qos_t qos)387*8d741a5dSApple OSS Distributions _wq_thactive_offset_for_qos(thread_qos_t qos)
388*8d741a5dSApple OSS Distributions {
389*8d741a5dSApple OSS Distributions 	uint8_t bucket = _wq_bucket(qos);
390*8d741a5dSApple OSS Distributions 	__builtin_assume(bucket < WORKQ_NUM_BUCKETS);
391*8d741a5dSApple OSS Distributions 	return (wq_thactive_t)1 << (bucket * WQ_THACTIVE_BUCKET_WIDTH);
392*8d741a5dSApple OSS Distributions }
393*8d741a5dSApple OSS Distributions 
394*8d741a5dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive_inc(struct workqueue * wq,thread_qos_t qos)395*8d741a5dSApple OSS Distributions _wq_thactive_inc(struct workqueue *wq, thread_qos_t qos)
396*8d741a5dSApple OSS Distributions {
397*8d741a5dSApple OSS Distributions 	wq_thactive_t v = _wq_thactive_offset_for_qos(qos);
398*8d741a5dSApple OSS Distributions 	return os_atomic_add_orig(&wq->wq_thactive, v, relaxed);
399*8d741a5dSApple OSS Distributions }
400*8d741a5dSApple OSS Distributions 
401*8d741a5dSApple OSS Distributions static inline wq_thactive_t
_wq_thactive_dec(struct workqueue * wq,thread_qos_t qos)402*8d741a5dSApple OSS Distributions _wq_thactive_dec(struct workqueue *wq, thread_qos_t qos)
403*8d741a5dSApple OSS Distributions {
404*8d741a5dSApple OSS Distributions 	wq_thactive_t v = _wq_thactive_offset_for_qos(qos);
405*8d741a5dSApple OSS Distributions 	return os_atomic_sub_orig(&wq->wq_thactive, v, relaxed);
406*8d741a5dSApple OSS Distributions }
407*8d741a5dSApple OSS Distributions 
408*8d741a5dSApple OSS Distributions static inline void
_wq_thactive_move(struct workqueue * wq,thread_qos_t old_qos,thread_qos_t new_qos)409*8d741a5dSApple OSS Distributions _wq_thactive_move(struct workqueue *wq,
410*8d741a5dSApple OSS Distributions     thread_qos_t old_qos, thread_qos_t new_qos)
411*8d741a5dSApple OSS Distributions {
412*8d741a5dSApple OSS Distributions 	wq_thactive_t v = _wq_thactive_offset_for_qos(new_qos) -
413*8d741a5dSApple OSS Distributions 	    _wq_thactive_offset_for_qos(old_qos);
414*8d741a5dSApple OSS Distributions 	os_atomic_add(&wq->wq_thactive, v, relaxed);
415*8d741a5dSApple OSS Distributions 	wq->wq_thscheduled_count[_wq_bucket(old_qos)]--;
416*8d741a5dSApple OSS Distributions 	wq->wq_thscheduled_count[_wq_bucket(new_qos)]++;
417*8d741a5dSApple OSS Distributions }
418*8d741a5dSApple OSS Distributions 
419*8d741a5dSApple OSS Distributions static inline uint32_t
_wq_thactive_aggregate_downto_qos(struct workqueue * wq,wq_thactive_t v,thread_qos_t qos,uint32_t * busycount,uint32_t * max_busycount)420*8d741a5dSApple OSS Distributions _wq_thactive_aggregate_downto_qos(struct workqueue *wq, wq_thactive_t v,
421*8d741a5dSApple OSS Distributions     thread_qos_t qos, uint32_t *busycount, uint32_t *max_busycount)
422*8d741a5dSApple OSS Distributions {
423*8d741a5dSApple OSS Distributions 	uint32_t count = 0, active;
424*8d741a5dSApple OSS Distributions 	uint64_t curtime;
425*8d741a5dSApple OSS Distributions 
426*8d741a5dSApple OSS Distributions 	assert(WORKQ_THREAD_QOS_MIN <= qos && qos <= WORKQ_THREAD_QOS_MAX);
427*8d741a5dSApple OSS Distributions 
428*8d741a5dSApple OSS Distributions 	if (busycount) {
429*8d741a5dSApple OSS Distributions 		curtime = mach_absolute_time();
430*8d741a5dSApple OSS Distributions 		*busycount = 0;
431*8d741a5dSApple OSS Distributions 	}
432*8d741a5dSApple OSS Distributions 	if (max_busycount) {
433*8d741a5dSApple OSS Distributions 		*max_busycount = THREAD_QOS_LAST - qos;
434*8d741a5dSApple OSS Distributions 	}
435*8d741a5dSApple OSS Distributions 
436*8d741a5dSApple OSS Distributions 	uint8_t i = _wq_bucket(qos);
437*8d741a5dSApple OSS Distributions 	v >>= i * WQ_THACTIVE_BUCKET_WIDTH;
438*8d741a5dSApple OSS Distributions 	for (; i < WORKQ_NUM_QOS_BUCKETS; i++, v >>= WQ_THACTIVE_BUCKET_WIDTH) {
439*8d741a5dSApple OSS Distributions 		active = v & WQ_THACTIVE_BUCKET_MASK;
440*8d741a5dSApple OSS Distributions 		count += active;
441*8d741a5dSApple OSS Distributions 
442*8d741a5dSApple OSS Distributions 		if (busycount && wq->wq_thscheduled_count[i] > active) {
443*8d741a5dSApple OSS Distributions 			if (workq_thread_is_busy(curtime, &wq->wq_lastblocked_ts[i])) {
444*8d741a5dSApple OSS Distributions 				/*
445*8d741a5dSApple OSS Distributions 				 * We only consider the last blocked thread for a given bucket
446*8d741a5dSApple OSS Distributions 				 * as busy because we don't want to take the list lock in each
447*8d741a5dSApple OSS Distributions 				 * sched callback. However this is an approximation that could
448*8d741a5dSApple OSS Distributions 				 * contribute to thread creation storms.
449*8d741a5dSApple OSS Distributions 				 */
450*8d741a5dSApple OSS Distributions 				(*busycount)++;
451*8d741a5dSApple OSS Distributions 			}
452*8d741a5dSApple OSS Distributions 		}
453*8d741a5dSApple OSS Distributions 	}
454*8d741a5dSApple OSS Distributions 
455*8d741a5dSApple OSS Distributions 	return count;
456*8d741a5dSApple OSS Distributions }
457*8d741a5dSApple OSS Distributions 
458*8d741a5dSApple OSS Distributions /* The input qos here should be the requested QoS of the thread, not accounting
459*8d741a5dSApple OSS Distributions  * for any overrides */
460*8d741a5dSApple OSS Distributions static inline void
_wq_cooperative_queue_scheduled_count_dec(struct workqueue * wq,thread_qos_t qos)461*8d741a5dSApple OSS Distributions _wq_cooperative_queue_scheduled_count_dec(struct workqueue *wq, thread_qos_t qos)
462*8d741a5dSApple OSS Distributions {
463*8d741a5dSApple OSS Distributions 	__assert_only uint8_t old_scheduled_count = wq->wq_cooperative_queue_scheduled_count[_wq_bucket(qos)]--;
464*8d741a5dSApple OSS Distributions 	assert(old_scheduled_count > 0);
465*8d741a5dSApple OSS Distributions }
466*8d741a5dSApple OSS Distributions 
467*8d741a5dSApple OSS Distributions /* The input qos here should be the requested QoS of the thread, not accounting
468*8d741a5dSApple OSS Distributions  * for any overrides */
469*8d741a5dSApple OSS Distributions static inline void
_wq_cooperative_queue_scheduled_count_inc(struct workqueue * wq,thread_qos_t qos)470*8d741a5dSApple OSS Distributions _wq_cooperative_queue_scheduled_count_inc(struct workqueue *wq, thread_qos_t qos)
471*8d741a5dSApple OSS Distributions {
472*8d741a5dSApple OSS Distributions 	__assert_only uint8_t old_scheduled_count = wq->wq_cooperative_queue_scheduled_count[_wq_bucket(qos)]++;
473*8d741a5dSApple OSS Distributions 	assert(old_scheduled_count < UINT8_MAX);
474*8d741a5dSApple OSS Distributions }
475*8d741a5dSApple OSS Distributions 
476*8d741a5dSApple OSS Distributions #pragma mark wq_flags
477*8d741a5dSApple OSS Distributions 
478*8d741a5dSApple OSS Distributions static inline uint32_t
_wq_flags(struct workqueue * wq)479*8d741a5dSApple OSS Distributions _wq_flags(struct workqueue *wq)
480*8d741a5dSApple OSS Distributions {
481*8d741a5dSApple OSS Distributions 	return os_atomic_load(&wq->wq_flags, relaxed);
482*8d741a5dSApple OSS Distributions }
483*8d741a5dSApple OSS Distributions 
484*8d741a5dSApple OSS Distributions static inline bool
_wq_exiting(struct workqueue * wq)485*8d741a5dSApple OSS Distributions _wq_exiting(struct workqueue *wq)
486*8d741a5dSApple OSS Distributions {
487*8d741a5dSApple OSS Distributions 	return _wq_flags(wq) & WQ_EXITING;
488*8d741a5dSApple OSS Distributions }
489*8d741a5dSApple OSS Distributions 
/*
 * Reports whether the workqueue of process `p` is exiting.
 *
 * A process that has no workqueue is reported as exiting as well.
 */
bool
workq_is_exiting(struct proc *p)
{
	struct workqueue *wq = proc_get_wqptr(p);

	if (wq == NULL) {
		return true;
	}
	return _wq_exiting(wq);
}
496*8d741a5dSApple OSS Distributions 
497*8d741a5dSApple OSS Distributions 
498*8d741a5dSApple OSS Distributions #pragma mark workqueue lock
499*8d741a5dSApple OSS Distributions 
500*8d741a5dSApple OSS Distributions static bool
workq_lock_is_acquired_kdp(struct workqueue * wq)501*8d741a5dSApple OSS Distributions workq_lock_is_acquired_kdp(struct workqueue *wq)
502*8d741a5dSApple OSS Distributions {
503*8d741a5dSApple OSS Distributions 	return kdp_lck_ticket_is_acquired(&wq->wq_lock);
504*8d741a5dSApple OSS Distributions }
505*8d741a5dSApple OSS Distributions 
/* Acquires the workqueue's ticket lock, accounted to workq_lck_grp. */
static inline void
workq_lock_spin(struct workqueue *wq)
{
	lck_ticket_lock(&wq->wq_lock, &workq_lck_grp);
}
511*8d741a5dSApple OSS Distributions 
/* Asserts that the workqueue's ticket lock is owned (LCK_TICKET_ASSERT_OWNED). */
static inline void
workq_lock_held(struct workqueue *wq)
{
	LCK_TICKET_ASSERT_OWNED(&wq->wq_lock);
}
517*8d741a5dSApple OSS Distributions 
518*8d741a5dSApple OSS Distributions static inline bool
workq_lock_try(struct workqueue * wq)519*8d741a5dSApple OSS Distributions workq_lock_try(struct workqueue *wq)
520*8d741a5dSApple OSS Distributions {
521*8d741a5dSApple OSS Distributions 	return lck_ticket_lock_try(&wq->wq_lock, &workq_lck_grp);
522*8d741a5dSApple OSS Distributions }
523*8d741a5dSApple OSS Distributions 
/* Releases the workqueue's ticket lock. */
static inline void
workq_unlock(struct workqueue *wq)
{
	lck_ticket_unlock(&wq->wq_lock);
}
529*8d741a5dSApple OSS Distributions 
530*8d741a5dSApple OSS Distributions #pragma mark idle thread lists
531*8d741a5dSApple OSS Distributions 
/*
 * Builds a struct uu_workq_policy compound literal whose requested QoS and
 * bucket are both set to `qos`; members not named here are zero-initialized.
 *
 * `qos` is expanded twice, so it must not have side effects. The argument is
 * parenthesized so that any expression can be passed safely.
 */
#define WORKQ_POLICY_INIT(qos) \
	(struct uu_workq_policy){ .qos_req = (qos), .qos_bucket = (qos) }
534*8d741a5dSApple OSS Distributions 
535*8d741a5dSApple OSS Distributions static inline thread_qos_t
workq_pri_bucket(struct uu_workq_policy req)536*8d741a5dSApple OSS Distributions workq_pri_bucket(struct uu_workq_policy req)
537*8d741a5dSApple OSS Distributions {
538*8d741a5dSApple OSS Distributions 	return MAX(MAX(req.qos_req, req.qos_max), req.qos_override);
539*8d741a5dSApple OSS Distributions }
540*8d741a5dSApple OSS Distributions 
541*8d741a5dSApple OSS Distributions static inline thread_qos_t
workq_pri_override(struct uu_workq_policy req)542*8d741a5dSApple OSS Distributions workq_pri_override(struct uu_workq_policy req)
543*8d741a5dSApple OSS Distributions {
544*8d741a5dSApple OSS Distributions 	return MAX(workq_pri_bucket(req), req.qos_bucket);
545*8d741a5dSApple OSS Distributions }
546*8d741a5dSApple OSS Distributions 
547*8d741a5dSApple OSS Distributions static inline bool
workq_thread_needs_params_change(workq_threadreq_t req,struct uthread * uth)548*8d741a5dSApple OSS Distributions workq_thread_needs_params_change(workq_threadreq_t req, struct uthread *uth)
549*8d741a5dSApple OSS Distributions {
550*8d741a5dSApple OSS Distributions 	workq_threadreq_param_t cur_trp, req_trp = { };
551*8d741a5dSApple OSS Distributions 
552*8d741a5dSApple OSS Distributions 	cur_trp.trp_value = uth->uu_save.uus_workq_park_data.workloop_params;
553*8d741a5dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS) {
554*8d741a5dSApple OSS Distributions 		req_trp = kqueue_threadreq_workloop_param(req);
555*8d741a5dSApple OSS Distributions 	}
556*8d741a5dSApple OSS Distributions 
557*8d741a5dSApple OSS Distributions 	/*
558*8d741a5dSApple OSS Distributions 	 * CPU percent flags are handled separately to policy changes, so ignore
559*8d741a5dSApple OSS Distributions 	 * them for all of these checks.
560*8d741a5dSApple OSS Distributions 	 */
561*8d741a5dSApple OSS Distributions 	uint16_t cur_flags = (cur_trp.trp_flags & ~TRP_CPUPERCENT);
562*8d741a5dSApple OSS Distributions 	uint16_t req_flags = (req_trp.trp_flags & ~TRP_CPUPERCENT);
563*8d741a5dSApple OSS Distributions 
564*8d741a5dSApple OSS Distributions 	if (!req_flags && !cur_flags) {
565*8d741a5dSApple OSS Distributions 		return false;
566*8d741a5dSApple OSS Distributions 	}
567*8d741a5dSApple OSS Distributions 
568*8d741a5dSApple OSS Distributions 	if (req_flags != cur_flags) {
569*8d741a5dSApple OSS Distributions 		return true;
570*8d741a5dSApple OSS Distributions 	}
571*8d741a5dSApple OSS Distributions 
572*8d741a5dSApple OSS Distributions 	if ((req_flags & TRP_PRIORITY) && req_trp.trp_pri != cur_trp.trp_pri) {
573*8d741a5dSApple OSS Distributions 		return true;
574*8d741a5dSApple OSS Distributions 	}
575*8d741a5dSApple OSS Distributions 
576*8d741a5dSApple OSS Distributions 	if ((req_flags & TRP_POLICY) && req_trp.trp_pol != cur_trp.trp_pol) {
577*8d741a5dSApple OSS Distributions 		return true;
578*8d741a5dSApple OSS Distributions 	}
579*8d741a5dSApple OSS Distributions 
580*8d741a5dSApple OSS Distributions 	return false;
581*8d741a5dSApple OSS Distributions }
582*8d741a5dSApple OSS Distributions 
583*8d741a5dSApple OSS Distributions static inline bool
workq_thread_needs_priority_change(workq_threadreq_t req,struct uthread * uth)584*8d741a5dSApple OSS Distributions workq_thread_needs_priority_change(workq_threadreq_t req, struct uthread *uth)
585*8d741a5dSApple OSS Distributions {
586*8d741a5dSApple OSS Distributions 	if (workq_thread_needs_params_change(req, uth)) {
587*8d741a5dSApple OSS Distributions 		return true;
588*8d741a5dSApple OSS Distributions 	}
589*8d741a5dSApple OSS Distributions 
590*8d741a5dSApple OSS Distributions 	if (req->tr_qos != workq_pri_override(uth->uu_workq_pri)) {
591*8d741a5dSApple OSS Distributions 		return true;
592*8d741a5dSApple OSS Distributions 	}
593*8d741a5dSApple OSS Distributions 
594*8d741a5dSApple OSS Distributions #if CONFIG_PREADOPT_TG
595*8d741a5dSApple OSS Distributions 	thread_group_qos_t tg = kqr_preadopt_thread_group(req);
596*8d741a5dSApple OSS Distributions 	if (KQWL_HAS_VALID_PREADOPTED_TG(tg)) {
597*8d741a5dSApple OSS Distributions 		/*
598*8d741a5dSApple OSS Distributions 		 * Ideally, we'd add check here to see if thread's preadopt TG is same
599*8d741a5dSApple OSS Distributions 		 * as the thread requests's thread group and short circuit if that is
600*8d741a5dSApple OSS Distributions 		 * the case. But in the interest of keeping the code clean and not
601*8d741a5dSApple OSS Distributions 		 * taking the thread lock here, we're going to skip this. We will
602*8d741a5dSApple OSS Distributions 		 * eventually shortcircuit once we try to set the preadoption thread
603*8d741a5dSApple OSS Distributions 		 * group on the thread.
604*8d741a5dSApple OSS Distributions 		 */
605*8d741a5dSApple OSS Distributions 		return true;
606*8d741a5dSApple OSS Distributions 	}
607*8d741a5dSApple OSS Distributions #endif
608*8d741a5dSApple OSS Distributions 
609*8d741a5dSApple OSS Distributions 	return false;
610*8d741a5dSApple OSS Distributions }
611*8d741a5dSApple OSS Distributions 
612*8d741a5dSApple OSS Distributions /* Input thread must be self. Called during self override, resetting overrides
613*8d741a5dSApple OSS Distributions  * or while processing kevents
614*8d741a5dSApple OSS Distributions  *
615*8d741a5dSApple OSS Distributions  * Called with workq lock held. Sometimes also the thread mutex
616*8d741a5dSApple OSS Distributions  */
617*8d741a5dSApple OSS Distributions static void
workq_thread_update_bucket(proc_t p,struct workqueue * wq,struct uthread * uth,struct uu_workq_policy old_pri,struct uu_workq_policy new_pri,bool force_run)618*8d741a5dSApple OSS Distributions workq_thread_update_bucket(proc_t p, struct workqueue *wq, struct uthread *uth,
619*8d741a5dSApple OSS Distributions     struct uu_workq_policy old_pri, struct uu_workq_policy new_pri,
620*8d741a5dSApple OSS Distributions     bool force_run)
621*8d741a5dSApple OSS Distributions {
622*8d741a5dSApple OSS Distributions 	assert(uth == current_uthread());
623*8d741a5dSApple OSS Distributions 
624*8d741a5dSApple OSS Distributions 	thread_qos_t old_bucket = old_pri.qos_bucket;
625*8d741a5dSApple OSS Distributions 	thread_qos_t new_bucket = workq_pri_bucket(new_pri);
626*8d741a5dSApple OSS Distributions 
627*8d741a5dSApple OSS Distributions 	if ((old_bucket != new_bucket) &&
628*8d741a5dSApple OSS Distributions 	    !workq_thread_is_permanently_bound(uth)) {
629*8d741a5dSApple OSS Distributions 		_wq_thactive_move(wq, old_bucket, new_bucket);
630*8d741a5dSApple OSS Distributions 	}
631*8d741a5dSApple OSS Distributions 
632*8d741a5dSApple OSS Distributions 	new_pri.qos_bucket = new_bucket;
633*8d741a5dSApple OSS Distributions 	uth->uu_workq_pri = new_pri;
634*8d741a5dSApple OSS Distributions 
635*8d741a5dSApple OSS Distributions 	if (old_pri.qos_override != new_pri.qos_override) {
636*8d741a5dSApple OSS Distributions 		thread_set_workq_override(get_machthread(uth), new_pri.qos_override);
637*8d741a5dSApple OSS Distributions 	}
638*8d741a5dSApple OSS Distributions 
639*8d741a5dSApple OSS Distributions 	if (wq->wq_reqcount &&
640*8d741a5dSApple OSS Distributions 	    !workq_thread_is_permanently_bound(uth) &&
641*8d741a5dSApple OSS Distributions 	    (old_bucket > new_bucket || force_run)) {
642*8d741a5dSApple OSS Distributions 		int flags = WORKQ_THREADREQ_CAN_CREATE_THREADS;
643*8d741a5dSApple OSS Distributions 		if (old_bucket > new_bucket) {
644*8d741a5dSApple OSS Distributions 			/*
645*8d741a5dSApple OSS Distributions 			 * When lowering our bucket, we may unblock a thread request,
646*8d741a5dSApple OSS Distributions 			 * but we can't drop our priority before we have evaluated
647*8d741a5dSApple OSS Distributions 			 * whether this is the case, and if we ever drop the workqueue lock
648*8d741a5dSApple OSS Distributions 			 * that would cause a priority inversion.
649*8d741a5dSApple OSS Distributions 			 *
650*8d741a5dSApple OSS Distributions 			 * We hence have to disallow thread creation in that case.
651*8d741a5dSApple OSS Distributions 			 */
652*8d741a5dSApple OSS Distributions 			flags = 0;
653*8d741a5dSApple OSS Distributions 		}
654*8d741a5dSApple OSS Distributions 		workq_schedule_creator(p, wq, flags);
655*8d741a5dSApple OSS Distributions 	}
656*8d741a5dSApple OSS Distributions }
657*8d741a5dSApple OSS Distributions 
658*8d741a5dSApple OSS Distributions /*
659*8d741a5dSApple OSS Distributions  * Sets/resets the cpu percent limits on the current thread. We can't set
660*8d741a5dSApple OSS Distributions  * these limits from outside of the current thread, so this function needs
661*8d741a5dSApple OSS Distributions  * to be called when we're executing on the intended
662*8d741a5dSApple OSS Distributions  */
663*8d741a5dSApple OSS Distributions static void
workq_thread_reset_cpupercent(workq_threadreq_t req,struct uthread * uth)664*8d741a5dSApple OSS Distributions workq_thread_reset_cpupercent(workq_threadreq_t req, struct uthread *uth)
665*8d741a5dSApple OSS Distributions {
666*8d741a5dSApple OSS Distributions 	assert(uth == current_uthread());
667*8d741a5dSApple OSS Distributions 	workq_threadreq_param_t trp = { };
668*8d741a5dSApple OSS Distributions 
669*8d741a5dSApple OSS Distributions 	if (req && (req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS)) {
670*8d741a5dSApple OSS Distributions 		trp = kqueue_threadreq_workloop_param(req);
671*8d741a5dSApple OSS Distributions 	}
672*8d741a5dSApple OSS Distributions 
673*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_CPUPERCENT) {
674*8d741a5dSApple OSS Distributions 		/*
675*8d741a5dSApple OSS Distributions 		 * Going through disable when we have an existing CPU percent limit
676*8d741a5dSApple OSS Distributions 		 * set will force the ledger to refill the token bucket of the current
677*8d741a5dSApple OSS Distributions 		 * thread. Removing any penalty applied by previous thread use.
678*8d741a5dSApple OSS Distributions 		 */
679*8d741a5dSApple OSS Distributions 		thread_set_cpulimit(THREAD_CPULIMIT_DISABLE, 0, 0);
680*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags &= ~UT_WORKQ_CPUPERCENT;
681*8d741a5dSApple OSS Distributions 	}
682*8d741a5dSApple OSS Distributions 
683*8d741a5dSApple OSS Distributions 	if (trp.trp_flags & TRP_CPUPERCENT) {
684*8d741a5dSApple OSS Distributions 		thread_set_cpulimit(THREAD_CPULIMIT_BLOCK, trp.trp_cpupercent,
685*8d741a5dSApple OSS Distributions 		    (uint64_t)trp.trp_refillms * NSEC_PER_SEC);
686*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_CPUPERCENT;
687*8d741a5dSApple OSS Distributions 	}
688*8d741a5dSApple OSS Distributions }
689*8d741a5dSApple OSS Distributions 
/*
 * Resets the workqueue policy, scheduling priority/policy and (with
 * CONFIG_PREADOPT_TG) the preadopt thread group of `uth` for servicing `req`.
 *
 * `req` may be NULL, in which case WORKQ_THREAD_QOS_CLEANUP is used as the
 * QoS. When `unpark` is true the workloop parameters and QoS are also saved
 * in the thread's park data.
 *
 * This function is always called with the workq lock, except for the
 * permanently bound workqueue thread, which instead requires the kqlock.
 * See locking model for bound thread's uu_workq_flags.
 */
static void
workq_thread_reset_pri(struct workqueue *wq, struct uthread *uth,
    workq_threadreq_t req, bool unpark)
{
	thread_t th = get_machthread(uth);
	thread_qos_t qos = req ? req->tr_qos : WORKQ_THREAD_QOS_CLEANUP;
	workq_threadreq_param_t trp = { };
	/* Defaults used unless the request's workloop params override them. */
	int priority = 31;
	int policy = POLICY_TIMESHARE;

	if (req && (req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS)) {
		trp = kqueue_threadreq_workloop_param(req);
	}

	uth->uu_workq_pri = WORKQ_POLICY_INIT(qos);
	uth->uu_workq_flags &= ~UT_WORKQ_OUTSIDE_QOS;

	if (unpark) {
		uth->uu_save.uus_workq_park_data.workloop_params = trp.trp_value;
		// qos sent out to userspace (may differ from uu_workq_pri on param threads)
		uth->uu_save.uus_workq_park_data.qos = qos;
	}

	if (qos == WORKQ_THREAD_QOS_MANAGER) {
		uint32_t mgr_pri = wq->wq_event_manager_priority;
		assert(trp.trp_value == 0); // manager qos and thread policy don't mix

		if (_pthread_priority_has_sched_pri(mgr_pri)) {
			mgr_pri &= _PTHREAD_PRIORITY_SCHED_PRI_MASK;
			thread_set_workq_pri(th, THREAD_QOS_UNSPECIFIED, mgr_pri,
			    POLICY_TIMESHARE);
			/*
			 * NOTE(review): this early return bypasses the
			 * CONFIG_PREADOPT_TG handling below, so a preadopt thread
			 * group already set on the thread is left untouched on
			 * this path -- confirm that this is intended.
			 */
			return;
		}

		qos = _pthread_priority_thread_qos(mgr_pri);
	} else {
		if (trp.trp_flags & TRP_PRIORITY) {
			/* An explicit scheduler priority replaces the QoS. */
			qos = THREAD_QOS_UNSPECIFIED;
			priority = trp.trp_pri;
			uth->uu_workq_flags |= UT_WORKQ_OUTSIDE_QOS;
		}

		if (trp.trp_flags & TRP_POLICY) {
			policy = trp.trp_pol;
		}
	}

#if CONFIG_PREADOPT_TG
	if (req && (req->tr_flags & WORKQ_TR_FLAG_WORKLOOP)) {
		/*
		 * For kqwl permanently configured with a thread group, we can safely borrow
		 * +1 ref from kqwl_preadopt_tg. A thread then takes additional +1 ref
		 * for itself via thread_set_preadopt_thread_group.
		 *
		 * In all other cases, we cannot safely read and borrow the reference from the kqwl
		 * since it can disappear from under us at any time due to the max-ing logic in
		 * kqueue_set_preadopted_thread_group.
		 *
		 * As such, we do the following dance:
		 *
		 * 1) cmpxchg and steal the kqwl's preadopt thread group and leave
		 * behind (NULL + QoS). At this point, we have the reference
		 * to the thread group from the kqwl.
		 * 2) Have the thread set the preadoption thread group on itself.
		 * 3) cmpxchg from (NULL + QoS) which we set earlier in (1), back to
		 * thread_group + QoS. ie we try to give the reference back to the kqwl.
		 * If we fail, that's because a higher QoS thread group was set on the
		 * kqwl in kqueue_set_preadopted_thread_group in which case, we need to
		 * go back to (1).
		 */

		_Atomic(struct thread_group *) * tg_loc = kqr_preadopt_thread_group_addr(req);

		thread_group_qos_t old_tg, new_tg;
		int ret = 0;
again:
		/* Step (1): try to steal the thread group, leaving only the QoS bits. */
		ret = os_atomic_rmw_loop(tg_loc, old_tg, new_tg, relaxed, {
			if ((!KQWL_HAS_VALID_PREADOPTED_TG(old_tg)) ||
			KQWL_HAS_PERMANENT_PREADOPTED_TG(old_tg)) {
			        os_atomic_rmw_loop_give_up(break);
			}

			/*
			 * Leave the QoS behind - kqueue_set_preadopted_thread_group will
			 * only modify it if there is a higher QoS thread group to attach
			 */
			new_tg = (thread_group_qos_t) ((uintptr_t) old_tg & KQWL_PREADOPT_TG_QOS_MASK);
		});

		if (ret) {
			/*
			 * We successfully took the ref from the kqwl so set it on the
			 * thread now
			 */
			thread_set_preadopt_thread_group(th, KQWL_GET_PREADOPTED_TG(old_tg));

			/*
			 * Remember both values before the next loop reuses old_tg and
			 * new_tg as its scratch variables.
			 */
			thread_group_qos_t thread_group_to_expect = new_tg;
			thread_group_qos_t thread_group_to_set = old_tg;

			/* Step (3): try to hand the reference back to the kqwl. */
			os_atomic_rmw_loop(tg_loc, old_tg, new_tg, relaxed, {
				if (old_tg != thread_group_to_expect) {
				        /*
				         * There was an intervening write to the kqwl_preadopt_tg,
				         * and it has a higher QoS than what we are working with
				         * here. Abandon our current adopted thread group and redo
				         * the full dance
				         */
				        thread_group_deallocate_safe(KQWL_GET_PREADOPTED_TG(thread_group_to_set));
				        os_atomic_rmw_loop_give_up(goto again);
				}

				new_tg = thread_group_to_set;
			});
		} else {
			/*
			 * The first loop gave up; old_tg is presumably the value it
			 * last observed on the kqwl.
			 */
			if (KQWL_HAS_PERMANENT_PREADOPTED_TG(old_tg)) {
				thread_set_preadopt_thread_group(th, KQWL_GET_PREADOPTED_TG(old_tg));
			} else {
				/* Nothing valid on the kqwl, just clear what's on the thread */
				thread_set_preadopt_thread_group(th, NULL);
			}
		}
	} else {
		/* Not even a kqwl, clear what's on the thread */
		thread_set_preadopt_thread_group(th, NULL);
	}
#endif
	thread_set_workq_pri(th, qos, priority, policy);
}
823*8d741a5dSApple OSS Distributions 
824*8d741a5dSApple OSS Distributions /*
825*8d741a5dSApple OSS Distributions  * Called by kevent with the NOTE_WL_THREAD_REQUEST knote lock held,
826*8d741a5dSApple OSS Distributions  * every time a servicer is being told about a new max QoS.
827*8d741a5dSApple OSS Distributions  */
828*8d741a5dSApple OSS Distributions void
workq_thread_set_max_qos(struct proc * p,workq_threadreq_t kqr)829*8d741a5dSApple OSS Distributions workq_thread_set_max_qos(struct proc *p, workq_threadreq_t kqr)
830*8d741a5dSApple OSS Distributions {
831*8d741a5dSApple OSS Distributions 	struct uu_workq_policy old_pri, new_pri;
832*8d741a5dSApple OSS Distributions 	struct uthread *uth = current_uthread();
833*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
834*8d741a5dSApple OSS Distributions 	thread_qos_t qos = kqr->tr_kq_qos_index;
835*8d741a5dSApple OSS Distributions 
836*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_pri.qos_max == qos) {
837*8d741a5dSApple OSS Distributions 		return;
838*8d741a5dSApple OSS Distributions 	}
839*8d741a5dSApple OSS Distributions 
840*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
841*8d741a5dSApple OSS Distributions 	old_pri = new_pri = uth->uu_workq_pri;
842*8d741a5dSApple OSS Distributions 	new_pri.qos_max = qos;
843*8d741a5dSApple OSS Distributions 	workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, false);
844*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
845*8d741a5dSApple OSS Distributions }
846*8d741a5dSApple OSS Distributions 
847*8d741a5dSApple OSS Distributions #pragma mark idle threads accounting and handling
848*8d741a5dSApple OSS Distributions 
849*8d741a5dSApple OSS Distributions static inline struct uthread *
workq_oldest_killable_idle_thread(struct workqueue * wq)850*8d741a5dSApple OSS Distributions workq_oldest_killable_idle_thread(struct workqueue *wq)
851*8d741a5dSApple OSS Distributions {
852*8d741a5dSApple OSS Distributions 	struct uthread *uth = TAILQ_LAST(&wq->wq_thidlelist, workq_uthread_head);
853*8d741a5dSApple OSS Distributions 
854*8d741a5dSApple OSS Distributions 	if (uth && !uth->uu_save.uus_workq_park_data.has_stack) {
855*8d741a5dSApple OSS Distributions 		uth = TAILQ_PREV(uth, workq_uthread_head, uu_workq_entry);
856*8d741a5dSApple OSS Distributions 		if (uth) {
857*8d741a5dSApple OSS Distributions 			assert(uth->uu_save.uus_workq_park_data.has_stack);
858*8d741a5dSApple OSS Distributions 		}
859*8d741a5dSApple OSS Distributions 	}
860*8d741a5dSApple OSS Distributions 	return uth;
861*8d741a5dSApple OSS Distributions }
862*8d741a5dSApple OSS Distributions 
863*8d741a5dSApple OSS Distributions static inline uint64_t
workq_kill_delay_for_idle_thread(struct workqueue * wq)864*8d741a5dSApple OSS Distributions workq_kill_delay_for_idle_thread(struct workqueue *wq)
865*8d741a5dSApple OSS Distributions {
866*8d741a5dSApple OSS Distributions 	uint64_t delay = wq_reduce_pool_window.abstime;
867*8d741a5dSApple OSS Distributions 	uint16_t idle = wq->wq_thidlecount;
868*8d741a5dSApple OSS Distributions 
869*8d741a5dSApple OSS Distributions 	/*
870*8d741a5dSApple OSS Distributions 	 * If we have less than wq_death_max_load threads, have a 5s timer.
871*8d741a5dSApple OSS Distributions 	 *
872*8d741a5dSApple OSS Distributions 	 * For the next wq_max_constrained_threads ones, decay linearly from
873*8d741a5dSApple OSS Distributions 	 * from 5s to 50ms.
874*8d741a5dSApple OSS Distributions 	 */
875*8d741a5dSApple OSS Distributions 	if (idle <= wq_death_max_load) {
876*8d741a5dSApple OSS Distributions 		return delay;
877*8d741a5dSApple OSS Distributions 	}
878*8d741a5dSApple OSS Distributions 
879*8d741a5dSApple OSS Distributions 	if (wq_max_constrained_threads > idle - wq_death_max_load) {
880*8d741a5dSApple OSS Distributions 		delay *= (wq_max_constrained_threads - (idle - wq_death_max_load));
881*8d741a5dSApple OSS Distributions 	}
882*8d741a5dSApple OSS Distributions 	return delay / wq_max_constrained_threads;
883*8d741a5dSApple OSS Distributions }
884*8d741a5dSApple OSS Distributions 
885*8d741a5dSApple OSS Distributions static inline bool
workq_should_kill_idle_thread(struct workqueue * wq,struct uthread * uth,uint64_t now)886*8d741a5dSApple OSS Distributions workq_should_kill_idle_thread(struct workqueue *wq, struct uthread *uth,
887*8d741a5dSApple OSS Distributions     uint64_t now)
888*8d741a5dSApple OSS Distributions {
889*8d741a5dSApple OSS Distributions 	uint64_t delay = workq_kill_delay_for_idle_thread(wq);
890*8d741a5dSApple OSS Distributions 	return now - uth->uu_save.uus_workq_park_data.idle_stamp > delay;
891*8d741a5dSApple OSS Distributions }
892*8d741a5dSApple OSS Distributions 
893*8d741a5dSApple OSS Distributions static void
workq_death_call_schedule(struct workqueue * wq,uint64_t deadline)894*8d741a5dSApple OSS Distributions workq_death_call_schedule(struct workqueue *wq, uint64_t deadline)
895*8d741a5dSApple OSS Distributions {
896*8d741a5dSApple OSS Distributions 	uint32_t wq_flags = os_atomic_load(&wq->wq_flags, relaxed);
897*8d741a5dSApple OSS Distributions 
898*8d741a5dSApple OSS Distributions 	if (wq_flags & (WQ_EXITING | WQ_DEATH_CALL_SCHEDULED)) {
899*8d741a5dSApple OSS Distributions 		return;
900*8d741a5dSApple OSS Distributions 	}
901*8d741a5dSApple OSS Distributions 	os_atomic_or(&wq->wq_flags, WQ_DEATH_CALL_SCHEDULED, relaxed);
902*8d741a5dSApple OSS Distributions 
903*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_death_call | DBG_FUNC_NONE, wq, 1, 0, 0);
904*8d741a5dSApple OSS Distributions 
905*8d741a5dSApple OSS Distributions 	/*
906*8d741a5dSApple OSS Distributions 	 * <rdar://problem/13139182> Due to how long term timers work, the leeway
907*8d741a5dSApple OSS Distributions 	 * can't be too short, so use 500ms which is long enough that we will not
908*8d741a5dSApple OSS Distributions 	 * wake up the CPU for killing threads, but short enough that it doesn't
909*8d741a5dSApple OSS Distributions 	 * fall into long-term timer list shenanigans.
910*8d741a5dSApple OSS Distributions 	 */
911*8d741a5dSApple OSS Distributions 	thread_call_enter_delayed_with_leeway(wq->wq_death_call, NULL, deadline,
912*8d741a5dSApple OSS Distributions 	    wq_reduce_pool_window.abstime / 10,
913*8d741a5dSApple OSS Distributions 	    THREAD_CALL_DELAY_LEEWAY | THREAD_CALL_DELAY_USER_BACKGROUND);
914*8d741a5dSApple OSS Distributions }
915*8d741a5dSApple OSS Distributions 
916*8d741a5dSApple OSS Distributions /*
917*8d741a5dSApple OSS Distributions  * `decrement` is set to the number of threads that are no longer dying:
918*8d741a5dSApple OSS Distributions  * - because they have been resuscitated just in time (workq_pop_idle_thread)
919*8d741a5dSApple OSS Distributions  * - or have been killed (workq_thread_terminate).
920*8d741a5dSApple OSS Distributions  */
921*8d741a5dSApple OSS Distributions static void
workq_death_policy_evaluate(struct workqueue * wq,uint16_t decrement)922*8d741a5dSApple OSS Distributions workq_death_policy_evaluate(struct workqueue *wq, uint16_t decrement)
923*8d741a5dSApple OSS Distributions {
924*8d741a5dSApple OSS Distributions 	struct uthread *uth;
925*8d741a5dSApple OSS Distributions 
926*8d741a5dSApple OSS Distributions 	assert(wq->wq_thdying_count >= decrement);
927*8d741a5dSApple OSS Distributions 	if ((wq->wq_thdying_count -= decrement) > 0) {
928*8d741a5dSApple OSS Distributions 		return;
929*8d741a5dSApple OSS Distributions 	}
930*8d741a5dSApple OSS Distributions 
931*8d741a5dSApple OSS Distributions 	if (wq->wq_thidlecount <= 1) {
932*8d741a5dSApple OSS Distributions 		return;
933*8d741a5dSApple OSS Distributions 	}
934*8d741a5dSApple OSS Distributions 
935*8d741a5dSApple OSS Distributions 	if ((uth = workq_oldest_killable_idle_thread(wq)) == NULL) {
936*8d741a5dSApple OSS Distributions 		return;
937*8d741a5dSApple OSS Distributions 	}
938*8d741a5dSApple OSS Distributions 
939*8d741a5dSApple OSS Distributions 	uint64_t now = mach_absolute_time();
940*8d741a5dSApple OSS Distributions 	uint64_t delay = workq_kill_delay_for_idle_thread(wq);
941*8d741a5dSApple OSS Distributions 
942*8d741a5dSApple OSS Distributions 	if (now - uth->uu_save.uus_workq_park_data.idle_stamp > delay) {
943*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_terminate | DBG_FUNC_START,
944*8d741a5dSApple OSS Distributions 		    wq, wq->wq_thidlecount, 0, 0);
945*8d741a5dSApple OSS Distributions 		wq->wq_thdying_count++;
946*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
947*8d741a5dSApple OSS Distributions 		if ((uth->uu_workq_flags & UT_WORKQ_IDLE_CLEANUP) == 0) {
948*8d741a5dSApple OSS Distributions 			workq_thread_wakeup(uth);
949*8d741a5dSApple OSS Distributions 		}
950*8d741a5dSApple OSS Distributions 		return;
951*8d741a5dSApple OSS Distributions 	}
952*8d741a5dSApple OSS Distributions 
953*8d741a5dSApple OSS Distributions 	workq_death_call_schedule(wq,
954*8d741a5dSApple OSS Distributions 	    uth->uu_save.uus_workq_park_data.idle_stamp + delay);
955*8d741a5dSApple OSS Distributions }
956*8d741a5dSApple OSS Distributions 
957*8d741a5dSApple OSS Distributions void
workq_thread_terminate(struct proc * p,struct uthread * uth)958*8d741a5dSApple OSS Distributions workq_thread_terminate(struct proc *p, struct uthread *uth)
959*8d741a5dSApple OSS Distributions {
960*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
961*8d741a5dSApple OSS Distributions 
962*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
963*8d741a5dSApple OSS Distributions 	if (!workq_thread_is_permanently_bound(uth)) {
964*8d741a5dSApple OSS Distributions 		TAILQ_REMOVE(&wq->wq_thrunlist, uth, uu_workq_entry);
965*8d741a5dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_DYING) {
966*8d741a5dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_thread_terminate | DBG_FUNC_END,
967*8d741a5dSApple OSS Distributions 			    wq, wq->wq_thidlecount, 0, 0);
968*8d741a5dSApple OSS Distributions 			workq_death_policy_evaluate(wq, 1);
969*8d741a5dSApple OSS Distributions 		}
970*8d741a5dSApple OSS Distributions 	}
971*8d741a5dSApple OSS Distributions 	if (wq->wq_nthreads-- == wq_max_threads) {
972*8d741a5dSApple OSS Distributions 		/*
973*8d741a5dSApple OSS Distributions 		 * We got under the thread limit again, which may have prevented
974*8d741a5dSApple OSS Distributions 		 * thread creation from happening, redrive if there are pending requests
975*8d741a5dSApple OSS Distributions 		 */
976*8d741a5dSApple OSS Distributions 		if (wq->wq_reqcount) {
977*8d741a5dSApple OSS Distributions 			workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
978*8d741a5dSApple OSS Distributions 		}
979*8d741a5dSApple OSS Distributions 	}
980*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
981*8d741a5dSApple OSS Distributions 
982*8d741a5dSApple OSS Distributions 	thread_deallocate(get_machthread(uth));
983*8d741a5dSApple OSS Distributions }
984*8d741a5dSApple OSS Distributions 
985*8d741a5dSApple OSS Distributions static void
workq_kill_old_threads_call(void * param0,void * param1 __unused)986*8d741a5dSApple OSS Distributions workq_kill_old_threads_call(void *param0, void *param1 __unused)
987*8d741a5dSApple OSS Distributions {
988*8d741a5dSApple OSS Distributions 	struct workqueue *wq = param0;
989*8d741a5dSApple OSS Distributions 
990*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
991*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_death_call | DBG_FUNC_START, wq, 0, 0, 0);
992*8d741a5dSApple OSS Distributions 	os_atomic_andnot(&wq->wq_flags, WQ_DEATH_CALL_SCHEDULED, relaxed);
993*8d741a5dSApple OSS Distributions 	workq_death_policy_evaluate(wq, 0);
994*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_death_call | DBG_FUNC_END, wq, 0, 0, 0);
995*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
996*8d741a5dSApple OSS Distributions }
997*8d741a5dSApple OSS Distributions 
998*8d741a5dSApple OSS Distributions static struct uthread *
workq_pop_idle_thread(struct workqueue * wq,uint16_t uu_flags,bool * needs_wakeup)999*8d741a5dSApple OSS Distributions workq_pop_idle_thread(struct workqueue *wq, uint16_t uu_flags,
1000*8d741a5dSApple OSS Distributions     bool *needs_wakeup)
1001*8d741a5dSApple OSS Distributions {
1002*8d741a5dSApple OSS Distributions 	struct uthread *uth;
1003*8d741a5dSApple OSS Distributions 
1004*8d741a5dSApple OSS Distributions 	if ((uth = TAILQ_FIRST(&wq->wq_thidlelist))) {
1005*8d741a5dSApple OSS Distributions 		TAILQ_REMOVE(&wq->wq_thidlelist, uth, uu_workq_entry);
1006*8d741a5dSApple OSS Distributions 	} else {
1007*8d741a5dSApple OSS Distributions 		uth = TAILQ_FIRST(&wq->wq_thnewlist);
1008*8d741a5dSApple OSS Distributions 		TAILQ_REMOVE(&wq->wq_thnewlist, uth, uu_workq_entry);
1009*8d741a5dSApple OSS Distributions 	}
1010*8d741a5dSApple OSS Distributions 	TAILQ_INSERT_TAIL(&wq->wq_thrunlist, uth, uu_workq_entry);
1011*8d741a5dSApple OSS Distributions 
1012*8d741a5dSApple OSS Distributions 	assert((uth->uu_workq_flags & UT_WORKQ_RUNNING) == 0);
1013*8d741a5dSApple OSS Distributions 	uth->uu_workq_flags |= UT_WORKQ_RUNNING | uu_flags;
1014*8d741a5dSApple OSS Distributions 
1015*8d741a5dSApple OSS Distributions 	/* A thread is never woken up as part of the cooperative pool */
1016*8d741a5dSApple OSS Distributions 	assert((uu_flags & UT_WORKQ_COOPERATIVE) == 0);
1017*8d741a5dSApple OSS Distributions 
1018*8d741a5dSApple OSS Distributions 	if ((uu_flags & UT_WORKQ_OVERCOMMIT) == 0) {
1019*8d741a5dSApple OSS Distributions 		wq->wq_constrained_threads_scheduled++;
1020*8d741a5dSApple OSS Distributions 	}
1021*8d741a5dSApple OSS Distributions 	wq->wq_threads_scheduled++;
1022*8d741a5dSApple OSS Distributions 	wq->wq_thidlecount--;
1023*8d741a5dSApple OSS Distributions 
1024*8d741a5dSApple OSS Distributions 	if (__improbable(uth->uu_workq_flags & UT_WORKQ_DYING)) {
1025*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags ^= UT_WORKQ_DYING;
1026*8d741a5dSApple OSS Distributions 		workq_death_policy_evaluate(wq, 1);
1027*8d741a5dSApple OSS Distributions 		*needs_wakeup = false;
1028*8d741a5dSApple OSS Distributions 	} else if (uth->uu_workq_flags & UT_WORKQ_IDLE_CLEANUP) {
1029*8d741a5dSApple OSS Distributions 		*needs_wakeup = false;
1030*8d741a5dSApple OSS Distributions 	} else {
1031*8d741a5dSApple OSS Distributions 		*needs_wakeup = true;
1032*8d741a5dSApple OSS Distributions 	}
1033*8d741a5dSApple OSS Distributions 	return uth;
1034*8d741a5dSApple OSS Distributions }
1035*8d741a5dSApple OSS Distributions 
1036*8d741a5dSApple OSS Distributions /*
1037*8d741a5dSApple OSS Distributions  * Called by thread_create_workq_waiting() during thread initialization, before
1038*8d741a5dSApple OSS Distributions  * assert_wait, before the thread has been started.
1039*8d741a5dSApple OSS Distributions  */
1040*8d741a5dSApple OSS Distributions event_t
workq_thread_init_and_wq_lock(task_t task,thread_t th)1041*8d741a5dSApple OSS Distributions workq_thread_init_and_wq_lock(task_t task, thread_t th)
1042*8d741a5dSApple OSS Distributions {
1043*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
1044*8d741a5dSApple OSS Distributions 
1045*8d741a5dSApple OSS Distributions 	uth->uu_workq_flags = UT_WORKQ_NEW;
1046*8d741a5dSApple OSS Distributions 	uth->uu_workq_pri = WORKQ_POLICY_INIT(THREAD_QOS_LEGACY);
1047*8d741a5dSApple OSS Distributions 	uth->uu_workq_thport = MACH_PORT_NULL;
1048*8d741a5dSApple OSS Distributions 	uth->uu_workq_stackaddr = 0;
1049*8d741a5dSApple OSS Distributions 	uth->uu_workq_pthread_kill_allowed = 0;
1050*8d741a5dSApple OSS Distributions 
1051*8d741a5dSApple OSS Distributions 	thread_set_tag(th, THREAD_TAG_PTHREAD | THREAD_TAG_WORKQUEUE);
1052*8d741a5dSApple OSS Distributions 	thread_reset_workq_qos(th, THREAD_QOS_LEGACY);
1053*8d741a5dSApple OSS Distributions 
1054*8d741a5dSApple OSS Distributions 	workq_lock_spin(proc_get_wqptr_fast(get_bsdtask_info(task)));
1055*8d741a5dSApple OSS Distributions 	return workq_parked_wait_event(uth);
1056*8d741a5dSApple OSS Distributions }
1057*8d741a5dSApple OSS Distributions 
1058*8d741a5dSApple OSS Distributions /**
1059*8d741a5dSApple OSS Distributions  * Try to add a new workqueue thread.
1060*8d741a5dSApple OSS Distributions  *
1061*8d741a5dSApple OSS Distributions  * - called with workq lock held
1062*8d741a5dSApple OSS Distributions  * - dropped and retaken around thread creation
1063*8d741a5dSApple OSS Distributions  * - return with workq lock held
1064*8d741a5dSApple OSS Distributions  */
1065*8d741a5dSApple OSS Distributions static kern_return_t
workq_add_new_idle_thread(proc_t p,struct workqueue * wq,thread_continue_t continuation,bool is_permanently_bound,thread_t * new_thread)1066*8d741a5dSApple OSS Distributions workq_add_new_idle_thread(
1067*8d741a5dSApple OSS Distributions 	proc_t             p,
1068*8d741a5dSApple OSS Distributions 	struct workqueue  *wq,
1069*8d741a5dSApple OSS Distributions 	thread_continue_t continuation,
1070*8d741a5dSApple OSS Distributions 	bool              is_permanently_bound,
1071*8d741a5dSApple OSS Distributions 	thread_t          *new_thread)
1072*8d741a5dSApple OSS Distributions {
1073*8d741a5dSApple OSS Distributions 	mach_vm_offset_t th_stackaddr;
1074*8d741a5dSApple OSS Distributions 	kern_return_t kret;
1075*8d741a5dSApple OSS Distributions 	thread_t th;
1076*8d741a5dSApple OSS Distributions 
1077*8d741a5dSApple OSS Distributions 	wq->wq_nthreads++;
1078*8d741a5dSApple OSS Distributions 
1079*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
1080*8d741a5dSApple OSS Distributions 
1081*8d741a5dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
1082*8d741a5dSApple OSS Distributions 
1083*8d741a5dSApple OSS Distributions 	kret = pthread_functions->workq_create_threadstack(p, vmap, &th_stackaddr);
1084*8d741a5dSApple OSS Distributions 	if (kret != KERN_SUCCESS) {
1085*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_create_failed | DBG_FUNC_NONE, wq,
1086*8d741a5dSApple OSS Distributions 		    kret, 1, 0);
1087*8d741a5dSApple OSS Distributions 		goto out;
1088*8d741a5dSApple OSS Distributions 	}
1089*8d741a5dSApple OSS Distributions 
1090*8d741a5dSApple OSS Distributions 	kret = thread_create_workq_waiting(proc_task(p),
1091*8d741a5dSApple OSS Distributions 	    continuation,
1092*8d741a5dSApple OSS Distributions 	    &th,
1093*8d741a5dSApple OSS Distributions 	    is_permanently_bound);
1094*8d741a5dSApple OSS Distributions 	if (kret != KERN_SUCCESS) {
1095*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_create_failed | DBG_FUNC_NONE, wq,
1096*8d741a5dSApple OSS Distributions 		    kret, 0, 0);
1097*8d741a5dSApple OSS Distributions 		pthread_functions->workq_destroy_threadstack(p, vmap, th_stackaddr);
1098*8d741a5dSApple OSS Distributions 		goto out;
1099*8d741a5dSApple OSS Distributions 	}
1100*8d741a5dSApple OSS Distributions 
1101*8d741a5dSApple OSS Distributions 	// thread_create_workq_waiting() will return with the wq lock held
1102*8d741a5dSApple OSS Distributions 	// on success, because it calls workq_thread_init_and_wq_lock() above
1103*8d741a5dSApple OSS Distributions 
1104*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
1105*8d741a5dSApple OSS Distributions 	uth->uu_workq_stackaddr = (user_addr_t)th_stackaddr;
1106*8d741a5dSApple OSS Distributions 
1107*8d741a5dSApple OSS Distributions 	wq->wq_creations++;
1108*8d741a5dSApple OSS Distributions 	if (!is_permanently_bound) {
1109*8d741a5dSApple OSS Distributions 		wq->wq_thidlecount++;
1110*8d741a5dSApple OSS Distributions 		TAILQ_INSERT_TAIL(&wq->wq_thnewlist, uth, uu_workq_entry);
1111*8d741a5dSApple OSS Distributions 	}
1112*8d741a5dSApple OSS Distributions 
1113*8d741a5dSApple OSS Distributions 	if (new_thread) {
1114*8d741a5dSApple OSS Distributions 		*new_thread = th;
1115*8d741a5dSApple OSS Distributions 	}
1116*8d741a5dSApple OSS Distributions 
1117*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_create | DBG_FUNC_NONE, wq, 0, 0, 0);
1118*8d741a5dSApple OSS Distributions 	return kret;
1119*8d741a5dSApple OSS Distributions 
1120*8d741a5dSApple OSS Distributions out:
1121*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
1122*8d741a5dSApple OSS Distributions 	/*
1123*8d741a5dSApple OSS Distributions 	 * Do not redrive here if we went under wq_max_threads again,
1124*8d741a5dSApple OSS Distributions 	 * it is the responsibility of the callers of this function
1125*8d741a5dSApple OSS Distributions 	 * to do so when it fails.
1126*8d741a5dSApple OSS Distributions 	 */
1127*8d741a5dSApple OSS Distributions 	wq->wq_nthreads--;
1128*8d741a5dSApple OSS Distributions 	return kret;
1129*8d741a5dSApple OSS Distributions }
1130*8d741a5dSApple OSS Distributions 
1131*8d741a5dSApple OSS Distributions static inline bool
workq_thread_is_overcommit(struct uthread * uth)1132*8d741a5dSApple OSS Distributions workq_thread_is_overcommit(struct uthread *uth)
1133*8d741a5dSApple OSS Distributions {
1134*8d741a5dSApple OSS Distributions 	return (uth->uu_workq_flags & UT_WORKQ_OVERCOMMIT) != 0;
1135*8d741a5dSApple OSS Distributions }
1136*8d741a5dSApple OSS Distributions 
1137*8d741a5dSApple OSS Distributions static inline bool
workq_thread_is_nonovercommit(struct uthread * uth)1138*8d741a5dSApple OSS Distributions workq_thread_is_nonovercommit(struct uthread *uth)
1139*8d741a5dSApple OSS Distributions {
1140*8d741a5dSApple OSS Distributions 	return (uth->uu_workq_flags & (UT_WORKQ_OVERCOMMIT |
1141*8d741a5dSApple OSS Distributions 	       UT_WORKQ_COOPERATIVE)) == 0;
1142*8d741a5dSApple OSS Distributions }
1143*8d741a5dSApple OSS Distributions 
1144*8d741a5dSApple OSS Distributions static inline bool
workq_thread_is_cooperative(struct uthread * uth)1145*8d741a5dSApple OSS Distributions workq_thread_is_cooperative(struct uthread *uth)
1146*8d741a5dSApple OSS Distributions {
1147*8d741a5dSApple OSS Distributions 	return (uth->uu_workq_flags & UT_WORKQ_COOPERATIVE) != 0;
1148*8d741a5dSApple OSS Distributions }
1149*8d741a5dSApple OSS Distributions 
1150*8d741a5dSApple OSS Distributions bool
workq_thread_is_permanently_bound(struct uthread * uth)1151*8d741a5dSApple OSS Distributions workq_thread_is_permanently_bound(struct uthread *uth)
1152*8d741a5dSApple OSS Distributions {
1153*8d741a5dSApple OSS Distributions 	return (uth->uu_workq_flags & UT_WORKQ_PERMANENT_BIND) != 0;
1154*8d741a5dSApple OSS Distributions }
1155*8d741a5dSApple OSS Distributions 
1156*8d741a5dSApple OSS Distributions static inline void
workq_thread_set_type(struct uthread * uth,uint16_t flags)1157*8d741a5dSApple OSS Distributions workq_thread_set_type(struct uthread *uth, uint16_t flags)
1158*8d741a5dSApple OSS Distributions {
1159*8d741a5dSApple OSS Distributions 	uth->uu_workq_flags &= ~(UT_WORKQ_OVERCOMMIT | UT_WORKQ_COOPERATIVE);
1160*8d741a5dSApple OSS Distributions 	uth->uu_workq_flags |= flags;
1161*8d741a5dSApple OSS Distributions }
1162*8d741a5dSApple OSS Distributions 
1163*8d741a5dSApple OSS Distributions 
1164*8d741a5dSApple OSS Distributions #define WORKQ_UNPARK_FOR_DEATH_WAS_IDLE 0x1
1165*8d741a5dSApple OSS Distributions 
1166*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
1167*8d741a5dSApple OSS Distributions static void
workq_unpark_for_death_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t death_flags,uint32_t setup_flags)1168*8d741a5dSApple OSS Distributions workq_unpark_for_death_and_unlock(proc_t p, struct workqueue *wq,
1169*8d741a5dSApple OSS Distributions     struct uthread *uth, uint32_t death_flags, uint32_t setup_flags)
1170*8d741a5dSApple OSS Distributions {
1171*8d741a5dSApple OSS Distributions 	thread_qos_t qos = workq_pri_override(uth->uu_workq_pri);
1172*8d741a5dSApple OSS Distributions 	bool first_use = uth->uu_workq_flags & UT_WORKQ_NEW;
1173*8d741a5dSApple OSS Distributions 
1174*8d741a5dSApple OSS Distributions 	if (qos > WORKQ_THREAD_QOS_CLEANUP) {
1175*8d741a5dSApple OSS Distributions 		workq_thread_reset_pri(wq, uth, NULL, /*unpark*/ true);
1176*8d741a5dSApple OSS Distributions 		qos = WORKQ_THREAD_QOS_CLEANUP;
1177*8d741a5dSApple OSS Distributions 	}
1178*8d741a5dSApple OSS Distributions 
1179*8d741a5dSApple OSS Distributions 	workq_thread_reset_cpupercent(NULL, uth);
1180*8d741a5dSApple OSS Distributions 
1181*8d741a5dSApple OSS Distributions 	if (death_flags & WORKQ_UNPARK_FOR_DEATH_WAS_IDLE) {
1182*8d741a5dSApple OSS Distributions 		wq->wq_thidlecount--;
1183*8d741a5dSApple OSS Distributions 		if (first_use) {
1184*8d741a5dSApple OSS Distributions 			TAILQ_REMOVE(&wq->wq_thnewlist, uth, uu_workq_entry);
1185*8d741a5dSApple OSS Distributions 		} else {
1186*8d741a5dSApple OSS Distributions 			TAILQ_REMOVE(&wq->wq_thidlelist, uth, uu_workq_entry);
1187*8d741a5dSApple OSS Distributions 		}
1188*8d741a5dSApple OSS Distributions 	}
1189*8d741a5dSApple OSS Distributions 	TAILQ_INSERT_TAIL(&wq->wq_thrunlist, uth, uu_workq_entry);
1190*8d741a5dSApple OSS Distributions 
1191*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
1192*8d741a5dSApple OSS Distributions 
1193*8d741a5dSApple OSS Distributions 	if (setup_flags & WQ_SETUP_CLEAR_VOUCHER) {
1194*8d741a5dSApple OSS Distributions 		__assert_only kern_return_t kr;
1195*8d741a5dSApple OSS Distributions 		kr = thread_set_voucher_name(MACH_PORT_NULL);
1196*8d741a5dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
1197*8d741a5dSApple OSS Distributions 	}
1198*8d741a5dSApple OSS Distributions 
1199*8d741a5dSApple OSS Distributions 	uint32_t flags = WQ_FLAG_THREAD_NEWSPI | qos | WQ_FLAG_THREAD_PRIO_QOS;
1200*8d741a5dSApple OSS Distributions 	thread_t th = get_machthread(uth);
1201*8d741a5dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
1202*8d741a5dSApple OSS Distributions 
1203*8d741a5dSApple OSS Distributions 	if (!first_use) {
1204*8d741a5dSApple OSS Distributions 		flags |= WQ_FLAG_THREAD_REUSE;
1205*8d741a5dSApple OSS Distributions 	}
1206*8d741a5dSApple OSS Distributions 
1207*8d741a5dSApple OSS Distributions 	pthread_functions->workq_setup_thread(p, th, vmap, uth->uu_workq_stackaddr,
1208*8d741a5dSApple OSS Distributions 	    uth->uu_workq_thport, 0, WQ_SETUP_EXIT_THREAD, flags);
1209*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
1210*8d741a5dSApple OSS Distributions }
1211*8d741a5dSApple OSS Distributions 
1212*8d741a5dSApple OSS Distributions bool
workq_is_current_thread_updating_turnstile(struct workqueue * wq)1213*8d741a5dSApple OSS Distributions workq_is_current_thread_updating_turnstile(struct workqueue *wq)
1214*8d741a5dSApple OSS Distributions {
1215*8d741a5dSApple OSS Distributions 	return wq->wq_turnstile_updater == current_thread();
1216*8d741a5dSApple OSS Distributions }
1217*8d741a5dSApple OSS Distributions 
1218*8d741a5dSApple OSS Distributions __attribute__((always_inline))
1219*8d741a5dSApple OSS Distributions static inline void
1220*8d741a5dSApple OSS Distributions workq_perform_turnstile_operation_locked(struct workqueue *wq,
1221*8d741a5dSApple OSS Distributions     void (^operation)(void))
1222*8d741a5dSApple OSS Distributions {
1223*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
1224*8d741a5dSApple OSS Distributions 	wq->wq_turnstile_updater = current_thread();
1225*8d741a5dSApple OSS Distributions 	operation();
1226*8d741a5dSApple OSS Distributions 	wq->wq_turnstile_updater = THREAD_NULL;
1227*8d741a5dSApple OSS Distributions }
1228*8d741a5dSApple OSS Distributions 
1229*8d741a5dSApple OSS Distributions static void
workq_turnstile_update_inheritor(struct workqueue * wq,turnstile_inheritor_t inheritor,turnstile_update_flags_t flags)1230*8d741a5dSApple OSS Distributions workq_turnstile_update_inheritor(struct workqueue *wq,
1231*8d741a5dSApple OSS Distributions     turnstile_inheritor_t inheritor,
1232*8d741a5dSApple OSS Distributions     turnstile_update_flags_t flags)
1233*8d741a5dSApple OSS Distributions {
1234*8d741a5dSApple OSS Distributions 	if (wq->wq_inheritor == inheritor) {
1235*8d741a5dSApple OSS Distributions 		return;
1236*8d741a5dSApple OSS Distributions 	}
1237*8d741a5dSApple OSS Distributions 	wq->wq_inheritor = inheritor;
1238*8d741a5dSApple OSS Distributions 	workq_perform_turnstile_operation_locked(wq, ^{
1239*8d741a5dSApple OSS Distributions 		turnstile_update_inheritor(wq->wq_turnstile, inheritor,
1240*8d741a5dSApple OSS Distributions 		flags | TURNSTILE_IMMEDIATE_UPDATE);
1241*8d741a5dSApple OSS Distributions 		turnstile_update_inheritor_complete(wq->wq_turnstile,
1242*8d741a5dSApple OSS Distributions 		TURNSTILE_INTERLOCK_HELD);
1243*8d741a5dSApple OSS Distributions 	});
1244*8d741a5dSApple OSS Distributions }
1245*8d741a5dSApple OSS Distributions 
1246*8d741a5dSApple OSS Distributions static void
workq_push_idle_thread(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)1247*8d741a5dSApple OSS Distributions workq_push_idle_thread(proc_t p, struct workqueue *wq, struct uthread *uth,
1248*8d741a5dSApple OSS Distributions     uint32_t setup_flags)
1249*8d741a5dSApple OSS Distributions {
1250*8d741a5dSApple OSS Distributions 	uint64_t now = mach_absolute_time();
1251*8d741a5dSApple OSS Distributions 	bool is_creator = (uth == wq->wq_creator);
1252*8d741a5dSApple OSS Distributions 
1253*8d741a5dSApple OSS Distributions 	if (workq_thread_is_cooperative(uth)) {
1254*8d741a5dSApple OSS Distributions 		assert(!is_creator);
1255*8d741a5dSApple OSS Distributions 
1256*8d741a5dSApple OSS Distributions 		thread_qos_t thread_qos = uth->uu_workq_pri.qos_req;
1257*8d741a5dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_dec(wq, thread_qos);
1258*8d741a5dSApple OSS Distributions 
1259*8d741a5dSApple OSS Distributions 		/* Before we get here, we always go through
1260*8d741a5dSApple OSS Distributions 		 * workq_select_threadreq_or_park_and_unlock. If we got here, it means
1261*8d741a5dSApple OSS Distributions 		 * that we went through the logic in workq_threadreq_select which
1262*8d741a5dSApple OSS Distributions 		 * did the refresh for the next best cooperative qos while
1263*8d741a5dSApple OSS Distributions 		 * excluding the current thread - we shouldn't need to do it again.
1264*8d741a5dSApple OSS Distributions 		 */
1265*8d741a5dSApple OSS Distributions 		assert(_wq_cooperative_queue_refresh_best_req_qos(wq) == false);
1266*8d741a5dSApple OSS Distributions 	} else if (workq_thread_is_nonovercommit(uth)) {
1267*8d741a5dSApple OSS Distributions 		assert(!is_creator);
1268*8d741a5dSApple OSS Distributions 
1269*8d741a5dSApple OSS Distributions 		wq->wq_constrained_threads_scheduled--;
1270*8d741a5dSApple OSS Distributions 	}
1271*8d741a5dSApple OSS Distributions 
1272*8d741a5dSApple OSS Distributions 	uth->uu_workq_flags &= ~(UT_WORKQ_RUNNING | UT_WORKQ_OVERCOMMIT | UT_WORKQ_COOPERATIVE);
1273*8d741a5dSApple OSS Distributions 	TAILQ_REMOVE(&wq->wq_thrunlist, uth, uu_workq_entry);
1274*8d741a5dSApple OSS Distributions 	wq->wq_threads_scheduled--;
1275*8d741a5dSApple OSS Distributions 
1276*8d741a5dSApple OSS Distributions 	if (is_creator) {
1277*8d741a5dSApple OSS Distributions 		wq->wq_creator = NULL;
1278*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_select, wq, 3, 0,
1279*8d741a5dSApple OSS Distributions 		    uth->uu_save.uus_workq_park_data.yields);
1280*8d741a5dSApple OSS Distributions 	}
1281*8d741a5dSApple OSS Distributions 
1282*8d741a5dSApple OSS Distributions 	if (wq->wq_inheritor == get_machthread(uth)) {
1283*8d741a5dSApple OSS Distributions 		assert(wq->wq_creator == NULL);
1284*8d741a5dSApple OSS Distributions 		if (wq->wq_reqcount) {
1285*8d741a5dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, wq, TURNSTILE_INHERITOR_WORKQ);
1286*8d741a5dSApple OSS Distributions 		} else {
1287*8d741a5dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
1288*8d741a5dSApple OSS Distributions 		}
1289*8d741a5dSApple OSS Distributions 	}
1290*8d741a5dSApple OSS Distributions 
1291*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_NEW) {
1292*8d741a5dSApple OSS Distributions 		assert(is_creator || (_wq_flags(wq) & WQ_EXITING));
1293*8d741a5dSApple OSS Distributions 		TAILQ_INSERT_TAIL(&wq->wq_thnewlist, uth, uu_workq_entry);
1294*8d741a5dSApple OSS Distributions 		wq->wq_thidlecount++;
1295*8d741a5dSApple OSS Distributions 		return;
1296*8d741a5dSApple OSS Distributions 	}
1297*8d741a5dSApple OSS Distributions 
1298*8d741a5dSApple OSS Distributions 	if (!is_creator) {
1299*8d741a5dSApple OSS Distributions 		_wq_thactive_dec(wq, uth->uu_workq_pri.qos_bucket);
1300*8d741a5dSApple OSS Distributions 		wq->wq_thscheduled_count[_wq_bucket(uth->uu_workq_pri.qos_bucket)]--;
1301*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_IDLE_CLEANUP;
1302*8d741a5dSApple OSS Distributions 	}
1303*8d741a5dSApple OSS Distributions 
1304*8d741a5dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.idle_stamp = now;
1305*8d741a5dSApple OSS Distributions 
1306*8d741a5dSApple OSS Distributions 	struct uthread *oldest = workq_oldest_killable_idle_thread(wq);
1307*8d741a5dSApple OSS Distributions 	uint16_t cur_idle = wq->wq_thidlecount;
1308*8d741a5dSApple OSS Distributions 
1309*8d741a5dSApple OSS Distributions 	if (cur_idle >= wq_max_constrained_threads ||
1310*8d741a5dSApple OSS Distributions 	    (wq->wq_thdying_count == 0 && oldest &&
1311*8d741a5dSApple OSS Distributions 	    workq_should_kill_idle_thread(wq, oldest, now))) {
1312*8d741a5dSApple OSS Distributions 		/*
1313*8d741a5dSApple OSS Distributions 		 * Immediately kill threads if we have too may of them.
1314*8d741a5dSApple OSS Distributions 		 *
1315*8d741a5dSApple OSS Distributions 		 * And swap "place" with the oldest one we'd have woken up.
1316*8d741a5dSApple OSS Distributions 		 * This is a relatively desperate situation where we really
1317*8d741a5dSApple OSS Distributions 		 * need to kill threads quickly and it's best to kill
1318*8d741a5dSApple OSS Distributions 		 * the one that's currently on core than context switching.
1319*8d741a5dSApple OSS Distributions 		 */
1320*8d741a5dSApple OSS Distributions 		if (oldest) {
1321*8d741a5dSApple OSS Distributions 			oldest->uu_save.uus_workq_park_data.idle_stamp = now;
1322*8d741a5dSApple OSS Distributions 			TAILQ_REMOVE(&wq->wq_thidlelist, oldest, uu_workq_entry);
1323*8d741a5dSApple OSS Distributions 			TAILQ_INSERT_HEAD(&wq->wq_thidlelist, oldest, uu_workq_entry);
1324*8d741a5dSApple OSS Distributions 		}
1325*8d741a5dSApple OSS Distributions 
1326*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_terminate | DBG_FUNC_START,
1327*8d741a5dSApple OSS Distributions 		    wq, cur_idle, 0, 0);
1328*8d741a5dSApple OSS Distributions 		wq->wq_thdying_count++;
1329*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
1330*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags &= ~UT_WORKQ_IDLE_CLEANUP;
1331*8d741a5dSApple OSS Distributions 		workq_unpark_for_death_and_unlock(p, wq, uth, 0, setup_flags);
1332*8d741a5dSApple OSS Distributions 		__builtin_unreachable();
1333*8d741a5dSApple OSS Distributions 	}
1334*8d741a5dSApple OSS Distributions 
1335*8d741a5dSApple OSS Distributions 	struct uthread *tail = TAILQ_LAST(&wq->wq_thidlelist, workq_uthread_head);
1336*8d741a5dSApple OSS Distributions 
1337*8d741a5dSApple OSS Distributions 	cur_idle += 1;
1338*8d741a5dSApple OSS Distributions 	wq->wq_thidlecount = cur_idle;
1339*8d741a5dSApple OSS Distributions 
1340*8d741a5dSApple OSS Distributions 	if (cur_idle >= wq_death_max_load && tail &&
1341*8d741a5dSApple OSS Distributions 	    tail->uu_save.uus_workq_park_data.has_stack) {
1342*8d741a5dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.has_stack = false;
1343*8d741a5dSApple OSS Distributions 		TAILQ_INSERT_TAIL(&wq->wq_thidlelist, uth, uu_workq_entry);
1344*8d741a5dSApple OSS Distributions 	} else {
1345*8d741a5dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.has_stack = true;
1346*8d741a5dSApple OSS Distributions 		TAILQ_INSERT_HEAD(&wq->wq_thidlelist, uth, uu_workq_entry);
1347*8d741a5dSApple OSS Distributions 	}
1348*8d741a5dSApple OSS Distributions 
1349*8d741a5dSApple OSS Distributions 	if (!tail) {
1350*8d741a5dSApple OSS Distributions 		uint64_t delay = workq_kill_delay_for_idle_thread(wq);
1351*8d741a5dSApple OSS Distributions 		workq_death_call_schedule(wq, now + delay);
1352*8d741a5dSApple OSS Distributions 	}
1353*8d741a5dSApple OSS Distributions }
1354*8d741a5dSApple OSS Distributions 
1355*8d741a5dSApple OSS Distributions #pragma mark thread requests
1356*8d741a5dSApple OSS Distributions 
1357*8d741a5dSApple OSS Distributions static inline bool
workq_tr_is_overcommit(workq_tr_flags_t tr_flags)1358*8d741a5dSApple OSS Distributions workq_tr_is_overcommit(workq_tr_flags_t tr_flags)
1359*8d741a5dSApple OSS Distributions {
1360*8d741a5dSApple OSS Distributions 	return (tr_flags & WORKQ_TR_FLAG_OVERCOMMIT) != 0;
1361*8d741a5dSApple OSS Distributions }
1362*8d741a5dSApple OSS Distributions 
1363*8d741a5dSApple OSS Distributions static inline bool
workq_tr_is_nonovercommit(workq_tr_flags_t tr_flags)1364*8d741a5dSApple OSS Distributions workq_tr_is_nonovercommit(workq_tr_flags_t tr_flags)
1365*8d741a5dSApple OSS Distributions {
1366*8d741a5dSApple OSS Distributions 	return (tr_flags & (WORKQ_TR_FLAG_OVERCOMMIT |
1367*8d741a5dSApple OSS Distributions 	       WORKQ_TR_FLAG_COOPERATIVE |
1368*8d741a5dSApple OSS Distributions 	       WORKQ_TR_FLAG_PERMANENT_BIND)) == 0;
1369*8d741a5dSApple OSS Distributions }
1370*8d741a5dSApple OSS Distributions 
1371*8d741a5dSApple OSS Distributions static inline bool
workq_tr_is_cooperative(workq_tr_flags_t tr_flags)1372*8d741a5dSApple OSS Distributions workq_tr_is_cooperative(workq_tr_flags_t tr_flags)
1373*8d741a5dSApple OSS Distributions {
1374*8d741a5dSApple OSS Distributions 	return (tr_flags & WORKQ_TR_FLAG_COOPERATIVE) != 0;
1375*8d741a5dSApple OSS Distributions }
1376*8d741a5dSApple OSS Distributions 
/* Shorthands applying the workq_tr_is_*() predicates to a request's tr_flags. */
#define workq_threadreq_is_overcommit(req) \
	workq_tr_is_overcommit((req)->tr_flags)
#define workq_threadreq_is_nonovercommit(req) \
	workq_tr_is_nonovercommit((req)->tr_flags)
#define workq_threadreq_is_cooperative(req) \
	workq_tr_is_cooperative((req)->tr_flags)
1380*8d741a5dSApple OSS Distributions 
1381*8d741a5dSApple OSS Distributions static inline int
workq_priority_for_req(workq_threadreq_t req)1382*8d741a5dSApple OSS Distributions workq_priority_for_req(workq_threadreq_t req)
1383*8d741a5dSApple OSS Distributions {
1384*8d741a5dSApple OSS Distributions 	thread_qos_t qos = req->tr_qos;
1385*8d741a5dSApple OSS Distributions 
1386*8d741a5dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
1387*8d741a5dSApple OSS Distributions 		workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(req);
1388*8d741a5dSApple OSS Distributions 		assert(trp.trp_flags & TRP_PRIORITY);
1389*8d741a5dSApple OSS Distributions 		return trp.trp_pri;
1390*8d741a5dSApple OSS Distributions 	}
1391*8d741a5dSApple OSS Distributions 	return thread_workq_pri_for_qos(qos);
1392*8d741a5dSApple OSS Distributions }
1393*8d741a5dSApple OSS Distributions 
1394*8d741a5dSApple OSS Distributions static inline struct priority_queue_sched_max *
workq_priority_queue_for_req(struct workqueue * wq,workq_threadreq_t req)1395*8d741a5dSApple OSS Distributions workq_priority_queue_for_req(struct workqueue *wq, workq_threadreq_t req)
1396*8d741a5dSApple OSS Distributions {
1397*8d741a5dSApple OSS Distributions 	assert(!workq_tr_is_cooperative(req->tr_flags));
1398*8d741a5dSApple OSS Distributions 
1399*8d741a5dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
1400*8d741a5dSApple OSS Distributions 		return &wq->wq_special_queue;
1401*8d741a5dSApple OSS Distributions 	} else if (workq_tr_is_overcommit(req->tr_flags)) {
1402*8d741a5dSApple OSS Distributions 		return &wq->wq_overcommit_queue;
1403*8d741a5dSApple OSS Distributions 	} else {
1404*8d741a5dSApple OSS Distributions 		return &wq->wq_constrained_queue;
1405*8d741a5dSApple OSS Distributions 	}
1406*8d741a5dSApple OSS Distributions }
1407*8d741a5dSApple OSS Distributions 
1408*8d741a5dSApple OSS Distributions /* Calculates the number of threads scheduled >= the input QoS */
1409*8d741a5dSApple OSS Distributions static uint64_t
workq_num_cooperative_threads_scheduled_to_qos_internal(struct workqueue * wq,thread_qos_t qos)1410*8d741a5dSApple OSS Distributions workq_num_cooperative_threads_scheduled_to_qos_internal(struct workqueue *wq, thread_qos_t qos)
1411*8d741a5dSApple OSS Distributions {
1412*8d741a5dSApple OSS Distributions 	uint64_t num_cooperative_threads = 0;
1413*8d741a5dSApple OSS Distributions 
1414*8d741a5dSApple OSS Distributions 	for (thread_qos_t cur_qos = WORKQ_THREAD_QOS_MAX; cur_qos >= qos; cur_qos--) {
1415*8d741a5dSApple OSS Distributions 		uint8_t bucket = _wq_bucket(cur_qos);
1416*8d741a5dSApple OSS Distributions 		num_cooperative_threads += wq->wq_cooperative_queue_scheduled_count[bucket];
1417*8d741a5dSApple OSS Distributions 	}
1418*8d741a5dSApple OSS Distributions 
1419*8d741a5dSApple OSS Distributions 	return num_cooperative_threads;
1420*8d741a5dSApple OSS Distributions }
1421*8d741a5dSApple OSS Distributions 
1422*8d741a5dSApple OSS Distributions /* Calculates the number of threads scheduled >= the input QoS */
1423*8d741a5dSApple OSS Distributions static uint64_t
workq_num_cooperative_threads_scheduled_to_qos_locked(struct workqueue * wq,thread_qos_t qos)1424*8d741a5dSApple OSS Distributions workq_num_cooperative_threads_scheduled_to_qos_locked(struct workqueue *wq, thread_qos_t qos)
1425*8d741a5dSApple OSS Distributions {
1426*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
1427*8d741a5dSApple OSS Distributions 	return workq_num_cooperative_threads_scheduled_to_qos_internal(wq, qos);
1428*8d741a5dSApple OSS Distributions }
1429*8d741a5dSApple OSS Distributions 
1430*8d741a5dSApple OSS Distributions static uint64_t
workq_num_cooperative_threads_scheduled_total(struct workqueue * wq)1431*8d741a5dSApple OSS Distributions workq_num_cooperative_threads_scheduled_total(struct workqueue *wq)
1432*8d741a5dSApple OSS Distributions {
1433*8d741a5dSApple OSS Distributions 	return workq_num_cooperative_threads_scheduled_to_qos_locked(wq, WORKQ_THREAD_QOS_MIN);
1434*8d741a5dSApple OSS Distributions }
1435*8d741a5dSApple OSS Distributions 
1436*8d741a5dSApple OSS Distributions static bool
workq_has_cooperative_thread_requests(struct workqueue * wq)1437*8d741a5dSApple OSS Distributions workq_has_cooperative_thread_requests(struct workqueue *wq)
1438*8d741a5dSApple OSS Distributions {
1439*8d741a5dSApple OSS Distributions 	for (thread_qos_t qos = WORKQ_THREAD_QOS_MAX; qos >= WORKQ_THREAD_QOS_MIN; qos--) {
1440*8d741a5dSApple OSS Distributions 		uint8_t bucket = _wq_bucket(qos);
1441*8d741a5dSApple OSS Distributions 		if (!STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket])) {
1442*8d741a5dSApple OSS Distributions 			return true;
1443*8d741a5dSApple OSS Distributions 		}
1444*8d741a5dSApple OSS Distributions 	}
1445*8d741a5dSApple OSS Distributions 
1446*8d741a5dSApple OSS Distributions 	return false;
1447*8d741a5dSApple OSS Distributions }
1448*8d741a5dSApple OSS Distributions 
1449*8d741a5dSApple OSS Distributions /*
1450*8d741a5dSApple OSS Distributions  * Determines the next QoS bucket we should service next in the cooperative
1451*8d741a5dSApple OSS Distributions  * pool. This function will always return a QoS for cooperative pool as long as
1452*8d741a5dSApple OSS Distributions  * there are requests to be serviced.
1453*8d741a5dSApple OSS Distributions  *
1454*8d741a5dSApple OSS Distributions  * Unlike the other thread pools, for the cooperative thread pool the schedule
1455*8d741a5dSApple OSS Distributions  * counts for the various buckets in the pool affect the next best request for
1456*8d741a5dSApple OSS Distributions  * it.
1457*8d741a5dSApple OSS Distributions  *
1458*8d741a5dSApple OSS Distributions  * This function is called in the following contexts:
1459*8d741a5dSApple OSS Distributions  *
1460*8d741a5dSApple OSS Distributions  * a) When determining the best thread QoS for cooperative bucket for the
1461*8d741a5dSApple OSS Distributions  * creator/thread reuse
1462*8d741a5dSApple OSS Distributions  *
1463*8d741a5dSApple OSS Distributions  * b) Once (a) has happened and thread has bound to a thread request, figuring
1464*8d741a5dSApple OSS Distributions  * out whether the next best request for this pool has changed so that creator
1465*8d741a5dSApple OSS Distributions  * can be scheduled.
1466*8d741a5dSApple OSS Distributions  *
1467*8d741a5dSApple OSS Distributions  * Returns true if the cooperative queue's best qos changed from previous
1468*8d741a5dSApple OSS Distributions  * value.
1469*8d741a5dSApple OSS Distributions  */
1470*8d741a5dSApple OSS Distributions static bool
_wq_cooperative_queue_refresh_best_req_qos(struct workqueue * wq)1471*8d741a5dSApple OSS Distributions _wq_cooperative_queue_refresh_best_req_qos(struct workqueue *wq)
1472*8d741a5dSApple OSS Distributions {
1473*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
1474*8d741a5dSApple OSS Distributions 
1475*8d741a5dSApple OSS Distributions 	thread_qos_t old_best_req_qos = wq->wq_cooperative_queue_best_req_qos;
1476*8d741a5dSApple OSS Distributions 
1477*8d741a5dSApple OSS Distributions 	/* We determine the next best cooperative thread request based on the
1478*8d741a5dSApple OSS Distributions 	 * following:
1479*8d741a5dSApple OSS Distributions 	 *
1480*8d741a5dSApple OSS Distributions 	 * 1. Take the MAX of the following:
1481*8d741a5dSApple OSS Distributions 	 *		a) Highest qos with pending TRs such that number of scheduled
1482*8d741a5dSApple OSS Distributions 	 *		threads so far with >= qos is < wq_max_cooperative_threads
1483*8d741a5dSApple OSS Distributions 	 *		b) Highest qos bucket with pending TRs but no scheduled threads for that bucket
1484*8d741a5dSApple OSS Distributions 	 *
1485*8d741a5dSApple OSS Distributions 	 * 2. If the result of (1) is UN, then we pick the highest priority amongst
1486*8d741a5dSApple OSS Distributions 	 * pending thread requests in the pool.
1487*8d741a5dSApple OSS Distributions 	 *
1488*8d741a5dSApple OSS Distributions 	 */
1489*8d741a5dSApple OSS Distributions 	thread_qos_t highest_qos_with_no_scheduled = THREAD_QOS_UNSPECIFIED;
1490*8d741a5dSApple OSS Distributions 	thread_qos_t highest_qos_req_with_width = THREAD_QOS_UNSPECIFIED;
1491*8d741a5dSApple OSS Distributions 
1492*8d741a5dSApple OSS Distributions 	thread_qos_t highest_qos_req = THREAD_QOS_UNSPECIFIED;
1493*8d741a5dSApple OSS Distributions 
1494*8d741a5dSApple OSS Distributions 	int scheduled_count_till_qos = 0;
1495*8d741a5dSApple OSS Distributions 
1496*8d741a5dSApple OSS Distributions 	for (thread_qos_t qos = WORKQ_THREAD_QOS_MAX; qos >= WORKQ_THREAD_QOS_MIN; qos--) {
1497*8d741a5dSApple OSS Distributions 		uint8_t bucket = _wq_bucket(qos);
1498*8d741a5dSApple OSS Distributions 		uint8_t scheduled_count_for_bucket = wq->wq_cooperative_queue_scheduled_count[bucket];
1499*8d741a5dSApple OSS Distributions 		scheduled_count_till_qos += scheduled_count_for_bucket;
1500*8d741a5dSApple OSS Distributions 
1501*8d741a5dSApple OSS Distributions 		if (!STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket])) {
1502*8d741a5dSApple OSS Distributions 			if (qos > highest_qos_req) {
1503*8d741a5dSApple OSS Distributions 				highest_qos_req = qos;
1504*8d741a5dSApple OSS Distributions 			}
1505*8d741a5dSApple OSS Distributions 			/*
1506*8d741a5dSApple OSS Distributions 			 * The pool isn't saturated for threads at and above this QoS, and
1507*8d741a5dSApple OSS Distributions 			 * this qos bucket has pending requests
1508*8d741a5dSApple OSS Distributions 			 */
1509*8d741a5dSApple OSS Distributions 			if (scheduled_count_till_qos < wq_cooperative_queue_max_size(wq)) {
1510*8d741a5dSApple OSS Distributions 				if (qos > highest_qos_req_with_width) {
1511*8d741a5dSApple OSS Distributions 					highest_qos_req_with_width = qos;
1512*8d741a5dSApple OSS Distributions 				}
1513*8d741a5dSApple OSS Distributions 			}
1514*8d741a5dSApple OSS Distributions 
1515*8d741a5dSApple OSS Distributions 			/*
1516*8d741a5dSApple OSS Distributions 			 * There are no threads scheduled for this bucket but there
1517*8d741a5dSApple OSS Distributions 			 * is work pending, give it at least 1 thread
1518*8d741a5dSApple OSS Distributions 			 */
1519*8d741a5dSApple OSS Distributions 			if (scheduled_count_for_bucket == 0) {
1520*8d741a5dSApple OSS Distributions 				if (qos > highest_qos_with_no_scheduled) {
1521*8d741a5dSApple OSS Distributions 					highest_qos_with_no_scheduled = qos;
1522*8d741a5dSApple OSS Distributions 				}
1523*8d741a5dSApple OSS Distributions 			}
1524*8d741a5dSApple OSS Distributions 		}
1525*8d741a5dSApple OSS Distributions 	}
1526*8d741a5dSApple OSS Distributions 
1527*8d741a5dSApple OSS Distributions 	wq->wq_cooperative_queue_best_req_qos = MAX(highest_qos_with_no_scheduled, highest_qos_req_with_width);
1528*8d741a5dSApple OSS Distributions 	if (wq->wq_cooperative_queue_best_req_qos == THREAD_QOS_UNSPECIFIED) {
1529*8d741a5dSApple OSS Distributions 		wq->wq_cooperative_queue_best_req_qos = highest_qos_req;
1530*8d741a5dSApple OSS Distributions 	}
1531*8d741a5dSApple OSS Distributions 
1532*8d741a5dSApple OSS Distributions #if MACH_ASSERT
1533*8d741a5dSApple OSS Distributions 	/* Assert that if we are showing up the next best req as UN, then there
1534*8d741a5dSApple OSS Distributions 	 * actually is no thread request in the cooperative pool buckets */
1535*8d741a5dSApple OSS Distributions 	if (wq->wq_cooperative_queue_best_req_qos == THREAD_QOS_UNSPECIFIED) {
1536*8d741a5dSApple OSS Distributions 		assert(!workq_has_cooperative_thread_requests(wq));
1537*8d741a5dSApple OSS Distributions 	}
1538*8d741a5dSApple OSS Distributions #endif
1539*8d741a5dSApple OSS Distributions 
1540*8d741a5dSApple OSS Distributions 	return old_best_req_qos != wq->wq_cooperative_queue_best_req_qos;
1541*8d741a5dSApple OSS Distributions }
1542*8d741a5dSApple OSS Distributions 
1543*8d741a5dSApple OSS Distributions /*
1544*8d741a5dSApple OSS Distributions  * Returns whether or not the input thread (or creator thread if uth is NULL)
1545*8d741a5dSApple OSS Distributions  * should be allowed to work as part of the cooperative pool for the <input qos>
1546*8d741a5dSApple OSS Distributions  * bucket.
1547*8d741a5dSApple OSS Distributions  *
1548*8d741a5dSApple OSS Distributions  * This function is called in a bunch of places:
1549*8d741a5dSApple OSS Distributions  *		a) Quantum expires for a thread and it is part of the cooperative pool
1550*8d741a5dSApple OSS Distributions  *		b) When trying to pick a thread request for the creator thread to
1551*8d741a5dSApple OSS Distributions  *		represent.
1552*8d741a5dSApple OSS Distributions  *		c) When a thread is trying to pick a thread request to actually bind to
1553*8d741a5dSApple OSS Distributions  *		and service.
1554*8d741a5dSApple OSS Distributions  *
1555*8d741a5dSApple OSS Distributions  * Called with workq lock held.
1556*8d741a5dSApple OSS Distributions  */
1557*8d741a5dSApple OSS Distributions 
1558*8d741a5dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_UNSATURATED 1
1559*8d741a5dSApple OSS Distributions #define WQ_COOPERATIVE_BUCKET_UNSERVICED 2
1560*8d741a5dSApple OSS Distributions #define WQ_COOPERATIVE_POOL_SATURATED_UP_TO_QOS 3
1561*8d741a5dSApple OSS Distributions 
1562*8d741a5dSApple OSS Distributions static bool
workq_cooperative_allowance(struct workqueue * wq,thread_qos_t qos,struct uthread * uth,bool may_start_timer)1563*8d741a5dSApple OSS Distributions workq_cooperative_allowance(struct workqueue *wq, thread_qos_t qos, struct uthread *uth,
1564*8d741a5dSApple OSS Distributions     bool may_start_timer)
1565*8d741a5dSApple OSS Distributions {
1566*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
1567*8d741a5dSApple OSS Distributions 
1568*8d741a5dSApple OSS Distributions 	bool exclude_thread_as_scheduled = false;
1569*8d741a5dSApple OSS Distributions 	bool passed_admissions = false;
1570*8d741a5dSApple OSS Distributions 	uint8_t bucket = _wq_bucket(qos);
1571*8d741a5dSApple OSS Distributions 
1572*8d741a5dSApple OSS Distributions 	if (uth && workq_thread_is_cooperative(uth)) {
1573*8d741a5dSApple OSS Distributions 		exclude_thread_as_scheduled = true;
1574*8d741a5dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_dec(wq, uth->uu_workq_pri.qos_req);
1575*8d741a5dSApple OSS Distributions 	}
1576*8d741a5dSApple OSS Distributions 
1577*8d741a5dSApple OSS Distributions 	/*
1578*8d741a5dSApple OSS Distributions 	 * We have not saturated the pool yet, let this thread continue
1579*8d741a5dSApple OSS Distributions 	 */
1580*8d741a5dSApple OSS Distributions 	uint64_t total_cooperative_threads;
1581*8d741a5dSApple OSS Distributions 	total_cooperative_threads = workq_num_cooperative_threads_scheduled_total(wq);
1582*8d741a5dSApple OSS Distributions 	if (total_cooperative_threads < wq_cooperative_queue_max_size(wq)) {
1583*8d741a5dSApple OSS Distributions 		passed_admissions = true;
1584*8d741a5dSApple OSS Distributions 		WQ_TRACE(TRACE_wq_cooperative_admission | DBG_FUNC_NONE,
1585*8d741a5dSApple OSS Distributions 		    total_cooperative_threads, qos, passed_admissions,
1586*8d741a5dSApple OSS Distributions 		    WQ_COOPERATIVE_POOL_UNSATURATED);
1587*8d741a5dSApple OSS Distributions 		goto out;
1588*8d741a5dSApple OSS Distributions 	}
1589*8d741a5dSApple OSS Distributions 
1590*8d741a5dSApple OSS Distributions 	/*
1591*8d741a5dSApple OSS Distributions 	 * Without this thread, nothing is servicing the bucket which has pending
1592*8d741a5dSApple OSS Distributions 	 * work
1593*8d741a5dSApple OSS Distributions 	 */
1594*8d741a5dSApple OSS Distributions 	uint64_t bucket_scheduled = wq->wq_cooperative_queue_scheduled_count[bucket];
1595*8d741a5dSApple OSS Distributions 	if (bucket_scheduled == 0 &&
1596*8d741a5dSApple OSS Distributions 	    !STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket])) {
1597*8d741a5dSApple OSS Distributions 		passed_admissions = true;
1598*8d741a5dSApple OSS Distributions 		WQ_TRACE(TRACE_wq_cooperative_admission | DBG_FUNC_NONE,
1599*8d741a5dSApple OSS Distributions 		    total_cooperative_threads, qos, passed_admissions,
1600*8d741a5dSApple OSS Distributions 		    WQ_COOPERATIVE_BUCKET_UNSERVICED);
1601*8d741a5dSApple OSS Distributions 		goto out;
1602*8d741a5dSApple OSS Distributions 	}
1603*8d741a5dSApple OSS Distributions 
1604*8d741a5dSApple OSS Distributions 	/*
1605*8d741a5dSApple OSS Distributions 	 * If number of threads at the QoS bucket >= input QoS exceeds the max we want
1606*8d741a5dSApple OSS Distributions 	 * for the pool, deny this thread
1607*8d741a5dSApple OSS Distributions 	 */
1608*8d741a5dSApple OSS Distributions 	uint64_t aggregate_down_to_qos = workq_num_cooperative_threads_scheduled_to_qos_locked(wq, qos);
1609*8d741a5dSApple OSS Distributions 	passed_admissions = (aggregate_down_to_qos < wq_cooperative_queue_max_size(wq));
1610*8d741a5dSApple OSS Distributions 	WQ_TRACE(TRACE_wq_cooperative_admission | DBG_FUNC_NONE, aggregate_down_to_qos,
1611*8d741a5dSApple OSS Distributions 	    qos, passed_admissions, WQ_COOPERATIVE_POOL_SATURATED_UP_TO_QOS);
1612*8d741a5dSApple OSS Distributions 
1613*8d741a5dSApple OSS Distributions 	if (!passed_admissions && may_start_timer) {
1614*8d741a5dSApple OSS Distributions 		workq_schedule_delayed_thread_creation(wq, 0);
1615*8d741a5dSApple OSS Distributions 	}
1616*8d741a5dSApple OSS Distributions 
1617*8d741a5dSApple OSS Distributions out:
1618*8d741a5dSApple OSS Distributions 	if (exclude_thread_as_scheduled) {
1619*8d741a5dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_inc(wq, uth->uu_workq_pri.qos_req);
1620*8d741a5dSApple OSS Distributions 	}
1621*8d741a5dSApple OSS Distributions 	return passed_admissions;
1622*8d741a5dSApple OSS Distributions }
1623*8d741a5dSApple OSS Distributions 
1624*8d741a5dSApple OSS Distributions /*
1625*8d741a5dSApple OSS Distributions  * returns true if the best request for the pool changed as a result of
1626*8d741a5dSApple OSS Distributions  * enqueuing this thread request.
1627*8d741a5dSApple OSS Distributions  */
1628*8d741a5dSApple OSS Distributions static bool
workq_threadreq_enqueue(struct workqueue * wq,workq_threadreq_t req)1629*8d741a5dSApple OSS Distributions workq_threadreq_enqueue(struct workqueue *wq, workq_threadreq_t req)
1630*8d741a5dSApple OSS Distributions {
1631*8d741a5dSApple OSS Distributions 	assert(req->tr_state == WORKQ_TR_STATE_NEW);
1632*8d741a5dSApple OSS Distributions 
1633*8d741a5dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_QUEUED;
1634*8d741a5dSApple OSS Distributions 	wq->wq_reqcount += req->tr_count;
1635*8d741a5dSApple OSS Distributions 
1636*8d741a5dSApple OSS Distributions 	if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
1637*8d741a5dSApple OSS Distributions 		assert(wq->wq_event_manager_threadreq == NULL);
1638*8d741a5dSApple OSS Distributions 		assert(req->tr_flags & WORKQ_TR_FLAG_KEVENT);
1639*8d741a5dSApple OSS Distributions 		assert(req->tr_count == 1);
1640*8d741a5dSApple OSS Distributions 		wq->wq_event_manager_threadreq = req;
1641*8d741a5dSApple OSS Distributions 		return true;
1642*8d741a5dSApple OSS Distributions 	}
1643*8d741a5dSApple OSS Distributions 
1644*8d741a5dSApple OSS Distributions 	if (workq_threadreq_is_cooperative(req)) {
1645*8d741a5dSApple OSS Distributions 		assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
1646*8d741a5dSApple OSS Distributions 		assert(req->tr_qos != WORKQ_THREAD_QOS_ABOVEUI);
1647*8d741a5dSApple OSS Distributions 
1648*8d741a5dSApple OSS Distributions 		struct workq_threadreq_tailq *bucket = &wq->wq_cooperative_queue[_wq_bucket(req->tr_qos)];
1649*8d741a5dSApple OSS Distributions 		STAILQ_INSERT_TAIL(bucket, req, tr_link);
1650*8d741a5dSApple OSS Distributions 
1651*8d741a5dSApple OSS Distributions 		return _wq_cooperative_queue_refresh_best_req_qos(wq);
1652*8d741a5dSApple OSS Distributions 	}
1653*8d741a5dSApple OSS Distributions 
1654*8d741a5dSApple OSS Distributions 	struct priority_queue_sched_max *q = workq_priority_queue_for_req(wq, req);
1655*8d741a5dSApple OSS Distributions 
1656*8d741a5dSApple OSS Distributions 	priority_queue_entry_set_sched_pri(q, &req->tr_entry,
1657*8d741a5dSApple OSS Distributions 	    workq_priority_for_req(req), false);
1658*8d741a5dSApple OSS Distributions 
1659*8d741a5dSApple OSS Distributions 	if (priority_queue_insert(q, &req->tr_entry)) {
1660*8d741a5dSApple OSS Distributions 		if (workq_threadreq_is_nonovercommit(req)) {
1661*8d741a5dSApple OSS Distributions 			_wq_thactive_refresh_best_constrained_req_qos(wq);
1662*8d741a5dSApple OSS Distributions 		}
1663*8d741a5dSApple OSS Distributions 		return true;
1664*8d741a5dSApple OSS Distributions 	}
1665*8d741a5dSApple OSS Distributions 	return false;
1666*8d741a5dSApple OSS Distributions }
1667*8d741a5dSApple OSS Distributions 
1668*8d741a5dSApple OSS Distributions /*
1669*8d741a5dSApple OSS Distributions  * returns true if one of the following is true (so as to update creator if
1670*8d741a5dSApple OSS Distributions  * needed):
1671*8d741a5dSApple OSS Distributions  *
1672*8d741a5dSApple OSS Distributions  * (a) the next highest request of the pool we dequeued the request from changed
1673*8d741a5dSApple OSS Distributions  * (b) the next highest requests of the pool the current thread used to be a
1674*8d741a5dSApple OSS Distributions  * part of, changed
1675*8d741a5dSApple OSS Distributions  *
1676*8d741a5dSApple OSS Distributions  * For overcommit, special and constrained pools, the next highest QoS for each
1677*8d741a5dSApple OSS Distributions  * pool just a MAX of pending requests so tracking (a) is sufficient.
1678*8d741a5dSApple OSS Distributions  *
1679*8d741a5dSApple OSS Distributions  * But for cooperative thread pool, the next highest QoS for the pool depends on
1680*8d741a5dSApple OSS Distributions  * schedule counts in the pool as well. So if the current thread used to be
1681*8d741a5dSApple OSS Distributions  * cooperative in it's previous logical run ie (b), then that can also affect
1682*8d741a5dSApple OSS Distributions  * cooperative pool's next best QoS requests.
1683*8d741a5dSApple OSS Distributions  */
1684*8d741a5dSApple OSS Distributions static bool
workq_threadreq_dequeue(struct workqueue * wq,workq_threadreq_t req,bool cooperative_sched_count_changed)1685*8d741a5dSApple OSS Distributions workq_threadreq_dequeue(struct workqueue *wq, workq_threadreq_t req,
1686*8d741a5dSApple OSS Distributions     bool cooperative_sched_count_changed)
1687*8d741a5dSApple OSS Distributions {
1688*8d741a5dSApple OSS Distributions 	wq->wq_reqcount--;
1689*8d741a5dSApple OSS Distributions 
1690*8d741a5dSApple OSS Distributions 	bool next_highest_request_changed = false;
1691*8d741a5dSApple OSS Distributions 
1692*8d741a5dSApple OSS Distributions 	if (--req->tr_count == 0) {
1693*8d741a5dSApple OSS Distributions 		if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
1694*8d741a5dSApple OSS Distributions 			assert(wq->wq_event_manager_threadreq == req);
1695*8d741a5dSApple OSS Distributions 			assert(req->tr_count == 0);
1696*8d741a5dSApple OSS Distributions 			wq->wq_event_manager_threadreq = NULL;
1697*8d741a5dSApple OSS Distributions 
1698*8d741a5dSApple OSS Distributions 			/* If a cooperative thread was the one which picked up the manager
1699*8d741a5dSApple OSS Distributions 			 * thread request, we need to reevaluate the cooperative pool
1700*8d741a5dSApple OSS Distributions 			 * anyways.
1701*8d741a5dSApple OSS Distributions 			 */
1702*8d741a5dSApple OSS Distributions 			if (cooperative_sched_count_changed) {
1703*8d741a5dSApple OSS Distributions 				_wq_cooperative_queue_refresh_best_req_qos(wq);
1704*8d741a5dSApple OSS Distributions 			}
1705*8d741a5dSApple OSS Distributions 			return true;
1706*8d741a5dSApple OSS Distributions 		}
1707*8d741a5dSApple OSS Distributions 
1708*8d741a5dSApple OSS Distributions 		if (workq_threadreq_is_cooperative(req)) {
1709*8d741a5dSApple OSS Distributions 			assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
1710*8d741a5dSApple OSS Distributions 			assert(req->tr_qos != WORKQ_THREAD_QOS_ABOVEUI);
1711*8d741a5dSApple OSS Distributions 			/* Account for the fact that BG and MT are coalesced when
1712*8d741a5dSApple OSS Distributions 			 * calculating best request for cooperative pool
1713*8d741a5dSApple OSS Distributions 			 */
1714*8d741a5dSApple OSS Distributions 			assert(_wq_bucket(req->tr_qos) == _wq_bucket(wq->wq_cooperative_queue_best_req_qos));
1715*8d741a5dSApple OSS Distributions 
1716*8d741a5dSApple OSS Distributions 			struct workq_threadreq_tailq *bucket = &wq->wq_cooperative_queue[_wq_bucket(req->tr_qos)];
1717*8d741a5dSApple OSS Distributions 			__assert_only workq_threadreq_t head = STAILQ_FIRST(bucket);
1718*8d741a5dSApple OSS Distributions 
1719*8d741a5dSApple OSS Distributions 			assert(head == req);
1720*8d741a5dSApple OSS Distributions 			STAILQ_REMOVE_HEAD(bucket, tr_link);
1721*8d741a5dSApple OSS Distributions 
1722*8d741a5dSApple OSS Distributions 			/*
1723*8d741a5dSApple OSS Distributions 			 * If the request we're dequeueing is cooperative, then the sched
1724*8d741a5dSApple OSS Distributions 			 * counts definitely changed.
1725*8d741a5dSApple OSS Distributions 			 */
1726*8d741a5dSApple OSS Distributions 			assert(cooperative_sched_count_changed);
1727*8d741a5dSApple OSS Distributions 		}
1728*8d741a5dSApple OSS Distributions 
1729*8d741a5dSApple OSS Distributions 		/*
1730*8d741a5dSApple OSS Distributions 		 * We want to do the cooperative pool refresh after dequeueing a
1731*8d741a5dSApple OSS Distributions 		 * cooperative thread request if any (to combine both effects into 1
1732*8d741a5dSApple OSS Distributions 		 * refresh operation)
1733*8d741a5dSApple OSS Distributions 		 */
1734*8d741a5dSApple OSS Distributions 		if (cooperative_sched_count_changed) {
1735*8d741a5dSApple OSS Distributions 			next_highest_request_changed = _wq_cooperative_queue_refresh_best_req_qos(wq);
1736*8d741a5dSApple OSS Distributions 		}
1737*8d741a5dSApple OSS Distributions 
1738*8d741a5dSApple OSS Distributions 		if (!workq_threadreq_is_cooperative(req)) {
1739*8d741a5dSApple OSS Distributions 			/*
1740*8d741a5dSApple OSS Distributions 			 * All other types of requests are enqueued in priority queues
1741*8d741a5dSApple OSS Distributions 			 */
1742*8d741a5dSApple OSS Distributions 
1743*8d741a5dSApple OSS Distributions 			if (priority_queue_remove(workq_priority_queue_for_req(wq, req),
1744*8d741a5dSApple OSS Distributions 			    &req->tr_entry)) {
1745*8d741a5dSApple OSS Distributions 				next_highest_request_changed |= true;
1746*8d741a5dSApple OSS Distributions 				if (workq_threadreq_is_nonovercommit(req)) {
1747*8d741a5dSApple OSS Distributions 					_wq_thactive_refresh_best_constrained_req_qos(wq);
1748*8d741a5dSApple OSS Distributions 				}
1749*8d741a5dSApple OSS Distributions 			}
1750*8d741a5dSApple OSS Distributions 		}
1751*8d741a5dSApple OSS Distributions 	}
1752*8d741a5dSApple OSS Distributions 
1753*8d741a5dSApple OSS Distributions 	return next_highest_request_changed;
1754*8d741a5dSApple OSS Distributions }
1755*8d741a5dSApple OSS Distributions 
1756*8d741a5dSApple OSS Distributions static void
workq_threadreq_destroy(proc_t p,workq_threadreq_t req)1757*8d741a5dSApple OSS Distributions workq_threadreq_destroy(proc_t p, workq_threadreq_t req)
1758*8d741a5dSApple OSS Distributions {
1759*8d741a5dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_CANCELED;
1760*8d741a5dSApple OSS Distributions 	if (req->tr_flags & (WORKQ_TR_FLAG_WORKLOOP | WORKQ_TR_FLAG_KEVENT)) {
1761*8d741a5dSApple OSS Distributions 		kqueue_threadreq_cancel(p, req);
1762*8d741a5dSApple OSS Distributions 	} else {
1763*8d741a5dSApple OSS Distributions 		zfree(workq_zone_threadreq, req);
1764*8d741a5dSApple OSS Distributions 	}
1765*8d741a5dSApple OSS Distributions }
1766*8d741a5dSApple OSS Distributions 
1767*8d741a5dSApple OSS Distributions #pragma mark workqueue thread creation thread calls
1768*8d741a5dSApple OSS Distributions 
1769*8d741a5dSApple OSS Distributions static inline bool
workq_thread_call_prepost(struct workqueue * wq,uint32_t sched,uint32_t pend,uint32_t fail_mask)1770*8d741a5dSApple OSS Distributions workq_thread_call_prepost(struct workqueue *wq, uint32_t sched, uint32_t pend,
1771*8d741a5dSApple OSS Distributions     uint32_t fail_mask)
1772*8d741a5dSApple OSS Distributions {
1773*8d741a5dSApple OSS Distributions 	uint32_t old_flags, new_flags;
1774*8d741a5dSApple OSS Distributions 
1775*8d741a5dSApple OSS Distributions 	os_atomic_rmw_loop(&wq->wq_flags, old_flags, new_flags, acquire, {
1776*8d741a5dSApple OSS Distributions 		if (__improbable(old_flags & (WQ_EXITING | sched | pend | fail_mask))) {
1777*8d741a5dSApple OSS Distributions 		        os_atomic_rmw_loop_give_up(return false);
1778*8d741a5dSApple OSS Distributions 		}
1779*8d741a5dSApple OSS Distributions 		if (__improbable(old_flags & WQ_PROC_SUSPENDED)) {
1780*8d741a5dSApple OSS Distributions 		        new_flags = old_flags | pend;
1781*8d741a5dSApple OSS Distributions 		} else {
1782*8d741a5dSApple OSS Distributions 		        new_flags = old_flags | sched;
1783*8d741a5dSApple OSS Distributions 		}
1784*8d741a5dSApple OSS Distributions 	});
1785*8d741a5dSApple OSS Distributions 
1786*8d741a5dSApple OSS Distributions 	return (old_flags & WQ_PROC_SUSPENDED) == 0;
1787*8d741a5dSApple OSS Distributions }
1788*8d741a5dSApple OSS Distributions 
1789*8d741a5dSApple OSS Distributions #define WORKQ_SCHEDULE_DELAYED_THREAD_CREATION_RESTART 0x1
1790*8d741a5dSApple OSS Distributions 
1791*8d741a5dSApple OSS Distributions static bool
workq_schedule_delayed_thread_creation(struct workqueue * wq,int flags)1792*8d741a5dSApple OSS Distributions workq_schedule_delayed_thread_creation(struct workqueue *wq, int flags)
1793*8d741a5dSApple OSS Distributions {
1794*8d741a5dSApple OSS Distributions 	assert(!preemption_enabled());
1795*8d741a5dSApple OSS Distributions 
1796*8d741a5dSApple OSS Distributions 	if (!workq_thread_call_prepost(wq, WQ_DELAYED_CALL_SCHEDULED,
1797*8d741a5dSApple OSS Distributions 	    WQ_DELAYED_CALL_PENDED, WQ_IMMEDIATE_CALL_PENDED |
1798*8d741a5dSApple OSS Distributions 	    WQ_IMMEDIATE_CALL_SCHEDULED)) {
1799*8d741a5dSApple OSS Distributions 		return false;
1800*8d741a5dSApple OSS Distributions 	}
1801*8d741a5dSApple OSS Distributions 
1802*8d741a5dSApple OSS Distributions 	uint64_t now = mach_absolute_time();
1803*8d741a5dSApple OSS Distributions 
1804*8d741a5dSApple OSS Distributions 	if (flags & WORKQ_SCHEDULE_DELAYED_THREAD_CREATION_RESTART) {
1805*8d741a5dSApple OSS Distributions 		/* do not change the window */
1806*8d741a5dSApple OSS Distributions 	} else if (now - wq->wq_thread_call_last_run <= wq->wq_timer_interval) {
1807*8d741a5dSApple OSS Distributions 		wq->wq_timer_interval *= 2;
1808*8d741a5dSApple OSS Distributions 		if (wq->wq_timer_interval > wq_max_timer_interval.abstime) {
1809*8d741a5dSApple OSS Distributions 			wq->wq_timer_interval = (uint32_t)wq_max_timer_interval.abstime;
1810*8d741a5dSApple OSS Distributions 		}
1811*8d741a5dSApple OSS Distributions 	} else if (now - wq->wq_thread_call_last_run > 2 * wq->wq_timer_interval) {
1812*8d741a5dSApple OSS Distributions 		wq->wq_timer_interval /= 2;
1813*8d741a5dSApple OSS Distributions 		if (wq->wq_timer_interval < wq_stalled_window.abstime) {
1814*8d741a5dSApple OSS Distributions 			wq->wq_timer_interval = (uint32_t)wq_stalled_window.abstime;
1815*8d741a5dSApple OSS Distributions 		}
1816*8d741a5dSApple OSS Distributions 	}
1817*8d741a5dSApple OSS Distributions 
1818*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_start_add_timer, wq, wq->wq_reqcount,
1819*8d741a5dSApple OSS Distributions 	    _wq_flags(wq), wq->wq_timer_interval);
1820*8d741a5dSApple OSS Distributions 
1821*8d741a5dSApple OSS Distributions 	thread_call_t call = wq->wq_delayed_call;
1822*8d741a5dSApple OSS Distributions 	uintptr_t arg = WQ_DELAYED_CALL_SCHEDULED;
1823*8d741a5dSApple OSS Distributions 	uint64_t deadline = now + wq->wq_timer_interval;
1824*8d741a5dSApple OSS Distributions 	if (thread_call_enter1_delayed(call, (void *)arg, deadline)) {
1825*8d741a5dSApple OSS Distributions 		panic("delayed_call was already enqueued");
1826*8d741a5dSApple OSS Distributions 	}
1827*8d741a5dSApple OSS Distributions 	return true;
1828*8d741a5dSApple OSS Distributions }
1829*8d741a5dSApple OSS Distributions 
1830*8d741a5dSApple OSS Distributions static void
workq_schedule_immediate_thread_creation(struct workqueue * wq)1831*8d741a5dSApple OSS Distributions workq_schedule_immediate_thread_creation(struct workqueue *wq)
1832*8d741a5dSApple OSS Distributions {
1833*8d741a5dSApple OSS Distributions 	assert(!preemption_enabled());
1834*8d741a5dSApple OSS Distributions 
1835*8d741a5dSApple OSS Distributions 	if (workq_thread_call_prepost(wq, WQ_IMMEDIATE_CALL_SCHEDULED,
1836*8d741a5dSApple OSS Distributions 	    WQ_IMMEDIATE_CALL_PENDED, 0)) {
1837*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_start_add_timer, wq, wq->wq_reqcount,
1838*8d741a5dSApple OSS Distributions 		    _wq_flags(wq), 0);
1839*8d741a5dSApple OSS Distributions 
1840*8d741a5dSApple OSS Distributions 		uintptr_t arg = WQ_IMMEDIATE_CALL_SCHEDULED;
1841*8d741a5dSApple OSS Distributions 		if (thread_call_enter1(wq->wq_immediate_call, (void *)arg)) {
1842*8d741a5dSApple OSS Distributions 			panic("immediate_call was already enqueued");
1843*8d741a5dSApple OSS Distributions 		}
1844*8d741a5dSApple OSS Distributions 	}
1845*8d741a5dSApple OSS Distributions }
1846*8d741a5dSApple OSS Distributions 
1847*8d741a5dSApple OSS Distributions void
workq_proc_suspended(struct proc * p)1848*8d741a5dSApple OSS Distributions workq_proc_suspended(struct proc *p)
1849*8d741a5dSApple OSS Distributions {
1850*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
1851*8d741a5dSApple OSS Distributions 
1852*8d741a5dSApple OSS Distributions 	if (wq) {
1853*8d741a5dSApple OSS Distributions 		os_atomic_or(&wq->wq_flags, WQ_PROC_SUSPENDED, relaxed);
1854*8d741a5dSApple OSS Distributions 	}
1855*8d741a5dSApple OSS Distributions }
1856*8d741a5dSApple OSS Distributions 
1857*8d741a5dSApple OSS Distributions void
workq_proc_resumed(struct proc * p)1858*8d741a5dSApple OSS Distributions workq_proc_resumed(struct proc *p)
1859*8d741a5dSApple OSS Distributions {
1860*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
1861*8d741a5dSApple OSS Distributions 	uint32_t wq_flags;
1862*8d741a5dSApple OSS Distributions 
1863*8d741a5dSApple OSS Distributions 	if (!wq) {
1864*8d741a5dSApple OSS Distributions 		return;
1865*8d741a5dSApple OSS Distributions 	}
1866*8d741a5dSApple OSS Distributions 
1867*8d741a5dSApple OSS Distributions 	wq_flags = os_atomic_andnot_orig(&wq->wq_flags, WQ_PROC_SUSPENDED |
1868*8d741a5dSApple OSS Distributions 	    WQ_DELAYED_CALL_PENDED | WQ_IMMEDIATE_CALL_PENDED, relaxed);
1869*8d741a5dSApple OSS Distributions 	if ((wq_flags & WQ_EXITING) == 0) {
1870*8d741a5dSApple OSS Distributions 		disable_preemption();
1871*8d741a5dSApple OSS Distributions 		if (wq_flags & WQ_IMMEDIATE_CALL_PENDED) {
1872*8d741a5dSApple OSS Distributions 			workq_schedule_immediate_thread_creation(wq);
1873*8d741a5dSApple OSS Distributions 		} else if (wq_flags & WQ_DELAYED_CALL_PENDED) {
1874*8d741a5dSApple OSS Distributions 			workq_schedule_delayed_thread_creation(wq,
1875*8d741a5dSApple OSS Distributions 			    WORKQ_SCHEDULE_DELAYED_THREAD_CREATION_RESTART);
1876*8d741a5dSApple OSS Distributions 		}
1877*8d741a5dSApple OSS Distributions 		enable_preemption();
1878*8d741a5dSApple OSS Distributions 	}
1879*8d741a5dSApple OSS Distributions }
1880*8d741a5dSApple OSS Distributions 
1881*8d741a5dSApple OSS Distributions /**
1882*8d741a5dSApple OSS Distributions  * returns whether lastblocked_tsp is within wq_stalled_window usecs of now
1883*8d741a5dSApple OSS Distributions  */
1884*8d741a5dSApple OSS Distributions static bool
workq_thread_is_busy(uint64_t now,_Atomic uint64_t * lastblocked_tsp)1885*8d741a5dSApple OSS Distributions workq_thread_is_busy(uint64_t now, _Atomic uint64_t *lastblocked_tsp)
1886*8d741a5dSApple OSS Distributions {
1887*8d741a5dSApple OSS Distributions 	uint64_t lastblocked_ts = os_atomic_load_wide(lastblocked_tsp, relaxed);
1888*8d741a5dSApple OSS Distributions 	if (now <= lastblocked_ts) {
1889*8d741a5dSApple OSS Distributions 		/*
1890*8d741a5dSApple OSS Distributions 		 * Because the update of the timestamp when a thread blocks
1891*8d741a5dSApple OSS Distributions 		 * isn't serialized against us looking at it (i.e. we don't hold
1892*8d741a5dSApple OSS Distributions 		 * the workq lock), it's possible to have a timestamp that matches
1893*8d741a5dSApple OSS Distributions 		 * the current time or that even looks to be in the future relative
1894*8d741a5dSApple OSS Distributions 		 * to when we grabbed the current time...
1895*8d741a5dSApple OSS Distributions 		 *
1896*8d741a5dSApple OSS Distributions 		 * Just treat this as a busy thread since it must have just blocked.
1897*8d741a5dSApple OSS Distributions 		 */
1898*8d741a5dSApple OSS Distributions 		return true;
1899*8d741a5dSApple OSS Distributions 	}
1900*8d741a5dSApple OSS Distributions 	return (now - lastblocked_ts) < wq_stalled_window.abstime;
1901*8d741a5dSApple OSS Distributions }
1902*8d741a5dSApple OSS Distributions 
1903*8d741a5dSApple OSS Distributions static void
workq_add_new_threads_call(void * _p,void * flags)1904*8d741a5dSApple OSS Distributions workq_add_new_threads_call(void *_p, void *flags)
1905*8d741a5dSApple OSS Distributions {
1906*8d741a5dSApple OSS Distributions 	proc_t p = _p;
1907*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
1908*8d741a5dSApple OSS Distributions 	uint32_t my_flag = (uint32_t)(uintptr_t)flags;
1909*8d741a5dSApple OSS Distributions 
1910*8d741a5dSApple OSS Distributions 	/*
1911*8d741a5dSApple OSS Distributions 	 * workq_exit() will set the workqueue to NULL before
1912*8d741a5dSApple OSS Distributions 	 * it cancels thread calls.
1913*8d741a5dSApple OSS Distributions 	 */
1914*8d741a5dSApple OSS Distributions 	if (!wq) {
1915*8d741a5dSApple OSS Distributions 		return;
1916*8d741a5dSApple OSS Distributions 	}
1917*8d741a5dSApple OSS Distributions 
1918*8d741a5dSApple OSS Distributions 	assert((my_flag == WQ_DELAYED_CALL_SCHEDULED) ||
1919*8d741a5dSApple OSS Distributions 	    (my_flag == WQ_IMMEDIATE_CALL_SCHEDULED));
1920*8d741a5dSApple OSS Distributions 
1921*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_add_timer | DBG_FUNC_START, wq, _wq_flags(wq),
1922*8d741a5dSApple OSS Distributions 	    wq->wq_nthreads, wq->wq_thidlecount);
1923*8d741a5dSApple OSS Distributions 
1924*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
1925*8d741a5dSApple OSS Distributions 
1926*8d741a5dSApple OSS Distributions 	wq->wq_thread_call_last_run = mach_absolute_time();
1927*8d741a5dSApple OSS Distributions 	os_atomic_andnot(&wq->wq_flags, my_flag, release);
1928*8d741a5dSApple OSS Distributions 
1929*8d741a5dSApple OSS Distributions 	/* This can drop the workqueue lock, and take it again */
1930*8d741a5dSApple OSS Distributions 	workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
1931*8d741a5dSApple OSS Distributions 
1932*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
1933*8d741a5dSApple OSS Distributions 
1934*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_add_timer | DBG_FUNC_END, wq, 0,
1935*8d741a5dSApple OSS Distributions 	    wq->wq_nthreads, wq->wq_thidlecount);
1936*8d741a5dSApple OSS Distributions }
1937*8d741a5dSApple OSS Distributions 
1938*8d741a5dSApple OSS Distributions #pragma mark thread state tracking
1939*8d741a5dSApple OSS Distributions 
1940*8d741a5dSApple OSS Distributions static void
workq_sched_callback(int type,thread_t thread)1941*8d741a5dSApple OSS Distributions workq_sched_callback(int type, thread_t thread)
1942*8d741a5dSApple OSS Distributions {
1943*8d741a5dSApple OSS Distributions 	thread_ro_t tro = get_thread_ro(thread);
1944*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
1945*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(tro->tro_proc);
1946*8d741a5dSApple OSS Distributions 	thread_qos_t req_qos, qos = uth->uu_workq_pri.qos_bucket;
1947*8d741a5dSApple OSS Distributions 	wq_thactive_t old_thactive;
1948*8d741a5dSApple OSS Distributions 	bool start_timer = false;
1949*8d741a5dSApple OSS Distributions 
1950*8d741a5dSApple OSS Distributions 	if (qos == WORKQ_THREAD_QOS_MANAGER) {
1951*8d741a5dSApple OSS Distributions 		return;
1952*8d741a5dSApple OSS Distributions 	}
1953*8d741a5dSApple OSS Distributions 
1954*8d741a5dSApple OSS Distributions 	switch (type) {
1955*8d741a5dSApple OSS Distributions 	case SCHED_CALL_BLOCK:
1956*8d741a5dSApple OSS Distributions 		old_thactive = _wq_thactive_dec(wq, qos);
1957*8d741a5dSApple OSS Distributions 		req_qos = WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(old_thactive);
1958*8d741a5dSApple OSS Distributions 
1959*8d741a5dSApple OSS Distributions 		/*
1960*8d741a5dSApple OSS Distributions 		 * Remember the timestamp of the last thread that blocked in this
1961*8d741a5dSApple OSS Distributions 		 * bucket, it used used by admission checks to ignore one thread
1962*8d741a5dSApple OSS Distributions 		 * being inactive if this timestamp is recent enough.
1963*8d741a5dSApple OSS Distributions 		 *
1964*8d741a5dSApple OSS Distributions 		 * If we collide with another thread trying to update the
1965*8d741a5dSApple OSS Distributions 		 * last_blocked (really unlikely since another thread would have to
1966*8d741a5dSApple OSS Distributions 		 * get scheduled and then block after we start down this path), it's
1967*8d741a5dSApple OSS Distributions 		 * not a problem.  Either timestamp is adequate, so no need to retry
1968*8d741a5dSApple OSS Distributions 		 */
1969*8d741a5dSApple OSS Distributions 		os_atomic_store_wide(&wq->wq_lastblocked_ts[_wq_bucket(qos)],
1970*8d741a5dSApple OSS Distributions 		    thread_last_run_time(thread), relaxed);
1971*8d741a5dSApple OSS Distributions 
1972*8d741a5dSApple OSS Distributions 		if (req_qos == THREAD_QOS_UNSPECIFIED) {
1973*8d741a5dSApple OSS Distributions 			/*
1974*8d741a5dSApple OSS Distributions 			 * No pending request at the moment we could unblock, move on.
1975*8d741a5dSApple OSS Distributions 			 */
1976*8d741a5dSApple OSS Distributions 		} else if (qos < req_qos) {
1977*8d741a5dSApple OSS Distributions 			/*
1978*8d741a5dSApple OSS Distributions 			 * The blocking thread is at a lower QoS than the highest currently
1979*8d741a5dSApple OSS Distributions 			 * pending constrained request, nothing has to be redriven
1980*8d741a5dSApple OSS Distributions 			 */
1981*8d741a5dSApple OSS Distributions 		} else {
1982*8d741a5dSApple OSS Distributions 			uint32_t max_busycount, old_req_count;
1983*8d741a5dSApple OSS Distributions 			old_req_count = _wq_thactive_aggregate_downto_qos(wq, old_thactive,
1984*8d741a5dSApple OSS Distributions 			    req_qos, NULL, &max_busycount);
1985*8d741a5dSApple OSS Distributions 			/*
1986*8d741a5dSApple OSS Distributions 			 * If it is possible that may_start_constrained_thread had refused
1987*8d741a5dSApple OSS Distributions 			 * admission due to being over the max concurrency, we may need to
1988*8d741a5dSApple OSS Distributions 			 * spin up a new thread.
1989*8d741a5dSApple OSS Distributions 			 *
1990*8d741a5dSApple OSS Distributions 			 * We take into account the maximum number of busy threads
1991*8d741a5dSApple OSS Distributions 			 * that can affect may_start_constrained_thread as looking at the
1992*8d741a5dSApple OSS Distributions 			 * actual number may_start_constrained_thread will see is racy.
1993*8d741a5dSApple OSS Distributions 			 *
1994*8d741a5dSApple OSS Distributions 			 * IOW at NCPU = 4, for IN (req_qos = 1), if the old req count is
1995*8d741a5dSApple OSS Distributions 			 * between NCPU (4) and NCPU - 2 (2) we need to redrive.
1996*8d741a5dSApple OSS Distributions 			 */
1997*8d741a5dSApple OSS Distributions 			uint32_t conc = wq_max_parallelism[_wq_bucket(qos)];
1998*8d741a5dSApple OSS Distributions 			if (old_req_count <= conc && conc <= old_req_count + max_busycount) {
1999*8d741a5dSApple OSS Distributions 				start_timer = workq_schedule_delayed_thread_creation(wq, 0);
2000*8d741a5dSApple OSS Distributions 			}
2001*8d741a5dSApple OSS Distributions 		}
2002*8d741a5dSApple OSS Distributions 		if (__improbable(kdebug_enable)) {
2003*8d741a5dSApple OSS Distributions 			__unused uint32_t old = _wq_thactive_aggregate_downto_qos(wq,
2004*8d741a5dSApple OSS Distributions 			    old_thactive, qos, NULL, NULL);
2005*8d741a5dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_thread_block | DBG_FUNC_START, wq,
2006*8d741a5dSApple OSS Distributions 			    old - 1, qos | (req_qos << 8),
2007*8d741a5dSApple OSS Distributions 			    wq->wq_reqcount << 1 | start_timer);
2008*8d741a5dSApple OSS Distributions 		}
2009*8d741a5dSApple OSS Distributions 		break;
2010*8d741a5dSApple OSS Distributions 
2011*8d741a5dSApple OSS Distributions 	case SCHED_CALL_UNBLOCK:
2012*8d741a5dSApple OSS Distributions 		/*
2013*8d741a5dSApple OSS Distributions 		 * we cannot take the workqueue_lock here...
2014*8d741a5dSApple OSS Distributions 		 * an UNBLOCK can occur from a timer event which
2015*8d741a5dSApple OSS Distributions 		 * is run from an interrupt context... if the workqueue_lock
2016*8d741a5dSApple OSS Distributions 		 * is already held by this processor, we'll deadlock...
2017*8d741a5dSApple OSS Distributions 		 * the thread lock for the thread being UNBLOCKED
2018*8d741a5dSApple OSS Distributions 		 * is also held
2019*8d741a5dSApple OSS Distributions 		 */
2020*8d741a5dSApple OSS Distributions 		old_thactive = _wq_thactive_inc(wq, qos);
2021*8d741a5dSApple OSS Distributions 		if (__improbable(kdebug_enable)) {
2022*8d741a5dSApple OSS Distributions 			__unused uint32_t old = _wq_thactive_aggregate_downto_qos(wq,
2023*8d741a5dSApple OSS Distributions 			    old_thactive, qos, NULL, NULL);
2024*8d741a5dSApple OSS Distributions 			req_qos = WQ_THACTIVE_BEST_CONSTRAINED_REQ_QOS(old_thactive);
2025*8d741a5dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_thread_block | DBG_FUNC_END, wq,
2026*8d741a5dSApple OSS Distributions 			    old + 1, qos | (req_qos << 8),
2027*8d741a5dSApple OSS Distributions 			    wq->wq_threads_scheduled);
2028*8d741a5dSApple OSS Distributions 		}
2029*8d741a5dSApple OSS Distributions 		break;
2030*8d741a5dSApple OSS Distributions 	}
2031*8d741a5dSApple OSS Distributions }
2032*8d741a5dSApple OSS Distributions 
2033*8d741a5dSApple OSS Distributions #pragma mark workq lifecycle
2034*8d741a5dSApple OSS Distributions 
/*
 * Take an additional reference on the workqueue by retaining wq_refcnt.
 */
void
workq_reference(struct workqueue *wq)
{
	os_ref_retain(&wq->wq_refcnt);
}
2040*8d741a5dSApple OSS Distributions 
2041*8d741a5dSApple OSS Distributions static void
workq_deallocate_queue_invoke(mpsc_queue_chain_t e,__assert_only mpsc_daemon_queue_t dq)2042*8d741a5dSApple OSS Distributions workq_deallocate_queue_invoke(mpsc_queue_chain_t e,
2043*8d741a5dSApple OSS Distributions     __assert_only mpsc_daemon_queue_t dq)
2044*8d741a5dSApple OSS Distributions {
2045*8d741a5dSApple OSS Distributions 	struct workqueue *wq;
2046*8d741a5dSApple OSS Distributions 	struct turnstile *ts;
2047*8d741a5dSApple OSS Distributions 
2048*8d741a5dSApple OSS Distributions 	wq = mpsc_queue_element(e, struct workqueue, wq_destroy_link);
2049*8d741a5dSApple OSS Distributions 	assert(dq == &workq_deallocate_queue);
2050*8d741a5dSApple OSS Distributions 
2051*8d741a5dSApple OSS Distributions 	turnstile_complete((uintptr_t)wq, &wq->wq_turnstile, &ts, TURNSTILE_WORKQS);
2052*8d741a5dSApple OSS Distributions 	assert(ts);
2053*8d741a5dSApple OSS Distributions 	turnstile_cleanup();
2054*8d741a5dSApple OSS Distributions 	turnstile_deallocate(ts);
2055*8d741a5dSApple OSS Distributions 
2056*8d741a5dSApple OSS Distributions 	lck_ticket_destroy(&wq->wq_lock, &workq_lck_grp);
2057*8d741a5dSApple OSS Distributions 	zfree(workq_zone_workqueue, wq);
2058*8d741a5dSApple OSS Distributions }
2059*8d741a5dSApple OSS Distributions 
2060*8d741a5dSApple OSS Distributions static void
workq_deallocate(struct workqueue * wq)2061*8d741a5dSApple OSS Distributions workq_deallocate(struct workqueue *wq)
2062*8d741a5dSApple OSS Distributions {
2063*8d741a5dSApple OSS Distributions 	if (os_ref_release_relaxed(&wq->wq_refcnt) == 0) {
2064*8d741a5dSApple OSS Distributions 		workq_deallocate_queue_invoke(&wq->wq_destroy_link,
2065*8d741a5dSApple OSS Distributions 		    &workq_deallocate_queue);
2066*8d741a5dSApple OSS Distributions 	}
2067*8d741a5dSApple OSS Distributions }
2068*8d741a5dSApple OSS Distributions 
2069*8d741a5dSApple OSS Distributions void
workq_deallocate_safe(struct workqueue * wq)2070*8d741a5dSApple OSS Distributions workq_deallocate_safe(struct workqueue *wq)
2071*8d741a5dSApple OSS Distributions {
2072*8d741a5dSApple OSS Distributions 	if (__improbable(os_ref_release_relaxed(&wq->wq_refcnt) == 0)) {
2073*8d741a5dSApple OSS Distributions 		mpsc_daemon_enqueue(&workq_deallocate_queue, &wq->wq_destroy_link,
2074*8d741a5dSApple OSS Distributions 		    MPSC_QUEUE_DISABLE_PREEMPTION);
2075*8d741a5dSApple OSS Distributions 	}
2076*8d741a5dSApple OSS Distributions }
2077*8d741a5dSApple OSS Distributions 
2078*8d741a5dSApple OSS Distributions /**
2079*8d741a5dSApple OSS Distributions  * Setup per-process state for the workqueue.
2080*8d741a5dSApple OSS Distributions  */
2081*8d741a5dSApple OSS Distributions int
workq_open(struct proc * p,__unused struct workq_open_args * uap,__unused int32_t * retval)2082*8d741a5dSApple OSS Distributions workq_open(struct proc *p, __unused struct workq_open_args *uap,
2083*8d741a5dSApple OSS Distributions     __unused int32_t *retval)
2084*8d741a5dSApple OSS Distributions {
2085*8d741a5dSApple OSS Distributions 	struct workqueue *wq;
2086*8d741a5dSApple OSS Distributions 	int error = 0;
2087*8d741a5dSApple OSS Distributions 
2088*8d741a5dSApple OSS Distributions 	if ((p->p_lflag & P_LREGISTER) == 0) {
2089*8d741a5dSApple OSS Distributions 		return EINVAL;
2090*8d741a5dSApple OSS Distributions 	}
2091*8d741a5dSApple OSS Distributions 
2092*8d741a5dSApple OSS Distributions 	if (wq_init_constrained_limit) {
2093*8d741a5dSApple OSS Distributions 		uint32_t limit, num_cpus = ml_wait_max_cpus();
2094*8d741a5dSApple OSS Distributions 
2095*8d741a5dSApple OSS Distributions 		/*
2096*8d741a5dSApple OSS Distributions 		 * set up the limit for the constrained pool
2097*8d741a5dSApple OSS Distributions 		 * this is a virtual pool in that we don't
2098*8d741a5dSApple OSS Distributions 		 * maintain it on a separate idle and run list
2099*8d741a5dSApple OSS Distributions 		 */
2100*8d741a5dSApple OSS Distributions 		limit = num_cpus * WORKQUEUE_CONSTRAINED_FACTOR;
2101*8d741a5dSApple OSS Distributions 
2102*8d741a5dSApple OSS Distributions 		if (limit > wq_max_constrained_threads) {
2103*8d741a5dSApple OSS Distributions 			wq_max_constrained_threads = limit;
2104*8d741a5dSApple OSS Distributions 		}
2105*8d741a5dSApple OSS Distributions 
2106*8d741a5dSApple OSS Distributions 		if (wq_max_threads > WQ_THACTIVE_BUCKET_HALF) {
2107*8d741a5dSApple OSS Distributions 			wq_max_threads = WQ_THACTIVE_BUCKET_HALF;
2108*8d741a5dSApple OSS Distributions 		}
2109*8d741a5dSApple OSS Distributions 		if (wq_max_threads > CONFIG_THREAD_MAX - 20) {
2110*8d741a5dSApple OSS Distributions 			wq_max_threads = CONFIG_THREAD_MAX - 20;
2111*8d741a5dSApple OSS Distributions 		}
2112*8d741a5dSApple OSS Distributions 
2113*8d741a5dSApple OSS Distributions 		wq_death_max_load = (uint16_t)fls(num_cpus) + 1;
2114*8d741a5dSApple OSS Distributions 
2115*8d741a5dSApple OSS Distributions 		for (thread_qos_t qos = WORKQ_THREAD_QOS_MIN; qos <= WORKQ_THREAD_QOS_MAX; qos++) {
2116*8d741a5dSApple OSS Distributions 			wq_max_parallelism[_wq_bucket(qos)] =
2117*8d741a5dSApple OSS Distributions 			    qos_max_parallelism(qos, QOS_PARALLELISM_COUNT_LOGICAL);
2118*8d741a5dSApple OSS Distributions 		}
2119*8d741a5dSApple OSS Distributions 
2120*8d741a5dSApple OSS Distributions 		wq_max_cooperative_threads = num_cpus;
2121*8d741a5dSApple OSS Distributions 
2122*8d741a5dSApple OSS Distributions 		wq_init_constrained_limit = 0;
2123*8d741a5dSApple OSS Distributions 	}
2124*8d741a5dSApple OSS Distributions 
2125*8d741a5dSApple OSS Distributions 	if (proc_get_wqptr(p) == NULL) {
2126*8d741a5dSApple OSS Distributions 		if (proc_init_wqptr_or_wait(p) == FALSE) {
2127*8d741a5dSApple OSS Distributions 			assert(proc_get_wqptr(p) != NULL);
2128*8d741a5dSApple OSS Distributions 			goto out;
2129*8d741a5dSApple OSS Distributions 		}
2130*8d741a5dSApple OSS Distributions 
2131*8d741a5dSApple OSS Distributions 		wq = zalloc_flags(workq_zone_workqueue, Z_WAITOK | Z_ZERO);
2132*8d741a5dSApple OSS Distributions 
2133*8d741a5dSApple OSS Distributions 		os_ref_init_count(&wq->wq_refcnt, &workq_refgrp, 1);
2134*8d741a5dSApple OSS Distributions 
2135*8d741a5dSApple OSS Distributions 		// Start the event manager at the priority hinted at by the policy engine
2136*8d741a5dSApple OSS Distributions 		thread_qos_t mgr_priority_hint = task_get_default_manager_qos(current_task());
2137*8d741a5dSApple OSS Distributions 		pthread_priority_t pp = _pthread_priority_make_from_thread_qos(mgr_priority_hint, 0, 0);
2138*8d741a5dSApple OSS Distributions 		wq->wq_event_manager_priority = (uint32_t)pp;
2139*8d741a5dSApple OSS Distributions 		wq->wq_timer_interval = (uint32_t)wq_stalled_window.abstime;
2140*8d741a5dSApple OSS Distributions 		wq->wq_proc = p;
2141*8d741a5dSApple OSS Distributions 		turnstile_prepare((uintptr_t)wq, &wq->wq_turnstile, turnstile_alloc(),
2142*8d741a5dSApple OSS Distributions 		    TURNSTILE_WORKQS);
2143*8d741a5dSApple OSS Distributions 
2144*8d741a5dSApple OSS Distributions 		TAILQ_INIT(&wq->wq_thrunlist);
2145*8d741a5dSApple OSS Distributions 		TAILQ_INIT(&wq->wq_thnewlist);
2146*8d741a5dSApple OSS Distributions 		TAILQ_INIT(&wq->wq_thidlelist);
2147*8d741a5dSApple OSS Distributions 		priority_queue_init(&wq->wq_overcommit_queue);
2148*8d741a5dSApple OSS Distributions 		priority_queue_init(&wq->wq_constrained_queue);
2149*8d741a5dSApple OSS Distributions 		priority_queue_init(&wq->wq_special_queue);
2150*8d741a5dSApple OSS Distributions 		for (int bucket = 0; bucket < WORKQ_NUM_QOS_BUCKETS; bucket++) {
2151*8d741a5dSApple OSS Distributions 			STAILQ_INIT(&wq->wq_cooperative_queue[bucket]);
2152*8d741a5dSApple OSS Distributions 		}
2153*8d741a5dSApple OSS Distributions 
2154*8d741a5dSApple OSS Distributions 		/* We are only using the delayed thread call for the constrained pool
2155*8d741a5dSApple OSS Distributions 		 * which can't have work at >= UI QoS and so we can be fine with a
2156*8d741a5dSApple OSS Distributions 		 * UI QoS thread call.
2157*8d741a5dSApple OSS Distributions 		 */
2158*8d741a5dSApple OSS Distributions 		wq->wq_delayed_call = thread_call_allocate_with_qos(
2159*8d741a5dSApple OSS Distributions 			workq_add_new_threads_call, p, THREAD_QOS_USER_INTERACTIVE,
2160*8d741a5dSApple OSS Distributions 			THREAD_CALL_OPTIONS_ONCE);
2161*8d741a5dSApple OSS Distributions 		wq->wq_immediate_call = thread_call_allocate_with_options(
2162*8d741a5dSApple OSS Distributions 			workq_add_new_threads_call, p, THREAD_CALL_PRIORITY_KERNEL,
2163*8d741a5dSApple OSS Distributions 			THREAD_CALL_OPTIONS_ONCE);
2164*8d741a5dSApple OSS Distributions 		wq->wq_death_call = thread_call_allocate_with_options(
2165*8d741a5dSApple OSS Distributions 			workq_kill_old_threads_call, wq,
2166*8d741a5dSApple OSS Distributions 			THREAD_CALL_PRIORITY_USER, THREAD_CALL_OPTIONS_ONCE);
2167*8d741a5dSApple OSS Distributions 
2168*8d741a5dSApple OSS Distributions 		lck_ticket_init(&wq->wq_lock, &workq_lck_grp);
2169*8d741a5dSApple OSS Distributions 
2170*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_create | DBG_FUNC_NONE, wq,
2171*8d741a5dSApple OSS Distributions 		    VM_KERNEL_ADDRHIDE(wq), 0, 0);
2172*8d741a5dSApple OSS Distributions 		proc_set_wqptr(p, wq);
2173*8d741a5dSApple OSS Distributions 	}
2174*8d741a5dSApple OSS Distributions out:
2175*8d741a5dSApple OSS Distributions 
2176*8d741a5dSApple OSS Distributions 	return error;
2177*8d741a5dSApple OSS Distributions }
2178*8d741a5dSApple OSS Distributions 
2179*8d741a5dSApple OSS Distributions /*
2180*8d741a5dSApple OSS Distributions  * Routine:	workq_mark_exiting
2181*8d741a5dSApple OSS Distributions  *
2182*8d741a5dSApple OSS Distributions  * Function:	Mark the work queue such that new threads will not be added to the
2183*8d741a5dSApple OSS Distributions  *		work queue after we return.
2184*8d741a5dSApple OSS Distributions  *
2185*8d741a5dSApple OSS Distributions  * Conditions:	Called against the current process.
2186*8d741a5dSApple OSS Distributions  */
2187*8d741a5dSApple OSS Distributions void
workq_mark_exiting(struct proc * p)2188*8d741a5dSApple OSS Distributions workq_mark_exiting(struct proc *p)
2189*8d741a5dSApple OSS Distributions {
2190*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2191*8d741a5dSApple OSS Distributions 	uint32_t wq_flags;
2192*8d741a5dSApple OSS Distributions 	workq_threadreq_t mgr_req;
2193*8d741a5dSApple OSS Distributions 
2194*8d741a5dSApple OSS Distributions 	if (!wq) {
2195*8d741a5dSApple OSS Distributions 		return;
2196*8d741a5dSApple OSS Distributions 	}
2197*8d741a5dSApple OSS Distributions 
2198*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_pthread_exit | DBG_FUNC_START, wq, 0, 0, 0);
2199*8d741a5dSApple OSS Distributions 
2200*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
2201*8d741a5dSApple OSS Distributions 
2202*8d741a5dSApple OSS Distributions 	wq_flags = os_atomic_or_orig(&wq->wq_flags, WQ_EXITING, relaxed);
2203*8d741a5dSApple OSS Distributions 	if (__improbable(wq_flags & WQ_EXITING)) {
2204*8d741a5dSApple OSS Distributions 		panic("workq_mark_exiting called twice");
2205*8d741a5dSApple OSS Distributions 	}
2206*8d741a5dSApple OSS Distributions 
2207*8d741a5dSApple OSS Distributions 	/*
2208*8d741a5dSApple OSS Distributions 	 * Opportunistically try to cancel thread calls that are likely in flight.
2209*8d741a5dSApple OSS Distributions 	 * workq_exit() will do the proper cleanup.
2210*8d741a5dSApple OSS Distributions 	 */
2211*8d741a5dSApple OSS Distributions 	if (wq_flags & WQ_IMMEDIATE_CALL_SCHEDULED) {
2212*8d741a5dSApple OSS Distributions 		thread_call_cancel(wq->wq_immediate_call);
2213*8d741a5dSApple OSS Distributions 	}
2214*8d741a5dSApple OSS Distributions 	if (wq_flags & WQ_DELAYED_CALL_SCHEDULED) {
2215*8d741a5dSApple OSS Distributions 		thread_call_cancel(wq->wq_delayed_call);
2216*8d741a5dSApple OSS Distributions 	}
2217*8d741a5dSApple OSS Distributions 	if (wq_flags & WQ_DEATH_CALL_SCHEDULED) {
2218*8d741a5dSApple OSS Distributions 		thread_call_cancel(wq->wq_death_call);
2219*8d741a5dSApple OSS Distributions 	}
2220*8d741a5dSApple OSS Distributions 
2221*8d741a5dSApple OSS Distributions 	mgr_req = wq->wq_event_manager_threadreq;
2222*8d741a5dSApple OSS Distributions 	wq->wq_event_manager_threadreq = NULL;
2223*8d741a5dSApple OSS Distributions 	wq->wq_reqcount = 0; /* workq_schedule_creator must not look at queues */
2224*8d741a5dSApple OSS Distributions 	wq->wq_creator = NULL;
2225*8d741a5dSApple OSS Distributions 	workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
2226*8d741a5dSApple OSS Distributions 
2227*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
2228*8d741a5dSApple OSS Distributions 
2229*8d741a5dSApple OSS Distributions 	if (mgr_req) {
2230*8d741a5dSApple OSS Distributions 		kqueue_threadreq_cancel(p, mgr_req);
2231*8d741a5dSApple OSS Distributions 	}
2232*8d741a5dSApple OSS Distributions 	/*
2233*8d741a5dSApple OSS Distributions 	 * No one touches the priority queues once WQ_EXITING is set.
2234*8d741a5dSApple OSS Distributions 	 * It is hence safe to do the tear down without holding any lock.
2235*8d741a5dSApple OSS Distributions 	 */
2236*8d741a5dSApple OSS Distributions 	priority_queue_destroy(&wq->wq_overcommit_queue,
2237*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry, ^(workq_threadreq_t e){
2238*8d741a5dSApple OSS Distributions 		workq_threadreq_destroy(p, e);
2239*8d741a5dSApple OSS Distributions 	});
2240*8d741a5dSApple OSS Distributions 	priority_queue_destroy(&wq->wq_constrained_queue,
2241*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry, ^(workq_threadreq_t e){
2242*8d741a5dSApple OSS Distributions 		workq_threadreq_destroy(p, e);
2243*8d741a5dSApple OSS Distributions 	});
2244*8d741a5dSApple OSS Distributions 	priority_queue_destroy(&wq->wq_special_queue,
2245*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry, ^(workq_threadreq_t e){
2246*8d741a5dSApple OSS Distributions 		workq_threadreq_destroy(p, e);
2247*8d741a5dSApple OSS Distributions 	});
2248*8d741a5dSApple OSS Distributions 
2249*8d741a5dSApple OSS Distributions 	WQ_TRACE(TRACE_wq_pthread_exit | DBG_FUNC_END, 0, 0, 0, 0);
2250*8d741a5dSApple OSS Distributions }
2251*8d741a5dSApple OSS Distributions 
2252*8d741a5dSApple OSS Distributions /*
2253*8d741a5dSApple OSS Distributions  * Routine:	workq_exit
2254*8d741a5dSApple OSS Distributions  *
2255*8d741a5dSApple OSS Distributions  * Function:	clean up the work queue structure(s) now that there are no threads
2256*8d741a5dSApple OSS Distributions  *		left running inside the work queue (except possibly current_thread).
2257*8d741a5dSApple OSS Distributions  *
2258*8d741a5dSApple OSS Distributions  * Conditions:	Called by the last thread in the process.
2259*8d741a5dSApple OSS Distributions  *		Called against current process.
2260*8d741a5dSApple OSS Distributions  */
2261*8d741a5dSApple OSS Distributions void
workq_exit(struct proc * p)2262*8d741a5dSApple OSS Distributions workq_exit(struct proc *p)
2263*8d741a5dSApple OSS Distributions {
2264*8d741a5dSApple OSS Distributions 	struct workqueue *wq;
2265*8d741a5dSApple OSS Distributions 	struct uthread *uth, *tmp;
2266*8d741a5dSApple OSS Distributions 
2267*8d741a5dSApple OSS Distributions 	wq = os_atomic_xchg(&p->p_wqptr, NULL, relaxed);
2268*8d741a5dSApple OSS Distributions 	if (wq != NULL) {
2269*8d741a5dSApple OSS Distributions 		thread_t th = current_thread();
2270*8d741a5dSApple OSS Distributions 
2271*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_workqueue_exit | DBG_FUNC_START, wq, 0, 0, 0);
2272*8d741a5dSApple OSS Distributions 
2273*8d741a5dSApple OSS Distributions 		if (thread_get_tag(th) & THREAD_TAG_WORKQUEUE) {
2274*8d741a5dSApple OSS Distributions 			/*
2275*8d741a5dSApple OSS Distributions 			 * <rdar://problem/40111515> Make sure we will no longer call the
2276*8d741a5dSApple OSS Distributions 			 * sched call, if we ever block this thread, which the cancel_wait
2277*8d741a5dSApple OSS Distributions 			 * below can do.
2278*8d741a5dSApple OSS Distributions 			 */
2279*8d741a5dSApple OSS Distributions 			thread_sched_call(th, NULL);
2280*8d741a5dSApple OSS Distributions 		}
2281*8d741a5dSApple OSS Distributions 
2282*8d741a5dSApple OSS Distributions 		/*
2283*8d741a5dSApple OSS Distributions 		 * Thread calls are always scheduled by the proc itself or under the
2284*8d741a5dSApple OSS Distributions 		 * workqueue spinlock if WQ_EXITING is not yet set.
2285*8d741a5dSApple OSS Distributions 		 *
2286*8d741a5dSApple OSS Distributions 		 * Either way, when this runs, the proc has no threads left beside
2287*8d741a5dSApple OSS Distributions 		 * the one running this very code, so we know no thread call can be
2288*8d741a5dSApple OSS Distributions 		 * dispatched anymore.
2289*8d741a5dSApple OSS Distributions 		 */
2290*8d741a5dSApple OSS Distributions 		thread_call_cancel_wait(wq->wq_delayed_call);
2291*8d741a5dSApple OSS Distributions 		thread_call_cancel_wait(wq->wq_immediate_call);
2292*8d741a5dSApple OSS Distributions 		thread_call_cancel_wait(wq->wq_death_call);
2293*8d741a5dSApple OSS Distributions 		thread_call_free(wq->wq_delayed_call);
2294*8d741a5dSApple OSS Distributions 		thread_call_free(wq->wq_immediate_call);
2295*8d741a5dSApple OSS Distributions 		thread_call_free(wq->wq_death_call);
2296*8d741a5dSApple OSS Distributions 
2297*8d741a5dSApple OSS Distributions 		/*
2298*8d741a5dSApple OSS Distributions 		 * Clean up workqueue data structures for threads that exited and
2299*8d741a5dSApple OSS Distributions 		 * didn't get a chance to clean up after themselves.
2300*8d741a5dSApple OSS Distributions 		 *
2301*8d741a5dSApple OSS Distributions 		 * idle/new threads should have been interrupted and died on their own
2302*8d741a5dSApple OSS Distributions 		 */
2303*8d741a5dSApple OSS Distributions 		TAILQ_FOREACH_SAFE(uth, &wq->wq_thrunlist, uu_workq_entry, tmp) {
2304*8d741a5dSApple OSS Distributions 			thread_t mth = get_machthread(uth);
2305*8d741a5dSApple OSS Distributions 			thread_sched_call(mth, NULL);
2306*8d741a5dSApple OSS Distributions 			thread_deallocate(mth);
2307*8d741a5dSApple OSS Distributions 		}
2308*8d741a5dSApple OSS Distributions 		assert(TAILQ_EMPTY(&wq->wq_thnewlist));
2309*8d741a5dSApple OSS Distributions 		assert(TAILQ_EMPTY(&wq->wq_thidlelist));
2310*8d741a5dSApple OSS Distributions 
2311*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_destroy | DBG_FUNC_END, wq,
2312*8d741a5dSApple OSS Distributions 		    VM_KERNEL_ADDRHIDE(wq), 0, 0);
2313*8d741a5dSApple OSS Distributions 
2314*8d741a5dSApple OSS Distributions 		workq_deallocate(wq);
2315*8d741a5dSApple OSS Distributions 
2316*8d741a5dSApple OSS Distributions 		WQ_TRACE(TRACE_wq_workqueue_exit | DBG_FUNC_END, 0, 0, 0, 0);
2317*8d741a5dSApple OSS Distributions 	}
2318*8d741a5dSApple OSS Distributions }
2319*8d741a5dSApple OSS Distributions 
2320*8d741a5dSApple OSS Distributions 
2321*8d741a5dSApple OSS Distributions #pragma mark bsd thread control
2322*8d741a5dSApple OSS Distributions 
2323*8d741a5dSApple OSS Distributions bool
bsdthread_part_of_cooperative_workqueue(struct uthread * uth)2324*8d741a5dSApple OSS Distributions bsdthread_part_of_cooperative_workqueue(struct uthread *uth)
2325*8d741a5dSApple OSS Distributions {
2326*8d741a5dSApple OSS Distributions 	return (workq_thread_is_cooperative(uth) || workq_thread_is_nonovercommit(uth)) &&
2327*8d741a5dSApple OSS Distributions 	       (uth->uu_workq_pri.qos_bucket != WORKQ_THREAD_QOS_MANAGER) &&
2328*8d741a5dSApple OSS Distributions 	       (!workq_thread_is_permanently_bound(uth));
2329*8d741a5dSApple OSS Distributions }
2330*8d741a5dSApple OSS Distributions 
2331*8d741a5dSApple OSS Distributions static bool
_pthread_priority_to_policy(pthread_priority_t priority,thread_qos_policy_data_t * data)2332*8d741a5dSApple OSS Distributions _pthread_priority_to_policy(pthread_priority_t priority,
2333*8d741a5dSApple OSS Distributions     thread_qos_policy_data_t *data)
2334*8d741a5dSApple OSS Distributions {
2335*8d741a5dSApple OSS Distributions 	data->qos_tier = _pthread_priority_thread_qos(priority);
2336*8d741a5dSApple OSS Distributions 	data->tier_importance = _pthread_priority_relpri(priority);
2337*8d741a5dSApple OSS Distributions 	if (data->qos_tier == THREAD_QOS_UNSPECIFIED || data->tier_importance > 0 ||
2338*8d741a5dSApple OSS Distributions 	    data->tier_importance < THREAD_QOS_MIN_TIER_IMPORTANCE) {
2339*8d741a5dSApple OSS Distributions 		return false;
2340*8d741a5dSApple OSS Distributions 	}
2341*8d741a5dSApple OSS Distributions 	return true;
2342*8d741a5dSApple OSS Distributions }
2343*8d741a5dSApple OSS Distributions 
2344*8d741a5dSApple OSS Distributions static int
bsdthread_set_self(proc_t p,thread_t th,pthread_priority_t priority,mach_port_name_t voucher,enum workq_set_self_flags flags)2345*8d741a5dSApple OSS Distributions bsdthread_set_self(proc_t p, thread_t th, pthread_priority_t priority,
2346*8d741a5dSApple OSS Distributions     mach_port_name_t voucher, enum workq_set_self_flags flags)
2347*8d741a5dSApple OSS Distributions {
2348*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
2349*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2350*8d741a5dSApple OSS Distributions 
2351*8d741a5dSApple OSS Distributions 	kern_return_t kr;
2352*8d741a5dSApple OSS Distributions 	int unbind_rv = 0, qos_rv = 0, voucher_rv = 0, fixedpri_rv = 0;
2353*8d741a5dSApple OSS Distributions 	bool is_wq_thread = (thread_get_tag(th) & THREAD_TAG_WORKQUEUE);
2354*8d741a5dSApple OSS Distributions 
2355*8d741a5dSApple OSS Distributions 	assert(th == current_thread());
2356*8d741a5dSApple OSS Distributions 	if (flags & WORKQ_SET_SELF_WQ_KEVENT_UNBIND) {
2357*8d741a5dSApple OSS Distributions 		if (!is_wq_thread) {
2358*8d741a5dSApple OSS Distributions 			unbind_rv = EINVAL;
2359*8d741a5dSApple OSS Distributions 			goto qos;
2360*8d741a5dSApple OSS Distributions 		}
2361*8d741a5dSApple OSS Distributions 
2362*8d741a5dSApple OSS Distributions 		if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER) {
2363*8d741a5dSApple OSS Distributions 			unbind_rv = EINVAL;
2364*8d741a5dSApple OSS Distributions 			goto qos;
2365*8d741a5dSApple OSS Distributions 		}
2366*8d741a5dSApple OSS Distributions 
2367*8d741a5dSApple OSS Distributions 		workq_threadreq_t kqr = uth->uu_kqr_bound;
2368*8d741a5dSApple OSS Distributions 		if (kqr == NULL) {
2369*8d741a5dSApple OSS Distributions 			unbind_rv = EALREADY;
2370*8d741a5dSApple OSS Distributions 			goto qos;
2371*8d741a5dSApple OSS Distributions 		}
2372*8d741a5dSApple OSS Distributions 
2373*8d741a5dSApple OSS Distributions 		if (kqr->tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
2374*8d741a5dSApple OSS Distributions 			unbind_rv = EINVAL;
2375*8d741a5dSApple OSS Distributions 			goto qos;
2376*8d741a5dSApple OSS Distributions 		}
2377*8d741a5dSApple OSS Distributions 
2378*8d741a5dSApple OSS Distributions 		kqueue_threadreq_unbind(p, kqr);
2379*8d741a5dSApple OSS Distributions 	}
2380*8d741a5dSApple OSS Distributions 
2381*8d741a5dSApple OSS Distributions qos:
2382*8d741a5dSApple OSS Distributions 	if (flags & (WORKQ_SET_SELF_QOS_FLAG | WORKQ_SET_SELF_QOS_OVERRIDE_FLAG)) {
2383*8d741a5dSApple OSS Distributions 		assert(flags & WORKQ_SET_SELF_QOS_FLAG);
2384*8d741a5dSApple OSS Distributions 
2385*8d741a5dSApple OSS Distributions 		thread_qos_policy_data_t new_policy;
2386*8d741a5dSApple OSS Distributions 		thread_qos_t qos_override = THREAD_QOS_UNSPECIFIED;
2387*8d741a5dSApple OSS Distributions 
2388*8d741a5dSApple OSS Distributions 		if (!_pthread_priority_to_policy(priority, &new_policy)) {
2389*8d741a5dSApple OSS Distributions 			qos_rv = EINVAL;
2390*8d741a5dSApple OSS Distributions 			goto voucher;
2391*8d741a5dSApple OSS Distributions 		}
2392*8d741a5dSApple OSS Distributions 
2393*8d741a5dSApple OSS Distributions 		if (flags & WORKQ_SET_SELF_QOS_OVERRIDE_FLAG) {
2394*8d741a5dSApple OSS Distributions 			/*
2395*8d741a5dSApple OSS Distributions 			 * If the WORKQ_SET_SELF_QOS_OVERRIDE_FLAG is set, we definitely
2396*8d741a5dSApple OSS Distributions 			 * should have an override QoS in the pthread_priority_t and we should
2397*8d741a5dSApple OSS Distributions 			 * only come into this path for cooperative thread requests
2398*8d741a5dSApple OSS Distributions 			 */
2399*8d741a5dSApple OSS Distributions 			if (!_pthread_priority_has_override_qos(priority) ||
2400*8d741a5dSApple OSS Distributions 			    !_pthread_priority_is_cooperative(priority)) {
2401*8d741a5dSApple OSS Distributions 				qos_rv = EINVAL;
2402*8d741a5dSApple OSS Distributions 				goto voucher;
2403*8d741a5dSApple OSS Distributions 			}
2404*8d741a5dSApple OSS Distributions 			qos_override = _pthread_priority_thread_override_qos(priority);
2405*8d741a5dSApple OSS Distributions 		} else {
2406*8d741a5dSApple OSS Distributions 			/*
2407*8d741a5dSApple OSS Distributions 			 * If the WORKQ_SET_SELF_QOS_OVERRIDE_FLAG is not set, we definitely
2408*8d741a5dSApple OSS Distributions 			 * should not have an override QoS in the pthread_priority_t
2409*8d741a5dSApple OSS Distributions 			 */
2410*8d741a5dSApple OSS Distributions 			if (_pthread_priority_has_override_qos(priority)) {
2411*8d741a5dSApple OSS Distributions 				qos_rv = EINVAL;
2412*8d741a5dSApple OSS Distributions 				goto voucher;
2413*8d741a5dSApple OSS Distributions 			}
2414*8d741a5dSApple OSS Distributions 		}
2415*8d741a5dSApple OSS Distributions 
2416*8d741a5dSApple OSS Distributions 		if (!is_wq_thread) {
2417*8d741a5dSApple OSS Distributions 			/*
2418*8d741a5dSApple OSS Distributions 			 * Threads opted out of QoS can't change QoS
2419*8d741a5dSApple OSS Distributions 			 */
2420*8d741a5dSApple OSS Distributions 			if (!thread_has_qos_policy(th)) {
2421*8d741a5dSApple OSS Distributions 				qos_rv = EPERM;
2422*8d741a5dSApple OSS Distributions 				goto voucher;
2423*8d741a5dSApple OSS Distributions 			}
2424*8d741a5dSApple OSS Distributions 		} else if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER ||
2425*8d741a5dSApple OSS Distributions 		    uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_ABOVEUI) {
2426*8d741a5dSApple OSS Distributions 			/*
2427*8d741a5dSApple OSS Distributions 			 * Workqueue manager threads or threads above UI can't change QoS
2428*8d741a5dSApple OSS Distributions 			 */
2429*8d741a5dSApple OSS Distributions 			qos_rv = EINVAL;
2430*8d741a5dSApple OSS Distributions 			goto voucher;
2431*8d741a5dSApple OSS Distributions 		} else {
2432*8d741a5dSApple OSS Distributions 			/*
2433*8d741a5dSApple OSS Distributions 			 * For workqueue threads, possibly adjust buckets and redrive thread
2434*8d741a5dSApple OSS Distributions 			 * requests.
2435*8d741a5dSApple OSS Distributions 			 *
2436*8d741a5dSApple OSS Distributions 			 * Transitions allowed:
2437*8d741a5dSApple OSS Distributions 			 *
2438*8d741a5dSApple OSS Distributions 			 * overcommit --> non-overcommit
2439*8d741a5dSApple OSS Distributions 			 * overcommit --> overcommit
2440*8d741a5dSApple OSS Distributions 			 * non-overcommit --> non-overcommit
2441*8d741a5dSApple OSS Distributions 			 * non-overcommit --> overcommit (to be deprecated later)
2442*8d741a5dSApple OSS Distributions 			 * cooperative --> cooperative
2443*8d741a5dSApple OSS Distributions 			 *
2444*8d741a5dSApple OSS Distributions 			 * All other transitions aren't allowed so reject them.
2445*8d741a5dSApple OSS Distributions 			 */
2446*8d741a5dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth) && _pthread_priority_is_cooperative(priority)) {
2447*8d741a5dSApple OSS Distributions 				qos_rv = EINVAL;
2448*8d741a5dSApple OSS Distributions 				goto voucher;
2449*8d741a5dSApple OSS Distributions 			} else if (workq_thread_is_cooperative(uth) && !_pthread_priority_is_cooperative(priority)) {
2450*8d741a5dSApple OSS Distributions 				qos_rv = EINVAL;
2451*8d741a5dSApple OSS Distributions 				goto voucher;
2452*8d741a5dSApple OSS Distributions 			} else if (workq_thread_is_nonovercommit(uth) && _pthread_priority_is_cooperative(priority)) {
2453*8d741a5dSApple OSS Distributions 				qos_rv = EINVAL;
2454*8d741a5dSApple OSS Distributions 				goto voucher;
2455*8d741a5dSApple OSS Distributions 			}
2456*8d741a5dSApple OSS Distributions 
2457*8d741a5dSApple OSS Distributions 			struct uu_workq_policy old_pri, new_pri;
2458*8d741a5dSApple OSS Distributions 			bool force_run = false;
2459*8d741a5dSApple OSS Distributions 
2460*8d741a5dSApple OSS Distributions 			if (qos_override) {
2461*8d741a5dSApple OSS Distributions 				/*
2462*8d741a5dSApple OSS Distributions 				 * We're in the case of a thread clarifying that it is for eg. not IN
2463*8d741a5dSApple OSS Distributions 				 * req QoS but rather, UT req QoS with IN override. However, this can
2464*8d741a5dSApple OSS Distributions 				 * race with a concurrent override happening to the thread via
2465*8d741a5dSApple OSS Distributions 				 * workq_thread_add_dispatch_override so this needs to be
2466*8d741a5dSApple OSS Distributions 				 * synchronized with the thread mutex.
2467*8d741a5dSApple OSS Distributions 				 */
2468*8d741a5dSApple OSS Distributions 				thread_mtx_lock(th);
2469*8d741a5dSApple OSS Distributions 			}
2470*8d741a5dSApple OSS Distributions 
2471*8d741a5dSApple OSS Distributions 			workq_lock_spin(wq);
2472*8d741a5dSApple OSS Distributions 
2473*8d741a5dSApple OSS Distributions 			old_pri = new_pri = uth->uu_workq_pri;
2474*8d741a5dSApple OSS Distributions 			new_pri.qos_req = (thread_qos_t)new_policy.qos_tier;
2475*8d741a5dSApple OSS Distributions 
2476*8d741a5dSApple OSS Distributions 			if (old_pri.qos_override < qos_override) {
2477*8d741a5dSApple OSS Distributions 				/*
2478*8d741a5dSApple OSS Distributions 				 * Since this can race with a concurrent override via
2479*8d741a5dSApple OSS Distributions 				 * workq_thread_add_dispatch_override, only adjust override value if we
2480*8d741a5dSApple OSS Distributions 				 * are higher - this is a saturating function.
2481*8d741a5dSApple OSS Distributions 				 *
2482*8d741a5dSApple OSS Distributions 				 * We should not be changing the final override values, we should simply
2483*8d741a5dSApple OSS Distributions 				 * be redistributing the current value with a different breakdown of req
2484*8d741a5dSApple OSS Distributions 				 * vs override QoS - assert to that effect. Therefore, buckets should
2485*8d741a5dSApple OSS Distributions 				 * not change.
2486*8d741a5dSApple OSS Distributions 				 */
2487*8d741a5dSApple OSS Distributions 				new_pri.qos_override = qos_override;
2488*8d741a5dSApple OSS Distributions 				assert(workq_pri_override(new_pri) == workq_pri_override(old_pri));
2489*8d741a5dSApple OSS Distributions 				assert(workq_pri_bucket(new_pri) == workq_pri_bucket(old_pri));
2490*8d741a5dSApple OSS Distributions 			}
2491*8d741a5dSApple OSS Distributions 
2492*8d741a5dSApple OSS Distributions 			/* Adjust schedule counts for various types of transitions */
2493*8d741a5dSApple OSS Distributions 
2494*8d741a5dSApple OSS Distributions 			/* overcommit -> non-overcommit */
2495*8d741a5dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth) && _pthread_priority_is_nonovercommit(priority)) {
2496*8d741a5dSApple OSS Distributions 				workq_thread_set_type(uth, 0);
2497*8d741a5dSApple OSS Distributions 				wq->wq_constrained_threads_scheduled++;
2498*8d741a5dSApple OSS Distributions 
2499*8d741a5dSApple OSS Distributions 				/* non-overcommit -> overcommit */
2500*8d741a5dSApple OSS Distributions 			} else if (workq_thread_is_nonovercommit(uth) && _pthread_priority_is_overcommit(priority)) {
2501*8d741a5dSApple OSS Distributions 				workq_thread_set_type(uth, UT_WORKQ_OVERCOMMIT);
2502*8d741a5dSApple OSS Distributions 				force_run = (wq->wq_constrained_threads_scheduled-- == wq_max_constrained_threads);
2503*8d741a5dSApple OSS Distributions 
2504*8d741a5dSApple OSS Distributions 				/* cooperative -> cooperative */
2505*8d741a5dSApple OSS Distributions 			} else if (workq_thread_is_cooperative(uth)) {
2506*8d741a5dSApple OSS Distributions 				_wq_cooperative_queue_scheduled_count_dec(wq, old_pri.qos_req);
2507*8d741a5dSApple OSS Distributions 				_wq_cooperative_queue_scheduled_count_inc(wq, new_pri.qos_req);
2508*8d741a5dSApple OSS Distributions 
2509*8d741a5dSApple OSS Distributions 				/* We're changing schedule counts within cooperative pool, we
2510*8d741a5dSApple OSS Distributions 				 * need to refresh best cooperative QoS logic again */
2511*8d741a5dSApple OSS Distributions 				force_run = _wq_cooperative_queue_refresh_best_req_qos(wq);
2512*8d741a5dSApple OSS Distributions 			}
2513*8d741a5dSApple OSS Distributions 
2514*8d741a5dSApple OSS Distributions 			/*
2515*8d741a5dSApple OSS Distributions 			 * This will set up an override on the thread if any and will also call
2516*8d741a5dSApple OSS Distributions 			 * schedule_creator if needed
2517*8d741a5dSApple OSS Distributions 			 */
2518*8d741a5dSApple OSS Distributions 			workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, force_run);
2519*8d741a5dSApple OSS Distributions 			workq_unlock(wq);
2520*8d741a5dSApple OSS Distributions 
2521*8d741a5dSApple OSS Distributions 			if (qos_override) {
2522*8d741a5dSApple OSS Distributions 				thread_mtx_unlock(th);
2523*8d741a5dSApple OSS Distributions 			}
2524*8d741a5dSApple OSS Distributions 
2525*8d741a5dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth)) {
2526*8d741a5dSApple OSS Distributions 				thread_disarm_workqueue_quantum(th);
2527*8d741a5dSApple OSS Distributions 			} else {
2528*8d741a5dSApple OSS Distributions 				/* If the thread changed QoS buckets, the quantum duration
2529*8d741a5dSApple OSS Distributions 				 * may have changed too */
2530*8d741a5dSApple OSS Distributions 				thread_arm_workqueue_quantum(th);
2531*8d741a5dSApple OSS Distributions 			}
2532*8d741a5dSApple OSS Distributions 		}
2533*8d741a5dSApple OSS Distributions 
2534*8d741a5dSApple OSS Distributions 		kr = thread_policy_set_internal(th, THREAD_QOS_POLICY,
2535*8d741a5dSApple OSS Distributions 		    (thread_policy_t)&new_policy, THREAD_QOS_POLICY_COUNT);
2536*8d741a5dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2537*8d741a5dSApple OSS Distributions 			qos_rv = EINVAL;
2538*8d741a5dSApple OSS Distributions 		}
2539*8d741a5dSApple OSS Distributions 	}
2540*8d741a5dSApple OSS Distributions 
2541*8d741a5dSApple OSS Distributions voucher:
2542*8d741a5dSApple OSS Distributions 	if (flags & WORKQ_SET_SELF_VOUCHER_FLAG) {
2543*8d741a5dSApple OSS Distributions 		kr = thread_set_voucher_name(voucher);
2544*8d741a5dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2545*8d741a5dSApple OSS Distributions 			voucher_rv = ENOENT;
2546*8d741a5dSApple OSS Distributions 			goto fixedpri;
2547*8d741a5dSApple OSS Distributions 		}
2548*8d741a5dSApple OSS Distributions 	}
2549*8d741a5dSApple OSS Distributions 
2550*8d741a5dSApple OSS Distributions fixedpri:
2551*8d741a5dSApple OSS Distributions 	if (qos_rv) {
2552*8d741a5dSApple OSS Distributions 		goto done;
2553*8d741a5dSApple OSS Distributions 	}
2554*8d741a5dSApple OSS Distributions 	if (flags & WORKQ_SET_SELF_FIXEDPRIORITY_FLAG) {
2555*8d741a5dSApple OSS Distributions 		thread_extended_policy_data_t extpol = {.timeshare = 0};
2556*8d741a5dSApple OSS Distributions 
2557*8d741a5dSApple OSS Distributions 		if (is_wq_thread) {
2558*8d741a5dSApple OSS Distributions 			/* Not allowed on workqueue threads */
2559*8d741a5dSApple OSS Distributions 			fixedpri_rv = ENOTSUP;
2560*8d741a5dSApple OSS Distributions 			goto done;
2561*8d741a5dSApple OSS Distributions 		}
2562*8d741a5dSApple OSS Distributions 
2563*8d741a5dSApple OSS Distributions 		kr = thread_policy_set_internal(th, THREAD_EXTENDED_POLICY,
2564*8d741a5dSApple OSS Distributions 		    (thread_policy_t)&extpol, THREAD_EXTENDED_POLICY_COUNT);
2565*8d741a5dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2566*8d741a5dSApple OSS Distributions 			fixedpri_rv = EINVAL;
2567*8d741a5dSApple OSS Distributions 			goto done;
2568*8d741a5dSApple OSS Distributions 		}
2569*8d741a5dSApple OSS Distributions 	} else if (flags & WORKQ_SET_SELF_TIMESHARE_FLAG) {
2570*8d741a5dSApple OSS Distributions 		thread_extended_policy_data_t extpol = {.timeshare = 1};
2571*8d741a5dSApple OSS Distributions 
2572*8d741a5dSApple OSS Distributions 		if (is_wq_thread) {
2573*8d741a5dSApple OSS Distributions 			/* Not allowed on workqueue threads */
2574*8d741a5dSApple OSS Distributions 			fixedpri_rv = ENOTSUP;
2575*8d741a5dSApple OSS Distributions 			goto done;
2576*8d741a5dSApple OSS Distributions 		}
2577*8d741a5dSApple OSS Distributions 
2578*8d741a5dSApple OSS Distributions 		kr = thread_policy_set_internal(th, THREAD_EXTENDED_POLICY,
2579*8d741a5dSApple OSS Distributions 		    (thread_policy_t)&extpol, THREAD_EXTENDED_POLICY_COUNT);
2580*8d741a5dSApple OSS Distributions 		if (kr != KERN_SUCCESS) {
2581*8d741a5dSApple OSS Distributions 			fixedpri_rv = EINVAL;
2582*8d741a5dSApple OSS Distributions 			goto done;
2583*8d741a5dSApple OSS Distributions 		}
2584*8d741a5dSApple OSS Distributions 	}
2585*8d741a5dSApple OSS Distributions 
2586*8d741a5dSApple OSS Distributions done:
2587*8d741a5dSApple OSS Distributions 	if (qos_rv && voucher_rv) {
2588*8d741a5dSApple OSS Distributions 		/* Both failed, give that a unique error. */
2589*8d741a5dSApple OSS Distributions 		return EBADMSG;
2590*8d741a5dSApple OSS Distributions 	}
2591*8d741a5dSApple OSS Distributions 
2592*8d741a5dSApple OSS Distributions 	if (unbind_rv) {
2593*8d741a5dSApple OSS Distributions 		return unbind_rv;
2594*8d741a5dSApple OSS Distributions 	}
2595*8d741a5dSApple OSS Distributions 
2596*8d741a5dSApple OSS Distributions 	if (qos_rv) {
2597*8d741a5dSApple OSS Distributions 		return qos_rv;
2598*8d741a5dSApple OSS Distributions 	}
2599*8d741a5dSApple OSS Distributions 
2600*8d741a5dSApple OSS Distributions 	if (voucher_rv) {
2601*8d741a5dSApple OSS Distributions 		return voucher_rv;
2602*8d741a5dSApple OSS Distributions 	}
2603*8d741a5dSApple OSS Distributions 
2604*8d741a5dSApple OSS Distributions 	if (fixedpri_rv) {
2605*8d741a5dSApple OSS Distributions 		return fixedpri_rv;
2606*8d741a5dSApple OSS Distributions 	}
2607*8d741a5dSApple OSS Distributions 
2608*8d741a5dSApple OSS Distributions 
2609*8d741a5dSApple OSS Distributions 	return 0;
2610*8d741a5dSApple OSS Distributions }
2611*8d741a5dSApple OSS Distributions 
2612*8d741a5dSApple OSS Distributions static int
bsdthread_add_explicit_override(proc_t p,mach_port_name_t kport,pthread_priority_t pp,user_addr_t resource)2613*8d741a5dSApple OSS Distributions bsdthread_add_explicit_override(proc_t p, mach_port_name_t kport,
2614*8d741a5dSApple OSS Distributions     pthread_priority_t pp, user_addr_t resource)
2615*8d741a5dSApple OSS Distributions {
2616*8d741a5dSApple OSS Distributions 	thread_qos_t qos = _pthread_priority_thread_qos(pp);
2617*8d741a5dSApple OSS Distributions 	if (qos == THREAD_QOS_UNSPECIFIED) {
2618*8d741a5dSApple OSS Distributions 		return EINVAL;
2619*8d741a5dSApple OSS Distributions 	}
2620*8d741a5dSApple OSS Distributions 
2621*8d741a5dSApple OSS Distributions 	thread_t th = port_name_to_thread(kport,
2622*8d741a5dSApple OSS Distributions 	    PORT_INTRANS_THREAD_IN_CURRENT_TASK);
2623*8d741a5dSApple OSS Distributions 	if (th == THREAD_NULL) {
2624*8d741a5dSApple OSS Distributions 		return ESRCH;
2625*8d741a5dSApple OSS Distributions 	}
2626*8d741a5dSApple OSS Distributions 
2627*8d741a5dSApple OSS Distributions 	int rv = proc_thread_qos_add_override(proc_task(p), th, 0, qos, TRUE,
2628*8d741a5dSApple OSS Distributions 	    resource, THREAD_QOS_OVERRIDE_TYPE_PTHREAD_EXPLICIT_OVERRIDE);
2629*8d741a5dSApple OSS Distributions 
2630*8d741a5dSApple OSS Distributions 	thread_deallocate(th);
2631*8d741a5dSApple OSS Distributions 	return rv;
2632*8d741a5dSApple OSS Distributions }
2633*8d741a5dSApple OSS Distributions 
2634*8d741a5dSApple OSS Distributions static int
bsdthread_remove_explicit_override(proc_t p,mach_port_name_t kport,user_addr_t resource)2635*8d741a5dSApple OSS Distributions bsdthread_remove_explicit_override(proc_t p, mach_port_name_t kport,
2636*8d741a5dSApple OSS Distributions     user_addr_t resource)
2637*8d741a5dSApple OSS Distributions {
2638*8d741a5dSApple OSS Distributions 	thread_t th = port_name_to_thread(kport,
2639*8d741a5dSApple OSS Distributions 	    PORT_INTRANS_THREAD_IN_CURRENT_TASK);
2640*8d741a5dSApple OSS Distributions 	if (th == THREAD_NULL) {
2641*8d741a5dSApple OSS Distributions 		return ESRCH;
2642*8d741a5dSApple OSS Distributions 	}
2643*8d741a5dSApple OSS Distributions 
2644*8d741a5dSApple OSS Distributions 	int rv = proc_thread_qos_remove_override(proc_task(p), th, 0, resource,
2645*8d741a5dSApple OSS Distributions 	    THREAD_QOS_OVERRIDE_TYPE_PTHREAD_EXPLICIT_OVERRIDE);
2646*8d741a5dSApple OSS Distributions 
2647*8d741a5dSApple OSS Distributions 	thread_deallocate(th);
2648*8d741a5dSApple OSS Distributions 	return rv;
2649*8d741a5dSApple OSS Distributions }
2650*8d741a5dSApple OSS Distributions 
2651*8d741a5dSApple OSS Distributions static int
workq_thread_add_dispatch_override(proc_t p,mach_port_name_t kport,pthread_priority_t pp,user_addr_t ulock_addr)2652*8d741a5dSApple OSS Distributions workq_thread_add_dispatch_override(proc_t p, mach_port_name_t kport,
2653*8d741a5dSApple OSS Distributions     pthread_priority_t pp, user_addr_t ulock_addr)
2654*8d741a5dSApple OSS Distributions {
2655*8d741a5dSApple OSS Distributions 	struct uu_workq_policy old_pri, new_pri;
2656*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2657*8d741a5dSApple OSS Distributions 
2658*8d741a5dSApple OSS Distributions 	thread_qos_t qos_override = _pthread_priority_thread_qos(pp);
2659*8d741a5dSApple OSS Distributions 	if (qos_override == THREAD_QOS_UNSPECIFIED) {
2660*8d741a5dSApple OSS Distributions 		return EINVAL;
2661*8d741a5dSApple OSS Distributions 	}
2662*8d741a5dSApple OSS Distributions 
2663*8d741a5dSApple OSS Distributions 	thread_t thread = port_name_to_thread(kport,
2664*8d741a5dSApple OSS Distributions 	    PORT_INTRANS_THREAD_IN_CURRENT_TASK);
2665*8d741a5dSApple OSS Distributions 	if (thread == THREAD_NULL) {
2666*8d741a5dSApple OSS Distributions 		return ESRCH;
2667*8d741a5dSApple OSS Distributions 	}
2668*8d741a5dSApple OSS Distributions 
2669*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
2670*8d741a5dSApple OSS Distributions 	if ((thread_get_tag(thread) & THREAD_TAG_WORKQUEUE) == 0) {
2671*8d741a5dSApple OSS Distributions 		thread_deallocate(thread);
2672*8d741a5dSApple OSS Distributions 		return EPERM;
2673*8d741a5dSApple OSS Distributions 	}
2674*8d741a5dSApple OSS Distributions 
2675*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_override_dispatch | DBG_FUNC_NONE,
2676*8d741a5dSApple OSS Distributions 	    wq, thread_tid(thread), 1, pp);
2677*8d741a5dSApple OSS Distributions 
2678*8d741a5dSApple OSS Distributions 	thread_mtx_lock(thread);
2679*8d741a5dSApple OSS Distributions 
2680*8d741a5dSApple OSS Distributions 	if (ulock_addr) {
2681*8d741a5dSApple OSS Distributions 		uint32_t val;
2682*8d741a5dSApple OSS Distributions 		int rc;
2683*8d741a5dSApple OSS Distributions 		/*
2684*8d741a5dSApple OSS Distributions 		 * Workaround lack of explicit support for 'no-fault copyin'
2685*8d741a5dSApple OSS Distributions 		 * <rdar://problem/24999882>, as disabling preemption prevents paging in
2686*8d741a5dSApple OSS Distributions 		 */
2687*8d741a5dSApple OSS Distributions 		disable_preemption();
2688*8d741a5dSApple OSS Distributions 		rc = copyin_atomic32(ulock_addr, &val);
2689*8d741a5dSApple OSS Distributions 		enable_preemption();
2690*8d741a5dSApple OSS Distributions 		if (rc == 0 && ulock_owner_value_to_port_name(val) != kport) {
2691*8d741a5dSApple OSS Distributions 			goto out;
2692*8d741a5dSApple OSS Distributions 		}
2693*8d741a5dSApple OSS Distributions 	}
2694*8d741a5dSApple OSS Distributions 
2695*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
2696*8d741a5dSApple OSS Distributions 
2697*8d741a5dSApple OSS Distributions 	old_pri = uth->uu_workq_pri;
2698*8d741a5dSApple OSS Distributions 	if (old_pri.qos_override >= qos_override) {
2699*8d741a5dSApple OSS Distributions 		/* Nothing to do */
2700*8d741a5dSApple OSS Distributions 	} else if (thread == current_thread()) {
2701*8d741a5dSApple OSS Distributions 		new_pri = old_pri;
2702*8d741a5dSApple OSS Distributions 		new_pri.qos_override = qos_override;
2703*8d741a5dSApple OSS Distributions 		workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, false);
2704*8d741a5dSApple OSS Distributions 	} else {
2705*8d741a5dSApple OSS Distributions 		uth->uu_workq_pri.qos_override = qos_override;
2706*8d741a5dSApple OSS Distributions 		if (qos_override > workq_pri_override(old_pri)) {
2707*8d741a5dSApple OSS Distributions 			thread_set_workq_override(thread, qos_override);
2708*8d741a5dSApple OSS Distributions 		}
2709*8d741a5dSApple OSS Distributions 	}
2710*8d741a5dSApple OSS Distributions 
2711*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
2712*8d741a5dSApple OSS Distributions 
2713*8d741a5dSApple OSS Distributions out:
2714*8d741a5dSApple OSS Distributions 	thread_mtx_unlock(thread);
2715*8d741a5dSApple OSS Distributions 	thread_deallocate(thread);
2716*8d741a5dSApple OSS Distributions 	return 0;
2717*8d741a5dSApple OSS Distributions }
2718*8d741a5dSApple OSS Distributions 
2719*8d741a5dSApple OSS Distributions static int
workq_thread_reset_dispatch_override(proc_t p,thread_t thread)2720*8d741a5dSApple OSS Distributions workq_thread_reset_dispatch_override(proc_t p, thread_t thread)
2721*8d741a5dSApple OSS Distributions {
2722*8d741a5dSApple OSS Distributions 	struct uu_workq_policy old_pri, new_pri;
2723*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2724*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
2725*8d741a5dSApple OSS Distributions 
2726*8d741a5dSApple OSS Distributions 	if ((thread_get_tag(thread) & THREAD_TAG_WORKQUEUE) == 0) {
2727*8d741a5dSApple OSS Distributions 		return EPERM;
2728*8d741a5dSApple OSS Distributions 	}
2729*8d741a5dSApple OSS Distributions 
2730*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_override_reset | DBG_FUNC_NONE, wq, 0, 0, 0);
2731*8d741a5dSApple OSS Distributions 
2732*8d741a5dSApple OSS Distributions 	/*
2733*8d741a5dSApple OSS Distributions 	 * workq_thread_add_dispatch_override takes the thread mutex before doing the
2734*8d741a5dSApple OSS Distributions 	 * copyin to validate the drainer and apply the override. We need to do the
2735*8d741a5dSApple OSS Distributions 	 * same here. See rdar://84472518
2736*8d741a5dSApple OSS Distributions 	 */
2737*8d741a5dSApple OSS Distributions 	thread_mtx_lock(thread);
2738*8d741a5dSApple OSS Distributions 
2739*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
2740*8d741a5dSApple OSS Distributions 	old_pri = new_pri = uth->uu_workq_pri;
2741*8d741a5dSApple OSS Distributions 	new_pri.qos_override = THREAD_QOS_UNSPECIFIED;
2742*8d741a5dSApple OSS Distributions 	workq_thread_update_bucket(p, wq, uth, old_pri, new_pri, false);
2743*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
2744*8d741a5dSApple OSS Distributions 
2745*8d741a5dSApple OSS Distributions 	thread_mtx_unlock(thread);
2746*8d741a5dSApple OSS Distributions 	return 0;
2747*8d741a5dSApple OSS Distributions }
2748*8d741a5dSApple OSS Distributions 
2749*8d741a5dSApple OSS Distributions static int
workq_thread_allow_kill(__unused proc_t p,thread_t thread,bool enable)2750*8d741a5dSApple OSS Distributions workq_thread_allow_kill(__unused proc_t p, thread_t thread, bool enable)
2751*8d741a5dSApple OSS Distributions {
2752*8d741a5dSApple OSS Distributions 	if (!(thread_get_tag(thread) & THREAD_TAG_WORKQUEUE)) {
2753*8d741a5dSApple OSS Distributions 		// If the thread isn't a workqueue thread, don't set the
2754*8d741a5dSApple OSS Distributions 		// kill_allowed bit; however, we still need to return 0
2755*8d741a5dSApple OSS Distributions 		// instead of an error code since this code is executed
2756*8d741a5dSApple OSS Distributions 		// on the abort path which needs to not depend on the
2757*8d741a5dSApple OSS Distributions 		// pthread_t (returning an error depends on pthread_t via
2758*8d741a5dSApple OSS Distributions 		// cerror_nocancel)
2759*8d741a5dSApple OSS Distributions 		return 0;
2760*8d741a5dSApple OSS Distributions 	}
2761*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
2762*8d741a5dSApple OSS Distributions 	uth->uu_workq_pthread_kill_allowed = enable;
2763*8d741a5dSApple OSS Distributions 	return 0;
2764*8d741a5dSApple OSS Distributions }
2765*8d741a5dSApple OSS Distributions 
2766*8d741a5dSApple OSS Distributions static int
workq_allow_sigmask(proc_t p,sigset_t mask)2767*8d741a5dSApple OSS Distributions workq_allow_sigmask(proc_t p, sigset_t mask)
2768*8d741a5dSApple OSS Distributions {
2769*8d741a5dSApple OSS Distributions 	if (mask & workq_threadmask) {
2770*8d741a5dSApple OSS Distributions 		return EINVAL;
2771*8d741a5dSApple OSS Distributions 	}
2772*8d741a5dSApple OSS Distributions 
2773*8d741a5dSApple OSS Distributions 	proc_lock(p);
2774*8d741a5dSApple OSS Distributions 	p->p_workq_allow_sigmask |= mask;
2775*8d741a5dSApple OSS Distributions 	proc_unlock(p);
2776*8d741a5dSApple OSS Distributions 
2777*8d741a5dSApple OSS Distributions 	return 0;
2778*8d741a5dSApple OSS Distributions }
2779*8d741a5dSApple OSS Distributions 
2780*8d741a5dSApple OSS Distributions static int
bsdthread_get_max_parallelism(thread_qos_t qos,unsigned long flags,int * retval)2781*8d741a5dSApple OSS Distributions bsdthread_get_max_parallelism(thread_qos_t qos, unsigned long flags,
2782*8d741a5dSApple OSS Distributions     int *retval)
2783*8d741a5dSApple OSS Distributions {
2784*8d741a5dSApple OSS Distributions 	static_assert(QOS_PARALLELISM_COUNT_LOGICAL ==
2785*8d741a5dSApple OSS Distributions 	    _PTHREAD_QOS_PARALLELISM_COUNT_LOGICAL, "logical");
2786*8d741a5dSApple OSS Distributions 	static_assert(QOS_PARALLELISM_REALTIME ==
2787*8d741a5dSApple OSS Distributions 	    _PTHREAD_QOS_PARALLELISM_REALTIME, "realtime");
2788*8d741a5dSApple OSS Distributions 	static_assert(QOS_PARALLELISM_CLUSTER_SHARED_RESOURCE ==
2789*8d741a5dSApple OSS Distributions 	    _PTHREAD_QOS_PARALLELISM_CLUSTER_SHARED_RSRC, "cluster shared resource");
2790*8d741a5dSApple OSS Distributions 
2791*8d741a5dSApple OSS Distributions 	if (flags & ~(QOS_PARALLELISM_REALTIME | QOS_PARALLELISM_COUNT_LOGICAL | QOS_PARALLELISM_CLUSTER_SHARED_RESOURCE)) {
2792*8d741a5dSApple OSS Distributions 		return EINVAL;
2793*8d741a5dSApple OSS Distributions 	}
2794*8d741a5dSApple OSS Distributions 
2795*8d741a5dSApple OSS Distributions 	/* No units are present */
2796*8d741a5dSApple OSS Distributions 	if (flags & QOS_PARALLELISM_CLUSTER_SHARED_RESOURCE) {
2797*8d741a5dSApple OSS Distributions 		return ENOTSUP;
2798*8d741a5dSApple OSS Distributions 	}
2799*8d741a5dSApple OSS Distributions 
2800*8d741a5dSApple OSS Distributions 	if (flags & QOS_PARALLELISM_REALTIME) {
2801*8d741a5dSApple OSS Distributions 		if (qos) {
2802*8d741a5dSApple OSS Distributions 			return EINVAL;
2803*8d741a5dSApple OSS Distributions 		}
2804*8d741a5dSApple OSS Distributions 	} else if (qos == THREAD_QOS_UNSPECIFIED || qos >= THREAD_QOS_LAST) {
2805*8d741a5dSApple OSS Distributions 		return EINVAL;
2806*8d741a5dSApple OSS Distributions 	}
2807*8d741a5dSApple OSS Distributions 
2808*8d741a5dSApple OSS Distributions 	*retval = qos_max_parallelism(qos, flags);
2809*8d741a5dSApple OSS Distributions 	return 0;
2810*8d741a5dSApple OSS Distributions }
2811*8d741a5dSApple OSS Distributions 
2812*8d741a5dSApple OSS Distributions static int
bsdthread_dispatch_apply_attr(__unused struct proc * p,thread_t thread,unsigned long flags,uint64_t value1,__unused uint64_t value2)2813*8d741a5dSApple OSS Distributions bsdthread_dispatch_apply_attr(__unused struct proc *p, thread_t thread,
2814*8d741a5dSApple OSS Distributions     unsigned long flags, uint64_t value1, __unused uint64_t value2)
2815*8d741a5dSApple OSS Distributions {
2816*8d741a5dSApple OSS Distributions 	uint32_t apply_worker_index;
2817*8d741a5dSApple OSS Distributions 	kern_return_t kr;
2818*8d741a5dSApple OSS Distributions 
2819*8d741a5dSApple OSS Distributions 	switch (flags) {
2820*8d741a5dSApple OSS Distributions 	case _PTHREAD_DISPATCH_APPLY_ATTR_CLUSTER_SHARED_RSRC_SET:
2821*8d741a5dSApple OSS Distributions 		apply_worker_index = (uint32_t)value1;
2822*8d741a5dSApple OSS Distributions 		kr = thread_shared_rsrc_policy_set(thread, apply_worker_index, CLUSTER_SHARED_RSRC_TYPE_RR, SHARED_RSRC_POLICY_AGENT_DISPATCH);
2823*8d741a5dSApple OSS Distributions 		/*
2824*8d741a5dSApple OSS Distributions 		 * KERN_INVALID_POLICY indicates that the thread was trying to bind to a
2825*8d741a5dSApple OSS Distributions 		 * cluster which it was not eligible to execute on.
2826*8d741a5dSApple OSS Distributions 		 */
2827*8d741a5dSApple OSS Distributions 		return (kr == KERN_SUCCESS) ? 0 : ((kr == KERN_INVALID_POLICY) ? ENOTSUP : EINVAL);
2828*8d741a5dSApple OSS Distributions 	case _PTHREAD_DISPATCH_APPLY_ATTR_CLUSTER_SHARED_RSRC_CLEAR:
2829*8d741a5dSApple OSS Distributions 		kr = thread_shared_rsrc_policy_clear(thread, CLUSTER_SHARED_RSRC_TYPE_RR, SHARED_RSRC_POLICY_AGENT_DISPATCH);
2830*8d741a5dSApple OSS Distributions 		return (kr == KERN_SUCCESS) ? 0 : EINVAL;
2831*8d741a5dSApple OSS Distributions 	default:
2832*8d741a5dSApple OSS Distributions 		return EINVAL;
2833*8d741a5dSApple OSS Distributions 	}
2834*8d741a5dSApple OSS Distributions }
2835*8d741a5dSApple OSS Distributions 
/*
 * Make the enclosing function return EINVAL when `arg` is non-zero.
 *
 * Used to reject reserved arguments that must be passed as 0. The macro
 * expands to a single statement (do/while(0)), so it must be followed by a
 * semicolon and composes safely with unbraced if/else. `arg` is evaluated
 * exactly once.
 */
#define ENSURE_UNUSED(arg) \
	        do { if ((arg) != 0) { return EINVAL; } } while (0)
2838*8d741a5dSApple OSS Distributions 
2839*8d741a5dSApple OSS Distributions int
bsdthread_ctl(struct proc * p,struct bsdthread_ctl_args * uap,int * retval)2840*8d741a5dSApple OSS Distributions bsdthread_ctl(struct proc *p, struct bsdthread_ctl_args *uap, int *retval)
2841*8d741a5dSApple OSS Distributions {
2842*8d741a5dSApple OSS Distributions 	switch (uap->cmd) {
2843*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_START:
2844*8d741a5dSApple OSS Distributions 		return bsdthread_add_explicit_override(p, (mach_port_name_t)uap->arg1,
2845*8d741a5dSApple OSS Distributions 		           (pthread_priority_t)uap->arg2, uap->arg3);
2846*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_END:
2847*8d741a5dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg3);
2848*8d741a5dSApple OSS Distributions 		return bsdthread_remove_explicit_override(p, (mach_port_name_t)uap->arg1,
2849*8d741a5dSApple OSS Distributions 		           (user_addr_t)uap->arg2);
2850*8d741a5dSApple OSS Distributions 
2851*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_DISPATCH:
2852*8d741a5dSApple OSS Distributions 		return workq_thread_add_dispatch_override(p, (mach_port_name_t)uap->arg1,
2853*8d741a5dSApple OSS Distributions 		           (pthread_priority_t)uap->arg2, uap->arg3);
2854*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_OVERRIDE_RESET:
2855*8d741a5dSApple OSS Distributions 		return workq_thread_reset_dispatch_override(p, current_thread());
2856*8d741a5dSApple OSS Distributions 
2857*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_SET_SELF:
2858*8d741a5dSApple OSS Distributions 		return bsdthread_set_self(p, current_thread(),
2859*8d741a5dSApple OSS Distributions 		           (pthread_priority_t)uap->arg1, (mach_port_name_t)uap->arg2,
2860*8d741a5dSApple OSS Distributions 		           (enum workq_set_self_flags)uap->arg3);
2861*8d741a5dSApple OSS Distributions 
2862*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_MAX_PARALLELISM:
2863*8d741a5dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg3);
2864*8d741a5dSApple OSS Distributions 		return bsdthread_get_max_parallelism((thread_qos_t)uap->arg1,
2865*8d741a5dSApple OSS Distributions 		           (unsigned long)uap->arg2, retval);
2866*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_WORKQ_ALLOW_KILL:
2867*8d741a5dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg2);
2868*8d741a5dSApple OSS Distributions 		ENSURE_UNUSED(uap->arg3);
2869*8d741a5dSApple OSS Distributions 		return workq_thread_allow_kill(p, current_thread(), (bool)uap->arg1);
2870*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_DISPATCH_APPLY_ATTR:
2871*8d741a5dSApple OSS Distributions 		return bsdthread_dispatch_apply_attr(p, current_thread(),
2872*8d741a5dSApple OSS Distributions 		           (unsigned long)uap->arg1, (uint64_t)uap->arg2,
2873*8d741a5dSApple OSS Distributions 		           (uint64_t)uap->arg3);
2874*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_WORKQ_ALLOW_SIGMASK:
2875*8d741a5dSApple OSS Distributions 		return workq_allow_sigmask(p, (int)uap->arg1);
2876*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_SET_QOS:
2877*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_DISPATCH_ASYNCHRONOUS_OVERRIDE_ADD:
2878*8d741a5dSApple OSS Distributions 	case BSDTHREAD_CTL_QOS_DISPATCH_ASYNCHRONOUS_OVERRIDE_RESET:
2879*8d741a5dSApple OSS Distributions 		/* no longer supported */
2880*8d741a5dSApple OSS Distributions 		return ENOTSUP;
2881*8d741a5dSApple OSS Distributions 
2882*8d741a5dSApple OSS Distributions 	default:
2883*8d741a5dSApple OSS Distributions 		return EINVAL;
2884*8d741a5dSApple OSS Distributions 	}
2885*8d741a5dSApple OSS Distributions }
2886*8d741a5dSApple OSS Distributions 
2887*8d741a5dSApple OSS Distributions #pragma mark workqueue thread manipulation
2888*8d741a5dSApple OSS Distributions 
2889*8d741a5dSApple OSS Distributions static void __dead2
2890*8d741a5dSApple OSS Distributions workq_unpark_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
2891*8d741a5dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags);
2892*8d741a5dSApple OSS Distributions 
2893*8d741a5dSApple OSS Distributions static void __dead2
2894*8d741a5dSApple OSS Distributions workq_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
2895*8d741a5dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags);
2896*8d741a5dSApple OSS Distributions 
2897*8d741a5dSApple OSS Distributions static void workq_setup_and_run(proc_t p, struct uthread *uth, int flags) __dead2;
2898*8d741a5dSApple OSS Distributions 
2899*8d741a5dSApple OSS Distributions #if KDEBUG_LEVEL >= KDEBUG_LEVEL_STANDARD
2900*8d741a5dSApple OSS Distributions static inline uint64_t
workq_trace_req_id(workq_threadreq_t req)2901*8d741a5dSApple OSS Distributions workq_trace_req_id(workq_threadreq_t req)
2902*8d741a5dSApple OSS Distributions {
2903*8d741a5dSApple OSS Distributions 	struct kqworkloop *kqwl;
2904*8d741a5dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
2905*8d741a5dSApple OSS Distributions 		kqwl = __container_of(req, struct kqworkloop, kqwl_request);
2906*8d741a5dSApple OSS Distributions 		return kqwl->kqwl_dynamicid;
2907*8d741a5dSApple OSS Distributions 	}
2908*8d741a5dSApple OSS Distributions 
2909*8d741a5dSApple OSS Distributions 	return VM_KERNEL_ADDRHIDE(req);
2910*8d741a5dSApple OSS Distributions }
2911*8d741a5dSApple OSS Distributions #endif
2912*8d741a5dSApple OSS Distributions 
2913*8d741a5dSApple OSS Distributions /**
2914*8d741a5dSApple OSS Distributions  * Entry point for libdispatch to ask for threads
2915*8d741a5dSApple OSS Distributions  */
2916*8d741a5dSApple OSS Distributions static int
workq_reqthreads(struct proc * p,uint32_t reqcount,pthread_priority_t pp,bool cooperative)2917*8d741a5dSApple OSS Distributions workq_reqthreads(struct proc *p, uint32_t reqcount, pthread_priority_t pp, bool cooperative)
2918*8d741a5dSApple OSS Distributions {
2919*8d741a5dSApple OSS Distributions 	thread_qos_t qos = _pthread_priority_thread_qos(pp);
2920*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
2921*8d741a5dSApple OSS Distributions 	uint32_t unpaced, upcall_flags = WQ_FLAG_THREAD_NEWSPI;
2922*8d741a5dSApple OSS Distributions 	int ret = 0;
2923*8d741a5dSApple OSS Distributions 
2924*8d741a5dSApple OSS Distributions 	if (wq == NULL || reqcount <= 0 || reqcount > UINT16_MAX ||
2925*8d741a5dSApple OSS Distributions 	    qos == THREAD_QOS_UNSPECIFIED) {
2926*8d741a5dSApple OSS Distributions 		ret = EINVAL;
2927*8d741a5dSApple OSS Distributions 		goto exit;
2928*8d741a5dSApple OSS Distributions 	}
2929*8d741a5dSApple OSS Distributions 
2930*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_wqops_reqthreads | DBG_FUNC_NONE,
2931*8d741a5dSApple OSS Distributions 	    wq, reqcount, pp, cooperative);
2932*8d741a5dSApple OSS Distributions 
2933*8d741a5dSApple OSS Distributions 	workq_threadreq_t req = zalloc(workq_zone_threadreq);
2934*8d741a5dSApple OSS Distributions 	priority_queue_entry_init(&req->tr_entry);
2935*8d741a5dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_NEW;
2936*8d741a5dSApple OSS Distributions 	req->tr_qos   = qos;
2937*8d741a5dSApple OSS Distributions 	workq_tr_flags_t tr_flags = 0;
2938*8d741a5dSApple OSS Distributions 
2939*8d741a5dSApple OSS Distributions 	if (pp & _PTHREAD_PRIORITY_OVERCOMMIT_FLAG) {
2940*8d741a5dSApple OSS Distributions 		tr_flags |= WORKQ_TR_FLAG_OVERCOMMIT;
2941*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
2942*8d741a5dSApple OSS Distributions 	}
2943*8d741a5dSApple OSS Distributions 
2944*8d741a5dSApple OSS Distributions 	if (cooperative) {
2945*8d741a5dSApple OSS Distributions 		tr_flags |= WORKQ_TR_FLAG_COOPERATIVE;
2946*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_COOPERATIVE;
2947*8d741a5dSApple OSS Distributions 
2948*8d741a5dSApple OSS Distributions 		if (reqcount > 1) {
2949*8d741a5dSApple OSS Distributions 			ret = ENOTSUP;
2950*8d741a5dSApple OSS Distributions 			goto free_and_exit;
2951*8d741a5dSApple OSS Distributions 		}
2952*8d741a5dSApple OSS Distributions 	}
2953*8d741a5dSApple OSS Distributions 
2954*8d741a5dSApple OSS Distributions 	/* A thread request cannot be both overcommit and cooperative */
2955*8d741a5dSApple OSS Distributions 	if (workq_tr_is_cooperative(tr_flags) &&
2956*8d741a5dSApple OSS Distributions 	    workq_tr_is_overcommit(tr_flags)) {
2957*8d741a5dSApple OSS Distributions 		ret = EINVAL;
2958*8d741a5dSApple OSS Distributions 		goto free_and_exit;
2959*8d741a5dSApple OSS Distributions 	}
2960*8d741a5dSApple OSS Distributions 	req->tr_flags = tr_flags;
2961*8d741a5dSApple OSS Distributions 
2962*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_request_initiate | DBG_FUNC_NONE,
2963*8d741a5dSApple OSS Distributions 	    wq, workq_trace_req_id(req), req->tr_qos, reqcount);
2964*8d741a5dSApple OSS Distributions 
2965*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
2966*8d741a5dSApple OSS Distributions 	do {
2967*8d741a5dSApple OSS Distributions 		if (_wq_exiting(wq)) {
2968*8d741a5dSApple OSS Distributions 			goto unlock_and_exit;
2969*8d741a5dSApple OSS Distributions 		}
2970*8d741a5dSApple OSS Distributions 
2971*8d741a5dSApple OSS Distributions 		/*
2972*8d741a5dSApple OSS Distributions 		 * When userspace is asking for parallelism, wakeup up to (reqcount - 1)
2973*8d741a5dSApple OSS Distributions 		 * threads without pacing, to inform the scheduler of that workload.
2974*8d741a5dSApple OSS Distributions 		 *
2975*8d741a5dSApple OSS Distributions 		 * The last requests, or the ones that failed the admission checks are
2976*8d741a5dSApple OSS Distributions 		 * enqueued and go through the regular creator codepath.
2977*8d741a5dSApple OSS Distributions 		 *
2978*8d741a5dSApple OSS Distributions 		 * If there aren't enough threads, add one, but re-evaluate everything
2979*8d741a5dSApple OSS Distributions 		 * as conditions may now have changed.
2980*8d741a5dSApple OSS Distributions 		 */
2981*8d741a5dSApple OSS Distributions 		unpaced = reqcount - 1;
2982*8d741a5dSApple OSS Distributions 
2983*8d741a5dSApple OSS Distributions 		if (reqcount > 1) {
2984*8d741a5dSApple OSS Distributions 			/* We don't handle asking for parallelism on the cooperative
2985*8d741a5dSApple OSS Distributions 			 * workqueue just yet */
2986*8d741a5dSApple OSS Distributions 			assert(!workq_threadreq_is_cooperative(req));
2987*8d741a5dSApple OSS Distributions 
2988*8d741a5dSApple OSS Distributions 			if (workq_threadreq_is_nonovercommit(req)) {
2989*8d741a5dSApple OSS Distributions 				unpaced = workq_constrained_allowance(wq, qos, NULL, false, true);
2990*8d741a5dSApple OSS Distributions 				if (unpaced >= reqcount - 1) {
2991*8d741a5dSApple OSS Distributions 					unpaced = reqcount - 1;
2992*8d741a5dSApple OSS Distributions 				}
2993*8d741a5dSApple OSS Distributions 			}
2994*8d741a5dSApple OSS Distributions 		}
2995*8d741a5dSApple OSS Distributions 
2996*8d741a5dSApple OSS Distributions 		/*
2997*8d741a5dSApple OSS Distributions 		 * This path does not currently handle custom workloop parameters
2998*8d741a5dSApple OSS Distributions 		 * when creating threads for parallelism.
2999*8d741a5dSApple OSS Distributions 		 */
3000*8d741a5dSApple OSS Distributions 		assert(!(req->tr_flags & WORKQ_TR_FLAG_WL_PARAMS));
3001*8d741a5dSApple OSS Distributions 
3002*8d741a5dSApple OSS Distributions 		/*
3003*8d741a5dSApple OSS Distributions 		 * This is a trimmed down version of workq_threadreq_bind_and_unlock()
3004*8d741a5dSApple OSS Distributions 		 */
3005*8d741a5dSApple OSS Distributions 		while (unpaced > 0 && wq->wq_thidlecount) {
3006*8d741a5dSApple OSS Distributions 			struct uthread *uth;
3007*8d741a5dSApple OSS Distributions 			bool needs_wakeup;
3008*8d741a5dSApple OSS Distributions 			uint8_t uu_flags = UT_WORKQ_EARLY_BOUND;
3009*8d741a5dSApple OSS Distributions 
3010*8d741a5dSApple OSS Distributions 			if (workq_tr_is_overcommit(req->tr_flags)) {
3011*8d741a5dSApple OSS Distributions 				uu_flags |= UT_WORKQ_OVERCOMMIT;
3012*8d741a5dSApple OSS Distributions 			}
3013*8d741a5dSApple OSS Distributions 
3014*8d741a5dSApple OSS Distributions 			uth = workq_pop_idle_thread(wq, uu_flags, &needs_wakeup);
3015*8d741a5dSApple OSS Distributions 
3016*8d741a5dSApple OSS Distributions 			_wq_thactive_inc(wq, qos);
3017*8d741a5dSApple OSS Distributions 			wq->wq_thscheduled_count[_wq_bucket(qos)]++;
3018*8d741a5dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
3019*8d741a5dSApple OSS Distributions 			wq->wq_fulfilled++;
3020*8d741a5dSApple OSS Distributions 
3021*8d741a5dSApple OSS Distributions 			uth->uu_save.uus_workq_park_data.upcall_flags = upcall_flags;
3022*8d741a5dSApple OSS Distributions 			uth->uu_save.uus_workq_park_data.thread_request = req;
3023*8d741a5dSApple OSS Distributions 			if (needs_wakeup) {
3024*8d741a5dSApple OSS Distributions 				workq_thread_wakeup(uth);
3025*8d741a5dSApple OSS Distributions 			}
3026*8d741a5dSApple OSS Distributions 			unpaced--;
3027*8d741a5dSApple OSS Distributions 			reqcount--;
3028*8d741a5dSApple OSS Distributions 		}
3029*8d741a5dSApple OSS Distributions 	} while (unpaced && wq->wq_nthreads < wq_max_threads &&
3030*8d741a5dSApple OSS Distributions 	    (workq_add_new_idle_thread(p, wq, workq_unpark_continue,
3031*8d741a5dSApple OSS Distributions 	    false, NULL) == KERN_SUCCESS));
3032*8d741a5dSApple OSS Distributions 
3033*8d741a5dSApple OSS Distributions 	if (_wq_exiting(wq)) {
3034*8d741a5dSApple OSS Distributions 		goto unlock_and_exit;
3035*8d741a5dSApple OSS Distributions 	}
3036*8d741a5dSApple OSS Distributions 
3037*8d741a5dSApple OSS Distributions 	req->tr_count = (uint16_t)reqcount;
3038*8d741a5dSApple OSS Distributions 	if (workq_threadreq_enqueue(wq, req)) {
3039*8d741a5dSApple OSS Distributions 		/* This can drop the workqueue lock, and take it again */
3040*8d741a5dSApple OSS Distributions 		workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
3041*8d741a5dSApple OSS Distributions 	}
3042*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3043*8d741a5dSApple OSS Distributions 	return 0;
3044*8d741a5dSApple OSS Distributions 
3045*8d741a5dSApple OSS Distributions unlock_and_exit:
3046*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3047*8d741a5dSApple OSS Distributions free_and_exit:
3048*8d741a5dSApple OSS Distributions 	zfree(workq_zone_threadreq, req);
3049*8d741a5dSApple OSS Distributions exit:
3050*8d741a5dSApple OSS Distributions 	return ret;
3051*8d741a5dSApple OSS Distributions }
3052*8d741a5dSApple OSS Distributions 
3053*8d741a5dSApple OSS Distributions bool
workq_kern_threadreq_initiate(struct proc * p,workq_threadreq_t req,struct turnstile * workloop_ts,thread_qos_t qos,workq_kern_threadreq_flags_t flags)3054*8d741a5dSApple OSS Distributions workq_kern_threadreq_initiate(struct proc *p, workq_threadreq_t req,
3055*8d741a5dSApple OSS Distributions     struct turnstile *workloop_ts, thread_qos_t qos,
3056*8d741a5dSApple OSS Distributions     workq_kern_threadreq_flags_t flags)
3057*8d741a5dSApple OSS Distributions {
3058*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3059*8d741a5dSApple OSS Distributions 	struct uthread *uth = NULL;
3060*8d741a5dSApple OSS Distributions 
3061*8d741a5dSApple OSS Distributions 	assert(req->tr_flags & (WORKQ_TR_FLAG_WORKLOOP | WORKQ_TR_FLAG_KEVENT));
3062*8d741a5dSApple OSS Distributions 
3063*8d741a5dSApple OSS Distributions 	/*
3064*8d741a5dSApple OSS Distributions 	 * For any new initialization changes done to workqueue thread request below,
3065*8d741a5dSApple OSS Distributions 	 * please also consider if they are relevant to permanently bound thread
3066*8d741a5dSApple OSS Distributions 	 * request. See workq_kern_threadreq_permanent_bind.
3067*8d741a5dSApple OSS Distributions 	 */
3068*8d741a5dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3069*8d741a5dSApple OSS Distributions 		workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(req);
3070*8d741a5dSApple OSS Distributions 		qos = thread_workq_qos_for_pri(trp.trp_pri);
3071*8d741a5dSApple OSS Distributions 		if (qos == THREAD_QOS_UNSPECIFIED) {
3072*8d741a5dSApple OSS Distributions 			qos = WORKQ_THREAD_QOS_ABOVEUI;
3073*8d741a5dSApple OSS Distributions 		}
3074*8d741a5dSApple OSS Distributions 	}
3075*8d741a5dSApple OSS Distributions 
3076*8d741a5dSApple OSS Distributions 	assert(req->tr_state == WORKQ_TR_STATE_IDLE);
3077*8d741a5dSApple OSS Distributions 	priority_queue_entry_init(&req->tr_entry);
3078*8d741a5dSApple OSS Distributions 	req->tr_count = 1;
3079*8d741a5dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_NEW;
3080*8d741a5dSApple OSS Distributions 	req->tr_qos   = qos;
3081*8d741a5dSApple OSS Distributions 
3082*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_request_initiate | DBG_FUNC_NONE, wq,
3083*8d741a5dSApple OSS Distributions 	    workq_trace_req_id(req), qos, 1);
3084*8d741a5dSApple OSS Distributions 
3085*8d741a5dSApple OSS Distributions 	if (flags & WORKQ_THREADREQ_ATTEMPT_REBIND) {
3086*8d741a5dSApple OSS Distributions 		/*
3087*8d741a5dSApple OSS Distributions 		 * we're called back synchronously from the context of
3088*8d741a5dSApple OSS Distributions 		 * kqueue_threadreq_unbind from within workq_thread_return()
3089*8d741a5dSApple OSS Distributions 		 * we can try to match up this thread with this request !
3090*8d741a5dSApple OSS Distributions 		 */
3091*8d741a5dSApple OSS Distributions 		uth = current_uthread();
3092*8d741a5dSApple OSS Distributions 		assert(uth->uu_kqr_bound == NULL);
3093*8d741a5dSApple OSS Distributions 	}
3094*8d741a5dSApple OSS Distributions 
3095*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
3096*8d741a5dSApple OSS Distributions 	if (_wq_exiting(wq)) {
3097*8d741a5dSApple OSS Distributions 		req->tr_state = WORKQ_TR_STATE_IDLE;
3098*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
3099*8d741a5dSApple OSS Distributions 		return false;
3100*8d741a5dSApple OSS Distributions 	}
3101*8d741a5dSApple OSS Distributions 
3102*8d741a5dSApple OSS Distributions 	if (uth && workq_threadreq_admissible(wq, uth, req)) {
3103*8d741a5dSApple OSS Distributions 		/* This is the case of the rebind - we were about to park and unbind
3104*8d741a5dSApple OSS Distributions 		 * when more events came so keep the binding.
3105*8d741a5dSApple OSS Distributions 		 */
3106*8d741a5dSApple OSS Distributions 		assert(uth != wq->wq_creator);
3107*8d741a5dSApple OSS Distributions 
3108*8d741a5dSApple OSS Distributions 		if (uth->uu_workq_pri.qos_bucket != req->tr_qos) {
3109*8d741a5dSApple OSS Distributions 			_wq_thactive_move(wq, uth->uu_workq_pri.qos_bucket, req->tr_qos);
3110*8d741a5dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, req, /*unpark*/ false);
3111*8d741a5dSApple OSS Distributions 		}
3112*8d741a5dSApple OSS Distributions 		/*
3113*8d741a5dSApple OSS Distributions 		 * We're called from workq_kern_threadreq_initiate()
3114*8d741a5dSApple OSS Distributions 		 * due to an unbind, with the kq req held.
3115*8d741a5dSApple OSS Distributions 		 */
3116*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_START, wq,
3117*8d741a5dSApple OSS Distributions 		    workq_trace_req_id(req), req->tr_flags, 0);
3118*8d741a5dSApple OSS Distributions 		wq->wq_fulfilled++;
3119*8d741a5dSApple OSS Distributions 
3120*8d741a5dSApple OSS Distributions 		kqueue_threadreq_bind(p, req, get_machthread(uth), 0);
3121*8d741a5dSApple OSS Distributions 	} else {
3122*8d741a5dSApple OSS Distributions 		if (workloop_ts) {
3123*8d741a5dSApple OSS Distributions 			workq_perform_turnstile_operation_locked(wq, ^{
3124*8d741a5dSApple OSS Distributions 				turnstile_update_inheritor(workloop_ts, wq->wq_turnstile,
3125*8d741a5dSApple OSS Distributions 				TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_TURNSTILE);
3126*8d741a5dSApple OSS Distributions 				turnstile_update_inheritor_complete(workloop_ts,
3127*8d741a5dSApple OSS Distributions 				TURNSTILE_INTERLOCK_HELD);
3128*8d741a5dSApple OSS Distributions 			});
3129*8d741a5dSApple OSS Distributions 		}
3130*8d741a5dSApple OSS Distributions 
3131*8d741a5dSApple OSS Distributions 		bool reevaluate_creator_thread_group = false;
3132*8d741a5dSApple OSS Distributions #if CONFIG_PREADOPT_TG
3133*8d741a5dSApple OSS Distributions 		reevaluate_creator_thread_group = (flags & WORKQ_THREADREQ_REEVALUATE_PREADOPT_TG);
3134*8d741a5dSApple OSS Distributions #endif
3135*8d741a5dSApple OSS Distributions 		/* We enqueued the highest priority item or we may need to reevaluate if
3136*8d741a5dSApple OSS Distributions 		 * the creator needs a thread group pre-adoption */
3137*8d741a5dSApple OSS Distributions 		if (workq_threadreq_enqueue(wq, req) || reevaluate_creator_thread_group) {
3138*8d741a5dSApple OSS Distributions 			workq_schedule_creator(p, wq, flags);
3139*8d741a5dSApple OSS Distributions 		}
3140*8d741a5dSApple OSS Distributions 	}
3141*8d741a5dSApple OSS Distributions 
3142*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3143*8d741a5dSApple OSS Distributions 
3144*8d741a5dSApple OSS Distributions 	return true;
3145*8d741a5dSApple OSS Distributions }
3146*8d741a5dSApple OSS Distributions 
3147*8d741a5dSApple OSS Distributions void
workq_kern_threadreq_modify(struct proc * p,workq_threadreq_t req,thread_qos_t qos,workq_kern_threadreq_flags_t flags)3148*8d741a5dSApple OSS Distributions workq_kern_threadreq_modify(struct proc *p, workq_threadreq_t req,
3149*8d741a5dSApple OSS Distributions     thread_qos_t qos, workq_kern_threadreq_flags_t flags)
3150*8d741a5dSApple OSS Distributions {
3151*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3152*8d741a5dSApple OSS Distributions 	bool make_overcommit = false;
3153*8d741a5dSApple OSS Distributions 
3154*8d741a5dSApple OSS Distributions 	if (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3155*8d741a5dSApple OSS Distributions 		/* Requests outside-of-QoS shouldn't accept modify operations */
3156*8d741a5dSApple OSS Distributions 		return;
3157*8d741a5dSApple OSS Distributions 	}
3158*8d741a5dSApple OSS Distributions 
3159*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
3160*8d741a5dSApple OSS Distributions 
3161*8d741a5dSApple OSS Distributions 	assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
3162*8d741a5dSApple OSS Distributions 	assert(req->tr_flags & (WORKQ_TR_FLAG_KEVENT | WORKQ_TR_FLAG_WORKLOOP));
3163*8d741a5dSApple OSS Distributions 
3164*8d741a5dSApple OSS Distributions 	if (req->tr_state == WORKQ_TR_STATE_BINDING) {
3165*8d741a5dSApple OSS Distributions 		kqueue_threadreq_bind(p, req, req->tr_thread, 0);
3166*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
3167*8d741a5dSApple OSS Distributions 		return;
3168*8d741a5dSApple OSS Distributions 	}
3169*8d741a5dSApple OSS Distributions 
3170*8d741a5dSApple OSS Distributions 	if (flags & WORKQ_THREADREQ_MAKE_OVERCOMMIT) {
3171*8d741a5dSApple OSS Distributions 		/* TODO (rokhinip): We come into this code path for kqwl thread
3172*8d741a5dSApple OSS Distributions 		 * requests. kqwl requests cannot be cooperative.
3173*8d741a5dSApple OSS Distributions 		 */
3174*8d741a5dSApple OSS Distributions 		assert(!workq_threadreq_is_cooperative(req));
3175*8d741a5dSApple OSS Distributions 
3176*8d741a5dSApple OSS Distributions 		make_overcommit = workq_threadreq_is_nonovercommit(req);
3177*8d741a5dSApple OSS Distributions 	}
3178*8d741a5dSApple OSS Distributions 
3179*8d741a5dSApple OSS Distributions 	if (_wq_exiting(wq) || (req->tr_qos == qos && !make_overcommit)) {
3180*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
3181*8d741a5dSApple OSS Distributions 		return;
3182*8d741a5dSApple OSS Distributions 	}
3183*8d741a5dSApple OSS Distributions 
3184*8d741a5dSApple OSS Distributions 	assert(req->tr_count == 1);
3185*8d741a5dSApple OSS Distributions 	if (req->tr_state != WORKQ_TR_STATE_QUEUED) {
3186*8d741a5dSApple OSS Distributions 		panic("Invalid thread request (%p) state %d", req, req->tr_state);
3187*8d741a5dSApple OSS Distributions 	}
3188*8d741a5dSApple OSS Distributions 
3189*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_request_modify | DBG_FUNC_NONE, wq,
3190*8d741a5dSApple OSS Distributions 	    workq_trace_req_id(req), qos, 0);
3191*8d741a5dSApple OSS Distributions 
3192*8d741a5dSApple OSS Distributions 	struct priority_queue_sched_max *pq = workq_priority_queue_for_req(wq, req);
3193*8d741a5dSApple OSS Distributions 	workq_threadreq_t req_max;
3194*8d741a5dSApple OSS Distributions 
3195*8d741a5dSApple OSS Distributions 	/*
3196*8d741a5dSApple OSS Distributions 	 * Stage 1: Dequeue the request from its priority queue.
3197*8d741a5dSApple OSS Distributions 	 *
3198*8d741a5dSApple OSS Distributions 	 * If we dequeue the root item of the constrained priority queue,
3199*8d741a5dSApple OSS Distributions 	 * maintain the best constrained request qos invariant.
3200*8d741a5dSApple OSS Distributions 	 */
3201*8d741a5dSApple OSS Distributions 	if (priority_queue_remove(pq, &req->tr_entry)) {
3202*8d741a5dSApple OSS Distributions 		if (workq_threadreq_is_nonovercommit(req)) {
3203*8d741a5dSApple OSS Distributions 			_wq_thactive_refresh_best_constrained_req_qos(wq);
3204*8d741a5dSApple OSS Distributions 		}
3205*8d741a5dSApple OSS Distributions 	}
3206*8d741a5dSApple OSS Distributions 
3207*8d741a5dSApple OSS Distributions 	/*
3208*8d741a5dSApple OSS Distributions 	 * Stage 2: Apply changes to the thread request
3209*8d741a5dSApple OSS Distributions 	 *
3210*8d741a5dSApple OSS Distributions 	 * If the item will not become the root of the priority queue it belongs to,
3211*8d741a5dSApple OSS Distributions 	 * then we need to wait in line, just enqueue and return quickly.
3212*8d741a5dSApple OSS Distributions 	 */
3213*8d741a5dSApple OSS Distributions 	if (__improbable(make_overcommit)) {
3214*8d741a5dSApple OSS Distributions 		req->tr_flags ^= WORKQ_TR_FLAG_OVERCOMMIT;
3215*8d741a5dSApple OSS Distributions 		pq = workq_priority_queue_for_req(wq, req);
3216*8d741a5dSApple OSS Distributions 	}
3217*8d741a5dSApple OSS Distributions 	req->tr_qos = qos;
3218*8d741a5dSApple OSS Distributions 
3219*8d741a5dSApple OSS Distributions 	req_max = priority_queue_max(pq, struct workq_threadreq_s, tr_entry);
3220*8d741a5dSApple OSS Distributions 	if (req_max && req_max->tr_qos >= qos) {
3221*8d741a5dSApple OSS Distributions 		priority_queue_entry_set_sched_pri(pq, &req->tr_entry,
3222*8d741a5dSApple OSS Distributions 		    workq_priority_for_req(req), false);
3223*8d741a5dSApple OSS Distributions 		priority_queue_insert(pq, &req->tr_entry);
3224*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
3225*8d741a5dSApple OSS Distributions 		return;
3226*8d741a5dSApple OSS Distributions 	}
3227*8d741a5dSApple OSS Distributions 
3228*8d741a5dSApple OSS Distributions 	/*
3229*8d741a5dSApple OSS Distributions 	 * Stage 3: Reevaluate whether we should run the thread request.
3230*8d741a5dSApple OSS Distributions 	 *
3231*8d741a5dSApple OSS Distributions 	 * Pretend the thread request is new again:
3232*8d741a5dSApple OSS Distributions 	 * - adjust wq_reqcount to not count it anymore.
3233*8d741a5dSApple OSS Distributions 	 * - make its state WORKQ_TR_STATE_NEW (so that workq_threadreq_bind_and_unlock
3234*8d741a5dSApple OSS Distributions 	 *   properly attempts a synchronous bind)
3235*8d741a5dSApple OSS Distributions 	 */
3236*8d741a5dSApple OSS Distributions 	wq->wq_reqcount--;
3237*8d741a5dSApple OSS Distributions 	req->tr_state = WORKQ_TR_STATE_NEW;
3238*8d741a5dSApple OSS Distributions 
3239*8d741a5dSApple OSS Distributions 	/* We enqueued the highest priority item or we may need to reevaluate if
3240*8d741a5dSApple OSS Distributions 	 * the creator needs a thread group pre-adoption if the request got a new TG */
3241*8d741a5dSApple OSS Distributions 	bool reevaluate_creator_tg = false;
3242*8d741a5dSApple OSS Distributions 
3243*8d741a5dSApple OSS Distributions #if CONFIG_PREADOPT_TG
3244*8d741a5dSApple OSS Distributions 	reevaluate_creator_tg = (flags & WORKQ_THREADREQ_REEVALUATE_PREADOPT_TG);
3245*8d741a5dSApple OSS Distributions #endif
3246*8d741a5dSApple OSS Distributions 
3247*8d741a5dSApple OSS Distributions 	if (workq_threadreq_enqueue(wq, req) || reevaluate_creator_tg) {
3248*8d741a5dSApple OSS Distributions 		workq_schedule_creator(p, wq, flags);
3249*8d741a5dSApple OSS Distributions 	}
3250*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3251*8d741a5dSApple OSS Distributions }
3252*8d741a5dSApple OSS Distributions 
3253*8d741a5dSApple OSS Distributions void
workq_kern_bound_thread_reset_pri(workq_threadreq_t req,struct uthread * uth)3254*8d741a5dSApple OSS Distributions workq_kern_bound_thread_reset_pri(workq_threadreq_t req, struct uthread *uth)
3255*8d741a5dSApple OSS Distributions {
3256*8d741a5dSApple OSS Distributions 	assert(workq_thread_is_permanently_bound(uth));
3257*8d741a5dSApple OSS Distributions 
3258*8d741a5dSApple OSS Distributions 	if (req && (req->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS)) {
3259*8d741a5dSApple OSS Distributions 		/*
3260*8d741a5dSApple OSS Distributions 		 * For requests outside-of-QoS, we set the scheduling policy and
3261*8d741a5dSApple OSS Distributions 		 * absolute priority for the bound thread right at the initialization
3262*8d741a5dSApple OSS Distributions 		 * time. See workq_kern_threadreq_permanent_bind.
3263*8d741a5dSApple OSS Distributions 		 */
3264*8d741a5dSApple OSS Distributions 		return;
3265*8d741a5dSApple OSS Distributions 	}
3266*8d741a5dSApple OSS Distributions 
3267*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(current_proc());
3268*8d741a5dSApple OSS Distributions 	if (req) {
3269*8d741a5dSApple OSS Distributions 		assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
3270*8d741a5dSApple OSS Distributions 		workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
3271*8d741a5dSApple OSS Distributions 	} else {
3272*8d741a5dSApple OSS Distributions 		thread_qos_t qos = workq_pri_override(uth->uu_workq_pri);
3273*8d741a5dSApple OSS Distributions 		if (qos > WORKQ_THREAD_QOS_CLEANUP) {
3274*8d741a5dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, NULL, /*unpark*/ true);
3275*8d741a5dSApple OSS Distributions 		} else {
3276*8d741a5dSApple OSS Distributions 			uth->uu_save.uus_workq_park_data.qos = qos;
3277*8d741a5dSApple OSS Distributions 		}
3278*8d741a5dSApple OSS Distributions 	}
3279*8d741a5dSApple OSS Distributions }
3280*8d741a5dSApple OSS Distributions 
/*
 * Take the lock of the workqueue attached to process p, using the
 * spin variant of the workqueue lock.
 */
void
workq_kern_threadreq_lock(struct proc *p)
{
	struct workqueue *wq = proc_get_wqptr_fast(p);

	workq_lock_spin(wq);
}
3286*8d741a5dSApple OSS Distributions 
/*
 * Release the lock of the workqueue attached to process p.
 */
void
workq_kern_threadreq_unlock(struct proc *p)
{
	struct workqueue *wq = proc_get_wqptr_fast(p);

	workq_unlock(wq);
}
3292*8d741a5dSApple OSS Distributions 
3293*8d741a5dSApple OSS Distributions void
workq_kern_threadreq_update_inheritor(struct proc * p,workq_threadreq_t req,thread_t owner,struct turnstile * wl_ts,turnstile_update_flags_t flags)3294*8d741a5dSApple OSS Distributions workq_kern_threadreq_update_inheritor(struct proc *p, workq_threadreq_t req,
3295*8d741a5dSApple OSS Distributions     thread_t owner, struct turnstile *wl_ts,
3296*8d741a5dSApple OSS Distributions     turnstile_update_flags_t flags)
3297*8d741a5dSApple OSS Distributions {
3298*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3299*8d741a5dSApple OSS Distributions 	turnstile_inheritor_t inheritor;
3300*8d741a5dSApple OSS Distributions 
3301*8d741a5dSApple OSS Distributions 	assert(req->tr_qos != WORKQ_THREAD_QOS_MANAGER);
3302*8d741a5dSApple OSS Distributions 	assert(req->tr_flags & WORKQ_TR_FLAG_WORKLOOP);
3303*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
3304*8d741a5dSApple OSS Distributions 
3305*8d741a5dSApple OSS Distributions 	if (req->tr_state == WORKQ_TR_STATE_BINDING) {
3306*8d741a5dSApple OSS Distributions 		kqueue_threadreq_bind(p, req, req->tr_thread,
3307*8d741a5dSApple OSS Distributions 		    KQUEUE_THREADREQ_BIND_NO_INHERITOR_UPDATE);
3308*8d741a5dSApple OSS Distributions 		return;
3309*8d741a5dSApple OSS Distributions 	}
3310*8d741a5dSApple OSS Distributions 
3311*8d741a5dSApple OSS Distributions 	if (_wq_exiting(wq)) {
3312*8d741a5dSApple OSS Distributions 		inheritor = TURNSTILE_INHERITOR_NULL;
3313*8d741a5dSApple OSS Distributions 	} else {
3314*8d741a5dSApple OSS Distributions 		if (req->tr_state != WORKQ_TR_STATE_QUEUED) {
3315*8d741a5dSApple OSS Distributions 			panic("Invalid thread request (%p) state %d", req, req->tr_state);
3316*8d741a5dSApple OSS Distributions 		}
3317*8d741a5dSApple OSS Distributions 
3318*8d741a5dSApple OSS Distributions 		if (owner) {
3319*8d741a5dSApple OSS Distributions 			inheritor = owner;
3320*8d741a5dSApple OSS Distributions 			flags |= TURNSTILE_INHERITOR_THREAD;
3321*8d741a5dSApple OSS Distributions 		} else {
3322*8d741a5dSApple OSS Distributions 			inheritor = wq->wq_turnstile;
3323*8d741a5dSApple OSS Distributions 			flags |= TURNSTILE_INHERITOR_TURNSTILE;
3324*8d741a5dSApple OSS Distributions 		}
3325*8d741a5dSApple OSS Distributions 	}
3326*8d741a5dSApple OSS Distributions 
3327*8d741a5dSApple OSS Distributions 	workq_perform_turnstile_operation_locked(wq, ^{
3328*8d741a5dSApple OSS Distributions 		turnstile_update_inheritor(wl_ts, inheritor, flags);
3329*8d741a5dSApple OSS Distributions 	});
3330*8d741a5dSApple OSS Distributions }
3331*8d741a5dSApple OSS Distributions 
3332*8d741a5dSApple OSS Distributions /*
3333*8d741a5dSApple OSS Distributions  * An entry point for kevent to request a newly created workqueue thread
3334*8d741a5dSApple OSS Distributions  * and bind it permanently to the given workqueue thread request.
3335*8d741a5dSApple OSS Distributions  *
3336*8d741a5dSApple OSS Distributions  * It currently only supports fixed scheduler priority thread requests.
3337*8d741a5dSApple OSS Distributions  *
3338*8d741a5dSApple OSS Distributions  * The newly created thread counts towards wq_nthreads. This function returns
3339*8d741a5dSApple OSS Distributions  * an error if we are above that limit. There is no concept of delayed thread
3340*8d741a5dSApple OSS Distributions  * creation for such specially configured kqworkloops.
3341*8d741a5dSApple OSS Distributions  *
3342*8d741a5dSApple OSS Distributions  * If successful, the newly created thread will be parked in
3343*8d741a5dSApple OSS Distributions  * workq_bound_thread_initialize_and_unpark_continue waiting for
3344*8d741a5dSApple OSS Distributions  * new incoming events.
3345*8d741a5dSApple OSS Distributions  */
3346*8d741a5dSApple OSS Distributions kern_return_t
workq_kern_threadreq_permanent_bind(struct proc * p,struct workq_threadreq_s * kqr)3347*8d741a5dSApple OSS Distributions workq_kern_threadreq_permanent_bind(struct proc *p, struct workq_threadreq_s *kqr)
3348*8d741a5dSApple OSS Distributions {
3349*8d741a5dSApple OSS Distributions 	kern_return_t ret = 0;
3350*8d741a5dSApple OSS Distributions 	thread_t new_thread = NULL;
3351*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3352*8d741a5dSApple OSS Distributions 
3353*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
3354*8d741a5dSApple OSS Distributions 
3355*8d741a5dSApple OSS Distributions 	if (wq->wq_nthreads >= wq_max_threads) {
3356*8d741a5dSApple OSS Distributions 		ret = EDOM;
3357*8d741a5dSApple OSS Distributions 	} else {
3358*8d741a5dSApple OSS Distributions 		if (kqr->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3359*8d741a5dSApple OSS Distributions 			workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(kqr);
3360*8d741a5dSApple OSS Distributions 			/*
3361*8d741a5dSApple OSS Distributions 			 * For requests outside-of-QoS, we fully initialize the thread
3362*8d741a5dSApple OSS Distributions 			 * request here followed by preadopting the scheduling properties
3363*8d741a5dSApple OSS Distributions 			 * on the newly created bound thread.
3364*8d741a5dSApple OSS Distributions 			 */
3365*8d741a5dSApple OSS Distributions 			thread_qos_t qos = thread_workq_qos_for_pri(trp.trp_pri);
3366*8d741a5dSApple OSS Distributions 			if (qos == THREAD_QOS_UNSPECIFIED) {
3367*8d741a5dSApple OSS Distributions 				qos = WORKQ_THREAD_QOS_ABOVEUI;
3368*8d741a5dSApple OSS Distributions 			}
3369*8d741a5dSApple OSS Distributions 			kqr->tr_qos = qos;
3370*8d741a5dSApple OSS Distributions 		}
3371*8d741a5dSApple OSS Distributions 		kqr->tr_count = 1;
3372*8d741a5dSApple OSS Distributions 
3373*8d741a5dSApple OSS Distributions 		/* workq_lock dropped and retaken around thread creation below. */
3374*8d741a5dSApple OSS Distributions 		ret = workq_add_new_idle_thread(p, wq,
3375*8d741a5dSApple OSS Distributions 		    workq_bound_thread_initialize_and_unpark_continue,
3376*8d741a5dSApple OSS Distributions 		    true, &new_thread);
3377*8d741a5dSApple OSS Distributions 		if (ret == KERN_SUCCESS) {
3378*8d741a5dSApple OSS Distributions 			struct uthread *uth = get_bsdthread_info(new_thread);
3379*8d741a5dSApple OSS Distributions 			if (kqr->tr_flags & WORKQ_TR_FLAG_WL_OUTSIDE_QOS) {
3380*8d741a5dSApple OSS Distributions 				workq_thread_reset_pri(wq, uth, kqr, /*unpark*/ true);
3381*8d741a5dSApple OSS Distributions 			}
3382*8d741a5dSApple OSS Distributions 			/*
3383*8d741a5dSApple OSS Distributions 			 * The newly created thread goes through a full bind to the kqwl
3384*8d741a5dSApple OSS Distributions 			 * right upon creation.
3385*8d741a5dSApple OSS Distributions 			 * It then falls back to soft bind/unbind upon wakeup/park.
3386*8d741a5dSApple OSS Distributions 			 */
3387*8d741a5dSApple OSS Distributions 			kqueue_threadreq_bind_prepost(p, kqr, uth);
3388*8d741a5dSApple OSS Distributions 			uth->uu_workq_flags |= UT_WORKQ_PERMANENT_BIND;
3389*8d741a5dSApple OSS Distributions 		}
3390*8d741a5dSApple OSS Distributions 	}
3391*8d741a5dSApple OSS Distributions 
3392*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3393*8d741a5dSApple OSS Distributions 
3394*8d741a5dSApple OSS Distributions 	if (ret == KERN_SUCCESS) {
3395*8d741a5dSApple OSS Distributions 		kqueue_threadreq_bind_commit(p, new_thread);
3396*8d741a5dSApple OSS Distributions 	}
3397*8d741a5dSApple OSS Distributions 	return ret;
3398*8d741a5dSApple OSS Distributions }
3399*8d741a5dSApple OSS Distributions 
3400*8d741a5dSApple OSS Distributions /*
3401*8d741a5dSApple OSS Distributions  * Called with kqlock held. It does not need to take the process wide
3402*8d741a5dSApple OSS Distributions  * global workq lock -> making it faster.
3403*8d741a5dSApple OSS Distributions  */
3404*8d741a5dSApple OSS Distributions void
workq_kern_bound_thread_wakeup(struct workq_threadreq_s * kqr)3405*8d741a5dSApple OSS Distributions workq_kern_bound_thread_wakeup(struct workq_threadreq_s *kqr)
3406*8d741a5dSApple OSS Distributions {
3407*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(kqr->tr_thread);
3408*8d741a5dSApple OSS Distributions 	workq_threadreq_param_t trp = kqueue_threadreq_workloop_param(kqr);
3409*8d741a5dSApple OSS Distributions 
3410*8d741a5dSApple OSS Distributions 	/*
3411*8d741a5dSApple OSS Distributions 	 * See "Locking model for accessing uu_workq_flags" for more information
3412*8d741a5dSApple OSS Distributions 	 * on how access to uu_workq_flags for the bound thread is synchronized.
3413*8d741a5dSApple OSS Distributions 	 */
3414*8d741a5dSApple OSS Distributions 	assert((uth->uu_workq_flags & (UT_WORKQ_RUNNING | UT_WORKQ_DYING)) == 0);
3415*8d741a5dSApple OSS Distributions 
3416*8d741a5dSApple OSS Distributions 	if (trp.trp_flags & TRP_RELEASED) {
3417*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
3418*8d741a5dSApple OSS Distributions 	} else {
3419*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_RUNNING;
3420*8d741a5dSApple OSS Distributions 	}
3421*8d741a5dSApple OSS Distributions 
3422*8d741a5dSApple OSS Distributions 	workq_thread_wakeup(uth);
3423*8d741a5dSApple OSS Distributions }
3424*8d741a5dSApple OSS Distributions 
3425*8d741a5dSApple OSS Distributions /*
3426*8d741a5dSApple OSS Distributions  * Called with kqlock held. Dropped before parking.
3427*8d741a5dSApple OSS Distributions  * It does not need to take process wide global workqueue
3428*8d741a5dSApple OSS Distributions  * lock -> making it faster.
3429*8d741a5dSApple OSS Distributions  */
3430*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
3431*8d741a5dSApple OSS Distributions void
workq_kern_bound_thread_park(struct workq_threadreq_s * kqr)3432*8d741a5dSApple OSS Distributions workq_kern_bound_thread_park(struct workq_threadreq_s *kqr)
3433*8d741a5dSApple OSS Distributions {
3434*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(kqr->tr_thread);
3435*8d741a5dSApple OSS Distributions 	assert(uth == current_uthread());
3436*8d741a5dSApple OSS Distributions 
3437*8d741a5dSApple OSS Distributions 	/*
3438*8d741a5dSApple OSS Distributions 	 * See "Locking model for accessing uu_workq_flags" for more information
3439*8d741a5dSApple OSS Distributions 	 * on how access to uu_workq_flags for the bound thread is synchronized.
3440*8d741a5dSApple OSS Distributions 	 */
3441*8d741a5dSApple OSS Distributions 	uth->uu_workq_flags &= ~(UT_WORKQ_RUNNING);
3442*8d741a5dSApple OSS Distributions 
3443*8d741a5dSApple OSS Distributions 	thread_disarm_workqueue_quantum(get_machthread(uth));
3444*8d741a5dSApple OSS Distributions 
3445*8d741a5dSApple OSS Distributions 	/*
3446*8d741a5dSApple OSS Distributions 	 * TODO (pavhad) We could do the reusable userspace stack performance
3447*8d741a5dSApple OSS Distributions 	 * optimization here.
3448*8d741a5dSApple OSS Distributions 	 */
3449*8d741a5dSApple OSS Distributions 
3450*8d741a5dSApple OSS Distributions 	kqworkloop_bound_thread_park_prepost(kqr);
3451*8d741a5dSApple OSS Distributions 	/* KQ_SLEEP bit is set and kqlock is dropped. */
3452*8d741a5dSApple OSS Distributions 
3453*8d741a5dSApple OSS Distributions 	__assert_only kern_return_t kr;
3454*8d741a5dSApple OSS Distributions 	kr = thread_set_voucher_name(MACH_PORT_NULL);
3455*8d741a5dSApple OSS Distributions 	assert(kr == KERN_SUCCESS);
3456*8d741a5dSApple OSS Distributions 
3457*8d741a5dSApple OSS Distributions 	kqworkloop_bound_thread_park_commit(kqr,
3458*8d741a5dSApple OSS Distributions 	    workq_parked_wait_event(uth), workq_bound_thread_unpark_continue);
3459*8d741a5dSApple OSS Distributions 
3460*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
3461*8d741a5dSApple OSS Distributions }
3462*8d741a5dSApple OSS Distributions 
3463*8d741a5dSApple OSS Distributions /*
3464*8d741a5dSApple OSS Distributions  * To terminate the permenantly bound workqueue thread. It unbinds itself
3465*8d741a5dSApple OSS Distributions  * with the kqwl during uthread_cleanup -> kqueue_threadreq_unbind.
3466*8d741a5dSApple OSS Distributions  * It is also when it will release its reference on the kqwl.
3467*8d741a5dSApple OSS Distributions  */
3468*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
3469*8d741a5dSApple OSS Distributions void
workq_kern_bound_thread_terminate(struct workq_threadreq_s * kqr)3470*8d741a5dSApple OSS Distributions workq_kern_bound_thread_terminate(struct workq_threadreq_s *kqr)
3471*8d741a5dSApple OSS Distributions {
3472*8d741a5dSApple OSS Distributions 	proc_t p = current_proc();
3473*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(kqr->tr_thread);
3474*8d741a5dSApple OSS Distributions 	uint16_t uu_workq_flags_orig;
3475*8d741a5dSApple OSS Distributions 
3476*8d741a5dSApple OSS Distributions 	assert(uth == current_uthread());
3477*8d741a5dSApple OSS Distributions 
3478*8d741a5dSApple OSS Distributions 	/*
3479*8d741a5dSApple OSS Distributions 	 * See "Locking model for accessing uu_workq_flags" for more information
3480*8d741a5dSApple OSS Distributions 	 * on how access to uu_workq_flags for the bound thread is synchronized.
3481*8d741a5dSApple OSS Distributions 	 */
3482*8d741a5dSApple OSS Distributions 	kqworkloop_bound_thread_terminate(kqr, &uu_workq_flags_orig);
3483*8d741a5dSApple OSS Distributions 
3484*8d741a5dSApple OSS Distributions 	if (uu_workq_flags_orig & UT_WORKQ_WORK_INTERVAL_JOINED) {
3485*8d741a5dSApple OSS Distributions 		__assert_only kern_return_t kr;
3486*8d741a5dSApple OSS Distributions 		kr = kern_work_interval_join(get_machthread(uth), MACH_PORT_NULL);
3487*8d741a5dSApple OSS Distributions 		/* The bound thread un-joins the work interval and drops its +1 ref. */
3488*8d741a5dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
3489*8d741a5dSApple OSS Distributions 	}
3490*8d741a5dSApple OSS Distributions 
3491*8d741a5dSApple OSS Distributions 	/*
3492*8d741a5dSApple OSS Distributions 	 * Drop the voucher now that we are on our way to termination.
3493*8d741a5dSApple OSS Distributions 	 */
3494*8d741a5dSApple OSS Distributions 	__assert_only kern_return_t kr;
3495*8d741a5dSApple OSS Distributions 	kr = thread_set_voucher_name(MACH_PORT_NULL);
3496*8d741a5dSApple OSS Distributions 	assert(kr == KERN_SUCCESS);
3497*8d741a5dSApple OSS Distributions 
3498*8d741a5dSApple OSS Distributions 	uint32_t upcall_flags = WQ_FLAG_THREAD_NEWSPI;
3499*8d741a5dSApple OSS Distributions 	upcall_flags |= uth->uu_save.uus_workq_park_data.qos |
3500*8d741a5dSApple OSS Distributions 	    WQ_FLAG_THREAD_PRIO_QOS;
3501*8d741a5dSApple OSS Distributions 
3502*8d741a5dSApple OSS Distributions 	thread_t th = get_machthread(uth);
3503*8d741a5dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
3504*8d741a5dSApple OSS Distributions 
3505*8d741a5dSApple OSS Distributions 	if ((uu_workq_flags_orig & UT_WORKQ_NEW) == 0) {
3506*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_REUSE;
3507*8d741a5dSApple OSS Distributions 	}
3508*8d741a5dSApple OSS Distributions 
3509*8d741a5dSApple OSS Distributions 	pthread_functions->workq_setup_thread(p, th, vmap, uth->uu_workq_stackaddr,
3510*8d741a5dSApple OSS Distributions 	    uth->uu_workq_thport, 0, WQ_SETUP_EXIT_THREAD, upcall_flags);
3511*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
3512*8d741a5dSApple OSS Distributions }
3513*8d741a5dSApple OSS Distributions 
3514*8d741a5dSApple OSS Distributions void
workq_kern_threadreq_redrive(struct proc * p,workq_kern_threadreq_flags_t flags)3515*8d741a5dSApple OSS Distributions workq_kern_threadreq_redrive(struct proc *p, workq_kern_threadreq_flags_t flags)
3516*8d741a5dSApple OSS Distributions {
3517*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
3518*8d741a5dSApple OSS Distributions 
3519*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
3520*8d741a5dSApple OSS Distributions 	workq_schedule_creator(p, wq, flags);
3521*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3522*8d741a5dSApple OSS Distributions }
3523*8d741a5dSApple OSS Distributions 
3524*8d741a5dSApple OSS Distributions /*
3525*8d741a5dSApple OSS Distributions  * Always called at AST by the thread on itself
3526*8d741a5dSApple OSS Distributions  *
3527*8d741a5dSApple OSS Distributions  * Upon quantum expiry, the workqueue subsystem evaluates its state and decides
3528*8d741a5dSApple OSS Distributions  * on what the thread should do next. The TSD value is always set by the thread
3529*8d741a5dSApple OSS Distributions  * on itself in the kernel and cleared either by userspace when it acks the TSD
3530*8d741a5dSApple OSS Distributions  * value and takes action, or by the thread in the kernel when the quantum
3531*8d741a5dSApple OSS Distributions  * expires again.
3532*8d741a5dSApple OSS Distributions  */
3533*8d741a5dSApple OSS Distributions void
workq_kern_quantum_expiry_reevaluate(proc_t proc,thread_t thread)3534*8d741a5dSApple OSS Distributions workq_kern_quantum_expiry_reevaluate(proc_t proc, thread_t thread)
3535*8d741a5dSApple OSS Distributions {
3536*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(thread);
3537*8d741a5dSApple OSS Distributions 
3538*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_DYING) {
3539*8d741a5dSApple OSS Distributions 		return;
3540*8d741a5dSApple OSS Distributions 	}
3541*8d741a5dSApple OSS Distributions 
3542*8d741a5dSApple OSS Distributions 	if (!thread_supports_cooperative_workqueue(thread)) {
3543*8d741a5dSApple OSS Distributions 		panic("Quantum expired for thread that doesn't support cooperative workqueue");
3544*8d741a5dSApple OSS Distributions 	}
3545*8d741a5dSApple OSS Distributions 
3546*8d741a5dSApple OSS Distributions 	thread_qos_t qos = uth->uu_workq_pri.qos_bucket;
3547*8d741a5dSApple OSS Distributions 	if (qos == THREAD_QOS_UNSPECIFIED) {
3548*8d741a5dSApple OSS Distributions 		panic("Thread should not have workq bucket of QoS UN");
3549*8d741a5dSApple OSS Distributions 	}
3550*8d741a5dSApple OSS Distributions 
3551*8d741a5dSApple OSS Distributions 	assert(thread_has_expired_workqueue_quantum(thread, false));
3552*8d741a5dSApple OSS Distributions 
3553*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(proc);
3554*8d741a5dSApple OSS Distributions 	assert(wq != NULL);
3555*8d741a5dSApple OSS Distributions 
3556*8d741a5dSApple OSS Distributions 	/*
3557*8d741a5dSApple OSS Distributions 	 * For starters, we're just going to evaluate and see if we need to narrow
3558*8d741a5dSApple OSS Distributions 	 * the pool and tell this thread to park if needed. In the future, we'll
3559*8d741a5dSApple OSS Distributions 	 * evaluate and convey other workqueue state information like needing to
3560*8d741a5dSApple OSS Distributions 	 * pump kevents, etc.
3561*8d741a5dSApple OSS Distributions 	 */
3562*8d741a5dSApple OSS Distributions 	uint64_t flags = 0;
3563*8d741a5dSApple OSS Distributions 
3564*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
3565*8d741a5dSApple OSS Distributions 
3566*8d741a5dSApple OSS Distributions 	if (workq_thread_is_cooperative(uth)) {
3567*8d741a5dSApple OSS Distributions 		if (!workq_cooperative_allowance(wq, qos, uth, false)) {
3568*8d741a5dSApple OSS Distributions 			flags |= PTHREAD_WQ_QUANTUM_EXPIRY_NARROW;
3569*8d741a5dSApple OSS Distributions 		} else {
3570*8d741a5dSApple OSS Distributions 			/* In the future, when we have kevent hookups for the cooperative
3571*8d741a5dSApple OSS Distributions 			 * pool, we need fancier logic for what userspace should do. But
3572*8d741a5dSApple OSS Distributions 			 * right now, only userspace thread requests exist - so we'll just
3573*8d741a5dSApple OSS Distributions 			 * tell userspace to shuffle work items */
3574*8d741a5dSApple OSS Distributions 			flags |= PTHREAD_WQ_QUANTUM_EXPIRY_SHUFFLE;
3575*8d741a5dSApple OSS Distributions 		}
3576*8d741a5dSApple OSS Distributions 	} else if (workq_thread_is_nonovercommit(uth)) {
3577*8d741a5dSApple OSS Distributions 		if (!workq_constrained_allowance(wq, qos, uth, false, false)) {
3578*8d741a5dSApple OSS Distributions 			flags |= PTHREAD_WQ_QUANTUM_EXPIRY_NARROW;
3579*8d741a5dSApple OSS Distributions 		}
3580*8d741a5dSApple OSS Distributions 	}
3581*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3582*8d741a5dSApple OSS Distributions 
3583*8d741a5dSApple OSS Distributions 	WQ_TRACE(TRACE_wq_quantum_expiry_reevaluate, flags, 0, 0, 0);
3584*8d741a5dSApple OSS Distributions 
3585*8d741a5dSApple OSS Distributions 	kevent_set_workq_quantum_expiry_user_tsd(proc, thread, flags);
3586*8d741a5dSApple OSS Distributions 
3587*8d741a5dSApple OSS Distributions 	/* We have conveyed to userspace about what it needs to do upon quantum
3588*8d741a5dSApple OSS Distributions 	 * expiry, now rearm the workqueue quantum again */
3589*8d741a5dSApple OSS Distributions 	thread_arm_workqueue_quantum(get_machthread(uth));
3590*8d741a5dSApple OSS Distributions }
3591*8d741a5dSApple OSS Distributions 
3592*8d741a5dSApple OSS Distributions void
workq_schedule_creator_turnstile_redrive(struct workqueue * wq,bool locked)3593*8d741a5dSApple OSS Distributions workq_schedule_creator_turnstile_redrive(struct workqueue *wq, bool locked)
3594*8d741a5dSApple OSS Distributions {
3595*8d741a5dSApple OSS Distributions 	if (locked) {
3596*8d741a5dSApple OSS Distributions 		workq_schedule_creator(NULL, wq, WORKQ_THREADREQ_NONE);
3597*8d741a5dSApple OSS Distributions 	} else {
3598*8d741a5dSApple OSS Distributions 		workq_schedule_immediate_thread_creation(wq);
3599*8d741a5dSApple OSS Distributions 	}
3600*8d741a5dSApple OSS Distributions }
3601*8d741a5dSApple OSS Distributions 
3602*8d741a5dSApple OSS Distributions static int
workq_thread_return(struct proc * p,struct workq_kernreturn_args * uap,struct workqueue * wq)3603*8d741a5dSApple OSS Distributions workq_thread_return(struct proc *p, struct workq_kernreturn_args *uap,
3604*8d741a5dSApple OSS Distributions     struct workqueue *wq)
3605*8d741a5dSApple OSS Distributions {
3606*8d741a5dSApple OSS Distributions 	thread_t th = current_thread();
3607*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
3608*8d741a5dSApple OSS Distributions 	workq_threadreq_t kqr = uth->uu_kqr_bound;
3609*8d741a5dSApple OSS Distributions 	workq_threadreq_param_t trp = { };
3610*8d741a5dSApple OSS Distributions 	int nevents = uap->affinity, error;
3611*8d741a5dSApple OSS Distributions 	user_addr_t eventlist = uap->item;
3612*8d741a5dSApple OSS Distributions 
3613*8d741a5dSApple OSS Distributions 	if (((thread_get_tag(th) & THREAD_TAG_WORKQUEUE) == 0) ||
3614*8d741a5dSApple OSS Distributions 	    (uth->uu_workq_flags & UT_WORKQ_DYING)) {
3615*8d741a5dSApple OSS Distributions 		return EINVAL;
3616*8d741a5dSApple OSS Distributions 	}
3617*8d741a5dSApple OSS Distributions 
3618*8d741a5dSApple OSS Distributions 	if (eventlist && nevents && kqr == NULL) {
3619*8d741a5dSApple OSS Distributions 		return EINVAL;
3620*8d741a5dSApple OSS Distributions 	}
3621*8d741a5dSApple OSS Distributions 
3622*8d741a5dSApple OSS Distributions 	/*
3623*8d741a5dSApple OSS Distributions 	 * Reset signal mask on the workqueue thread to default state,
3624*8d741a5dSApple OSS Distributions 	 * but do not touch any signals that are marked for preservation.
3625*8d741a5dSApple OSS Distributions 	 */
3626*8d741a5dSApple OSS Distributions 	sigset_t resettable = uth->uu_sigmask & ~p->p_workq_allow_sigmask;
3627*8d741a5dSApple OSS Distributions 	if (resettable != (sigset_t)~workq_threadmask) {
3628*8d741a5dSApple OSS Distributions 		proc_lock(p);
3629*8d741a5dSApple OSS Distributions 		uth->uu_sigmask |= ~workq_threadmask & ~p->p_workq_allow_sigmask;
3630*8d741a5dSApple OSS Distributions 		proc_unlock(p);
3631*8d741a5dSApple OSS Distributions 	}
3632*8d741a5dSApple OSS Distributions 
3633*8d741a5dSApple OSS Distributions 	if (kqr && kqr->tr_flags & WORKQ_TR_FLAG_WL_PARAMS) {
3634*8d741a5dSApple OSS Distributions 		/*
3635*8d741a5dSApple OSS Distributions 		 * Ensure we store the threadreq param before unbinding
3636*8d741a5dSApple OSS Distributions 		 * the kqr from this thread.
3637*8d741a5dSApple OSS Distributions 		 */
3638*8d741a5dSApple OSS Distributions 		trp = kqueue_threadreq_workloop_param(kqr);
3639*8d741a5dSApple OSS Distributions 	}
3640*8d741a5dSApple OSS Distributions 
3641*8d741a5dSApple OSS Distributions 	if (kqr && kqr->tr_flags & WORKQ_TR_FLAG_PERMANENT_BIND) {
3642*8d741a5dSApple OSS Distributions 		goto handle_stack_events;
3643*8d741a5dSApple OSS Distributions 	}
3644*8d741a5dSApple OSS Distributions 
3645*8d741a5dSApple OSS Distributions 	/*
3646*8d741a5dSApple OSS Distributions 	 * Freeze the base pri while we decide the fate of this thread.
3647*8d741a5dSApple OSS Distributions 	 *
3648*8d741a5dSApple OSS Distributions 	 * Either:
3649*8d741a5dSApple OSS Distributions 	 * - we return to user and kevent_cleanup will have unfrozen the base pri,
3650*8d741a5dSApple OSS Distributions 	 * - or we proceed to workq_select_threadreq_or_park_and_unlock() who will.
3651*8d741a5dSApple OSS Distributions 	 */
3652*8d741a5dSApple OSS Distributions 	thread_freeze_base_pri(th);
3653*8d741a5dSApple OSS Distributions 
3654*8d741a5dSApple OSS Distributions handle_stack_events:
3655*8d741a5dSApple OSS Distributions 
3656*8d741a5dSApple OSS Distributions 	if (kqr) {
3657*8d741a5dSApple OSS Distributions 		uint32_t upcall_flags = WQ_FLAG_THREAD_NEWSPI | WQ_FLAG_THREAD_REUSE;
3658*8d741a5dSApple OSS Distributions 		if (kqr->tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
3659*8d741a5dSApple OSS Distributions 			upcall_flags |= WQ_FLAG_THREAD_WORKLOOP | WQ_FLAG_THREAD_KEVENT;
3660*8d741a5dSApple OSS Distributions 		} else {
3661*8d741a5dSApple OSS Distributions 			upcall_flags |= WQ_FLAG_THREAD_KEVENT;
3662*8d741a5dSApple OSS Distributions 		}
3663*8d741a5dSApple OSS Distributions 		if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER) {
3664*8d741a5dSApple OSS Distributions 			upcall_flags |= WQ_FLAG_THREAD_EVENT_MANAGER;
3665*8d741a5dSApple OSS Distributions 		} else {
3666*8d741a5dSApple OSS Distributions 			if (workq_thread_is_overcommit(uth)) {
3667*8d741a5dSApple OSS Distributions 				upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
3668*8d741a5dSApple OSS Distributions 			}
3669*8d741a5dSApple OSS Distributions 			if (uth->uu_workq_flags & UT_WORKQ_OUTSIDE_QOS) {
3670*8d741a5dSApple OSS Distributions 				upcall_flags |= WQ_FLAG_THREAD_OUTSIDEQOS;
3671*8d741a5dSApple OSS Distributions 			} else {
3672*8d741a5dSApple OSS Distributions 				upcall_flags |= uth->uu_workq_pri.qos_req |
3673*8d741a5dSApple OSS Distributions 				    WQ_FLAG_THREAD_PRIO_QOS;
3674*8d741a5dSApple OSS Distributions 			}
3675*8d741a5dSApple OSS Distributions 		}
3676*8d741a5dSApple OSS Distributions 		error = pthread_functions->workq_handle_stack_events(p, th,
3677*8d741a5dSApple OSS Distributions 		    get_task_map(proc_task(p)), uth->uu_workq_stackaddr,
3678*8d741a5dSApple OSS Distributions 		    uth->uu_workq_thport, eventlist, nevents, upcall_flags);
3679*8d741a5dSApple OSS Distributions 		if (error) {
3680*8d741a5dSApple OSS Distributions 			assert(uth->uu_kqr_bound == kqr);
3681*8d741a5dSApple OSS Distributions 			return error;
3682*8d741a5dSApple OSS Distributions 		}
3683*8d741a5dSApple OSS Distributions 
3684*8d741a5dSApple OSS Distributions 		// pthread is supposed to pass KEVENT_FLAG_PARKING here
3685*8d741a5dSApple OSS Distributions 		// which should cause the above call to either:
3686*8d741a5dSApple OSS Distributions 		// - not return
3687*8d741a5dSApple OSS Distributions 		// - return an error
3688*8d741a5dSApple OSS Distributions 		// - return 0 and have unbound properly
3689*8d741a5dSApple OSS Distributions 		assert(uth->uu_kqr_bound == NULL);
3690*8d741a5dSApple OSS Distributions 	}
3691*8d741a5dSApple OSS Distributions 
3692*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_runthread | DBG_FUNC_END, wq, uap->options, 0, 0);
3693*8d741a5dSApple OSS Distributions 
3694*8d741a5dSApple OSS Distributions 	thread_sched_call(th, NULL);
3695*8d741a5dSApple OSS Distributions 	thread_will_park_or_terminate(th);
3696*8d741a5dSApple OSS Distributions #if CONFIG_WORKLOOP_DEBUG
3697*8d741a5dSApple OSS Distributions 	UU_KEVENT_HISTORY_WRITE_ENTRY(uth, { .uu_error = -1, });
3698*8d741a5dSApple OSS Distributions #endif
3699*8d741a5dSApple OSS Distributions 
3700*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
3701*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_END, wq, 0, 0, 0);
3702*8d741a5dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.workloop_params = trp.trp_value;
3703*8d741a5dSApple OSS Distributions 	workq_select_threadreq_or_park_and_unlock(p, wq, uth,
3704*8d741a5dSApple OSS Distributions 	    WQ_SETUP_CLEAR_VOUCHER);
3705*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
3706*8d741a5dSApple OSS Distributions }
3707*8d741a5dSApple OSS Distributions 
3708*8d741a5dSApple OSS Distributions /**
3709*8d741a5dSApple OSS Distributions  * Multiplexed call to interact with the workqueue mechanism
3710*8d741a5dSApple OSS Distributions  */
3711*8d741a5dSApple OSS Distributions int
workq_kernreturn(struct proc * p,struct workq_kernreturn_args * uap,int32_t * retval)3712*8d741a5dSApple OSS Distributions workq_kernreturn(struct proc *p, struct workq_kernreturn_args *uap, int32_t *retval)
3713*8d741a5dSApple OSS Distributions {
3714*8d741a5dSApple OSS Distributions 	int options = uap->options;
3715*8d741a5dSApple OSS Distributions 	int arg2 = uap->affinity;
3716*8d741a5dSApple OSS Distributions 	int arg3 = uap->prio;
3717*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
3718*8d741a5dSApple OSS Distributions 	int error = 0;
3719*8d741a5dSApple OSS Distributions 
3720*8d741a5dSApple OSS Distributions 	if ((p->p_lflag & P_LREGISTER) == 0) {
3721*8d741a5dSApple OSS Distributions 		return EINVAL;
3722*8d741a5dSApple OSS Distributions 	}
3723*8d741a5dSApple OSS Distributions 
3724*8d741a5dSApple OSS Distributions 	switch (options) {
3725*8d741a5dSApple OSS Distributions 	case WQOPS_QUEUE_NEWSPISUPP: {
3726*8d741a5dSApple OSS Distributions 		/*
3727*8d741a5dSApple OSS Distributions 		 * arg2 = offset of serialno into dispatch queue
3728*8d741a5dSApple OSS Distributions 		 * arg3 = kevent support
3729*8d741a5dSApple OSS Distributions 		 */
3730*8d741a5dSApple OSS Distributions 		int offset = arg2;
3731*8d741a5dSApple OSS Distributions 		if (arg3 & 0x01) {
3732*8d741a5dSApple OSS Distributions 			// If we get here, then userspace has indicated support for kevent delivery.
3733*8d741a5dSApple OSS Distributions 		}
3734*8d741a5dSApple OSS Distributions 
3735*8d741a5dSApple OSS Distributions 		p->p_dispatchqueue_serialno_offset = (uint64_t)offset;
3736*8d741a5dSApple OSS Distributions 		break;
3737*8d741a5dSApple OSS Distributions 	}
3738*8d741a5dSApple OSS Distributions 	case WQOPS_QUEUE_REQTHREADS: {
3739*8d741a5dSApple OSS Distributions 		/*
3740*8d741a5dSApple OSS Distributions 		 * arg2 = number of threads to start
3741*8d741a5dSApple OSS Distributions 		 * arg3 = priority
3742*8d741a5dSApple OSS Distributions 		 */
3743*8d741a5dSApple OSS Distributions 		error = workq_reqthreads(p, arg2, arg3, false);
3744*8d741a5dSApple OSS Distributions 		break;
3745*8d741a5dSApple OSS Distributions 	}
3746*8d741a5dSApple OSS Distributions 	/* For requesting threads for the cooperative pool */
3747*8d741a5dSApple OSS Distributions 	case WQOPS_QUEUE_REQTHREADS2: {
3748*8d741a5dSApple OSS Distributions 		/*
3749*8d741a5dSApple OSS Distributions 		 * arg2 = number of threads to start
3750*8d741a5dSApple OSS Distributions 		 * arg3 = priority
3751*8d741a5dSApple OSS Distributions 		 */
3752*8d741a5dSApple OSS Distributions 		error = workq_reqthreads(p, arg2, arg3, true);
3753*8d741a5dSApple OSS Distributions 		break;
3754*8d741a5dSApple OSS Distributions 	}
3755*8d741a5dSApple OSS Distributions 	case WQOPS_SET_EVENT_MANAGER_PRIORITY: {
3756*8d741a5dSApple OSS Distributions 		/*
3757*8d741a5dSApple OSS Distributions 		 * arg2 = priority for the manager thread
3758*8d741a5dSApple OSS Distributions 		 *
3759*8d741a5dSApple OSS Distributions 		 * if _PTHREAD_PRIORITY_SCHED_PRI_FLAG is set,
3760*8d741a5dSApple OSS Distributions 		 * the low bits of the value contains a scheduling priority
3761*8d741a5dSApple OSS Distributions 		 * instead of a QOS value
3762*8d741a5dSApple OSS Distributions 		 */
3763*8d741a5dSApple OSS Distributions 		pthread_priority_t pri = arg2;
3764*8d741a5dSApple OSS Distributions 
3765*8d741a5dSApple OSS Distributions 		if (wq == NULL) {
3766*8d741a5dSApple OSS Distributions 			error = EINVAL;
3767*8d741a5dSApple OSS Distributions 			break;
3768*8d741a5dSApple OSS Distributions 		}
3769*8d741a5dSApple OSS Distributions 
3770*8d741a5dSApple OSS Distributions 		/*
3771*8d741a5dSApple OSS Distributions 		 * Normalize the incoming priority so that it is ordered numerically.
3772*8d741a5dSApple OSS Distributions 		 */
3773*8d741a5dSApple OSS Distributions 		if (_pthread_priority_has_sched_pri(pri)) {
3774*8d741a5dSApple OSS Distributions 			pri &= (_PTHREAD_PRIORITY_SCHED_PRI_MASK |
3775*8d741a5dSApple OSS Distributions 			    _PTHREAD_PRIORITY_SCHED_PRI_FLAG);
3776*8d741a5dSApple OSS Distributions 		} else {
3777*8d741a5dSApple OSS Distributions 			thread_qos_t qos = _pthread_priority_thread_qos(pri);
3778*8d741a5dSApple OSS Distributions 			int relpri = _pthread_priority_relpri(pri);
3779*8d741a5dSApple OSS Distributions 			if (relpri > 0 || relpri < THREAD_QOS_MIN_TIER_IMPORTANCE ||
3780*8d741a5dSApple OSS Distributions 			    qos == THREAD_QOS_UNSPECIFIED) {
3781*8d741a5dSApple OSS Distributions 				error = EINVAL;
3782*8d741a5dSApple OSS Distributions 				break;
3783*8d741a5dSApple OSS Distributions 			}
3784*8d741a5dSApple OSS Distributions 			pri &= ~_PTHREAD_PRIORITY_FLAGS_MASK;
3785*8d741a5dSApple OSS Distributions 		}
3786*8d741a5dSApple OSS Distributions 
3787*8d741a5dSApple OSS Distributions 		/*
3788*8d741a5dSApple OSS Distributions 		 * If userspace passes a scheduling priority, that wins over any QoS.
3789*8d741a5dSApple OSS Distributions 		 * Userspace should takes care not to lower the priority this way.
3790*8d741a5dSApple OSS Distributions 		 */
3791*8d741a5dSApple OSS Distributions 		workq_lock_spin(wq);
3792*8d741a5dSApple OSS Distributions 		if (wq->wq_event_manager_priority < (uint32_t)pri) {
3793*8d741a5dSApple OSS Distributions 			wq->wq_event_manager_priority = (uint32_t)pri;
3794*8d741a5dSApple OSS Distributions 		}
3795*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
3796*8d741a5dSApple OSS Distributions 		break;
3797*8d741a5dSApple OSS Distributions 	}
3798*8d741a5dSApple OSS Distributions 	case WQOPS_THREAD_KEVENT_RETURN:
3799*8d741a5dSApple OSS Distributions 	case WQOPS_THREAD_WORKLOOP_RETURN:
3800*8d741a5dSApple OSS Distributions 	case WQOPS_THREAD_RETURN: {
3801*8d741a5dSApple OSS Distributions 		error = workq_thread_return(p, uap, wq);
3802*8d741a5dSApple OSS Distributions 		break;
3803*8d741a5dSApple OSS Distributions 	}
3804*8d741a5dSApple OSS Distributions 
3805*8d741a5dSApple OSS Distributions 	case WQOPS_SHOULD_NARROW: {
3806*8d741a5dSApple OSS Distributions 		/*
3807*8d741a5dSApple OSS Distributions 		 * arg2 = priority to test
3808*8d741a5dSApple OSS Distributions 		 * arg3 = unused
3809*8d741a5dSApple OSS Distributions 		 */
3810*8d741a5dSApple OSS Distributions 		thread_t th = current_thread();
3811*8d741a5dSApple OSS Distributions 		struct uthread *uth = get_bsdthread_info(th);
3812*8d741a5dSApple OSS Distributions 		if (((thread_get_tag(th) & THREAD_TAG_WORKQUEUE) == 0) ||
3813*8d741a5dSApple OSS Distributions 		    (uth->uu_workq_flags & (UT_WORKQ_DYING | UT_WORKQ_OVERCOMMIT))) {
3814*8d741a5dSApple OSS Distributions 			error = EINVAL;
3815*8d741a5dSApple OSS Distributions 			break;
3816*8d741a5dSApple OSS Distributions 		}
3817*8d741a5dSApple OSS Distributions 
3818*8d741a5dSApple OSS Distributions 		thread_qos_t qos = _pthread_priority_thread_qos(arg2);
3819*8d741a5dSApple OSS Distributions 		if (qos == THREAD_QOS_UNSPECIFIED) {
3820*8d741a5dSApple OSS Distributions 			error = EINVAL;
3821*8d741a5dSApple OSS Distributions 			break;
3822*8d741a5dSApple OSS Distributions 		}
3823*8d741a5dSApple OSS Distributions 		workq_lock_spin(wq);
3824*8d741a5dSApple OSS Distributions 		bool should_narrow = !workq_constrained_allowance(wq, qos, uth, false, false);
3825*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
3826*8d741a5dSApple OSS Distributions 
3827*8d741a5dSApple OSS Distributions 		*retval = should_narrow;
3828*8d741a5dSApple OSS Distributions 		break;
3829*8d741a5dSApple OSS Distributions 	}
3830*8d741a5dSApple OSS Distributions 	case WQOPS_SETUP_DISPATCH: {
3831*8d741a5dSApple OSS Distributions 		/*
3832*8d741a5dSApple OSS Distributions 		 * item = pointer to workq_dispatch_config structure
3833*8d741a5dSApple OSS Distributions 		 * arg2 = sizeof(item)
3834*8d741a5dSApple OSS Distributions 		 */
3835*8d741a5dSApple OSS Distributions 		struct workq_dispatch_config cfg;
3836*8d741a5dSApple OSS Distributions 		bzero(&cfg, sizeof(cfg));
3837*8d741a5dSApple OSS Distributions 
3838*8d741a5dSApple OSS Distributions 		error = copyin(uap->item, &cfg, MIN(sizeof(cfg), (unsigned long) arg2));
3839*8d741a5dSApple OSS Distributions 		if (error) {
3840*8d741a5dSApple OSS Distributions 			break;
3841*8d741a5dSApple OSS Distributions 		}
3842*8d741a5dSApple OSS Distributions 
3843*8d741a5dSApple OSS Distributions 		if (cfg.wdc_flags & ~WORKQ_DISPATCH_SUPPORTED_FLAGS ||
3844*8d741a5dSApple OSS Distributions 		    cfg.wdc_version < WORKQ_DISPATCH_MIN_SUPPORTED_VERSION) {
3845*8d741a5dSApple OSS Distributions 			error = ENOTSUP;
3846*8d741a5dSApple OSS Distributions 			break;
3847*8d741a5dSApple OSS Distributions 		}
3848*8d741a5dSApple OSS Distributions 
3849*8d741a5dSApple OSS Distributions 		/* Load fields from version 1 */
3850*8d741a5dSApple OSS Distributions 		p->p_dispatchqueue_serialno_offset = cfg.wdc_queue_serialno_offs;
3851*8d741a5dSApple OSS Distributions 
3852*8d741a5dSApple OSS Distributions 		/* Load fields from version 2 */
3853*8d741a5dSApple OSS Distributions 		if (cfg.wdc_version >= 2) {
3854*8d741a5dSApple OSS Distributions 			p->p_dispatchqueue_label_offset = cfg.wdc_queue_label_offs;
3855*8d741a5dSApple OSS Distributions 		}
3856*8d741a5dSApple OSS Distributions 
3857*8d741a5dSApple OSS Distributions 		break;
3858*8d741a5dSApple OSS Distributions 	}
3859*8d741a5dSApple OSS Distributions 	default:
3860*8d741a5dSApple OSS Distributions 		error = EINVAL;
3861*8d741a5dSApple OSS Distributions 		break;
3862*8d741a5dSApple OSS Distributions 	}
3863*8d741a5dSApple OSS Distributions 
3864*8d741a5dSApple OSS Distributions 	return error;
3865*8d741a5dSApple OSS Distributions }
3866*8d741a5dSApple OSS Distributions 
3867*8d741a5dSApple OSS Distributions /*
3868*8d741a5dSApple OSS Distributions  * We have no work to do, park ourselves on the idle list.
3869*8d741a5dSApple OSS Distributions  *
3870*8d741a5dSApple OSS Distributions  * Consumes the workqueue lock and does not return.
3871*8d741a5dSApple OSS Distributions  */
3872*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
3873*8d741a5dSApple OSS Distributions static void
workq_park_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)3874*8d741a5dSApple OSS Distributions workq_park_and_unlock(proc_t p, struct workqueue *wq, struct uthread *uth,
3875*8d741a5dSApple OSS Distributions     uint32_t setup_flags)
3876*8d741a5dSApple OSS Distributions {
3877*8d741a5dSApple OSS Distributions 	assert(uth == current_uthread());
3878*8d741a5dSApple OSS Distributions 	assert(uth->uu_kqr_bound == NULL);
3879*8d741a5dSApple OSS Distributions 	workq_push_idle_thread(p, wq, uth, setup_flags); // may not return
3880*8d741a5dSApple OSS Distributions 
3881*8d741a5dSApple OSS Distributions 	workq_thread_reset_cpupercent(NULL, uth);
3882*8d741a5dSApple OSS Distributions 
3883*8d741a5dSApple OSS Distributions #if CONFIG_PREADOPT_TG
3884*8d741a5dSApple OSS Distributions 	/* Clear the preadoption thread group on the thread.
3885*8d741a5dSApple OSS Distributions 	 *
3886*8d741a5dSApple OSS Distributions 	 * Case 1:
3887*8d741a5dSApple OSS Distributions 	 *		Creator thread which never picked up a thread request. We set a
3888*8d741a5dSApple OSS Distributions 	 *		preadoption thread group on creator threads but if it never picked
3889*8d741a5dSApple OSS Distributions 	 *		up a thread request and didn't go to userspace, then the thread will
3890*8d741a5dSApple OSS Distributions 	 *		park with a preadoption thread group but no explicitly adopted
3891*8d741a5dSApple OSS Distributions 	 *		voucher or work interval.
3892*8d741a5dSApple OSS Distributions 	 *
3893*8d741a5dSApple OSS Distributions 	 *		We drop the preadoption thread group here before proceeding to park.
3894*8d741a5dSApple OSS Distributions 	 *		Note - we may get preempted when we drop the workq lock below.
3895*8d741a5dSApple OSS Distributions 	 *
3896*8d741a5dSApple OSS Distributions 	 * Case 2:
3897*8d741a5dSApple OSS Distributions 	 *		Thread picked up a thread request and bound to it and returned back
3898*8d741a5dSApple OSS Distributions 	 *		from userspace and is parking. At this point, preadoption thread
3899*8d741a5dSApple OSS Distributions 	 *		group should be NULL since the thread has unbound from the thread
3900*8d741a5dSApple OSS Distributions 	 *		request. So this operation should be a no-op.
3901*8d741a5dSApple OSS Distributions 	 */
3902*8d741a5dSApple OSS Distributions 	thread_set_preadopt_thread_group(get_machthread(uth), NULL);
3903*8d741a5dSApple OSS Distributions #endif
3904*8d741a5dSApple OSS Distributions 
3905*8d741a5dSApple OSS Distributions 	if ((uth->uu_workq_flags & UT_WORKQ_IDLE_CLEANUP) &&
3906*8d741a5dSApple OSS Distributions 	    !(uth->uu_workq_flags & UT_WORKQ_DYING)) {
3907*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
3908*8d741a5dSApple OSS Distributions 
3909*8d741a5dSApple OSS Distributions 		/*
3910*8d741a5dSApple OSS Distributions 		 * workq_push_idle_thread() will unset `has_stack`
3911*8d741a5dSApple OSS Distributions 		 * if it wants us to free the stack before parking.
3912*8d741a5dSApple OSS Distributions 		 */
3913*8d741a5dSApple OSS Distributions 		if (!uth->uu_save.uus_workq_park_data.has_stack) {
3914*8d741a5dSApple OSS Distributions 			pthread_functions->workq_markfree_threadstack(p,
3915*8d741a5dSApple OSS Distributions 			    get_machthread(uth), get_task_map(proc_task(p)),
3916*8d741a5dSApple OSS Distributions 			    uth->uu_workq_stackaddr);
3917*8d741a5dSApple OSS Distributions 		}
3918*8d741a5dSApple OSS Distributions 
3919*8d741a5dSApple OSS Distributions 		/*
3920*8d741a5dSApple OSS Distributions 		 * When we remove the voucher from the thread, we may lose our importance
3921*8d741a5dSApple OSS Distributions 		 * causing us to get preempted, so we do this after putting the thread on
3922*8d741a5dSApple OSS Distributions 		 * the idle list.  Then, when we get our importance back we'll be able to
3923*8d741a5dSApple OSS Distributions 		 * use this thread from e.g. the kevent call out to deliver a boosting
3924*8d741a5dSApple OSS Distributions 		 * message.
3925*8d741a5dSApple OSS Distributions 		 *
3926*8d741a5dSApple OSS Distributions 		 * Note that setting the voucher to NULL will not clear the preadoption
3927*8d741a5dSApple OSS Distributions 		 * thread since this thread could have become the creator again and
3928*8d741a5dSApple OSS Distributions 		 * perhaps acquired a preadoption thread group.
3929*8d741a5dSApple OSS Distributions 		 */
3930*8d741a5dSApple OSS Distributions 		__assert_only kern_return_t kr;
3931*8d741a5dSApple OSS Distributions 		kr = thread_set_voucher_name(MACH_PORT_NULL);
3932*8d741a5dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
3933*8d741a5dSApple OSS Distributions 
3934*8d741a5dSApple OSS Distributions 		workq_lock_spin(wq);
3935*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags &= ~UT_WORKQ_IDLE_CLEANUP;
3936*8d741a5dSApple OSS Distributions 		setup_flags &= ~WQ_SETUP_CLEAR_VOUCHER;
3937*8d741a5dSApple OSS Distributions 	}
3938*8d741a5dSApple OSS Distributions 
3939*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_END, wq, 0, 0, 0);
3940*8d741a5dSApple OSS Distributions 
3941*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_RUNNING) {
3942*8d741a5dSApple OSS Distributions 		/*
3943*8d741a5dSApple OSS Distributions 		 * While we'd dropped the lock to unset our voucher, someone came
3944*8d741a5dSApple OSS Distributions 		 * around and made us runnable.  But because we weren't waiting on the
3945*8d741a5dSApple OSS Distributions 		 * event their thread_wakeup() was ineffectual.  To correct for that,
3946*8d741a5dSApple OSS Distributions 		 * we just run the continuation ourselves.
3947*8d741a5dSApple OSS Distributions 		 */
3948*8d741a5dSApple OSS Distributions 		workq_unpark_select_threadreq_or_park_and_unlock(p, wq, uth, setup_flags);
3949*8d741a5dSApple OSS Distributions 		__builtin_unreachable();
3950*8d741a5dSApple OSS Distributions 	}
3951*8d741a5dSApple OSS Distributions 
3952*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_DYING) {
3953*8d741a5dSApple OSS Distributions 		workq_unpark_for_death_and_unlock(p, wq, uth,
3954*8d741a5dSApple OSS Distributions 		    WORKQ_UNPARK_FOR_DEATH_WAS_IDLE, setup_flags);
3955*8d741a5dSApple OSS Distributions 		__builtin_unreachable();
3956*8d741a5dSApple OSS Distributions 	}
3957*8d741a5dSApple OSS Distributions 
3958*8d741a5dSApple OSS Distributions 	/* Disarm the workqueue quantum since the thread is now idle */
3959*8d741a5dSApple OSS Distributions 	thread_disarm_workqueue_quantum(get_machthread(uth));
3960*8d741a5dSApple OSS Distributions 
3961*8d741a5dSApple OSS Distributions 	thread_set_pending_block_hint(get_machthread(uth), kThreadWaitParkedWorkQueue);
3962*8d741a5dSApple OSS Distributions 	assert_wait(workq_parked_wait_event(uth), THREAD_INTERRUPTIBLE);
3963*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
3964*8d741a5dSApple OSS Distributions 	thread_block(workq_unpark_continue);
3965*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
3966*8d741a5dSApple OSS Distributions }
3967*8d741a5dSApple OSS Distributions 
3968*8d741a5dSApple OSS Distributions static inline bool
workq_may_start_event_mgr_thread(struct workqueue * wq,struct uthread * uth)3969*8d741a5dSApple OSS Distributions workq_may_start_event_mgr_thread(struct workqueue *wq, struct uthread *uth)
3970*8d741a5dSApple OSS Distributions {
3971*8d741a5dSApple OSS Distributions 	/*
3972*8d741a5dSApple OSS Distributions 	 * There's an event manager request and either:
3973*8d741a5dSApple OSS Distributions 	 * - no event manager currently running
3974*8d741a5dSApple OSS Distributions 	 * - we are re-using the event manager
3975*8d741a5dSApple OSS Distributions 	 */
3976*8d741a5dSApple OSS Distributions 	return wq->wq_thscheduled_count[_wq_bucket(WORKQ_THREAD_QOS_MANAGER)] == 0 ||
3977*8d741a5dSApple OSS Distributions 	       (uth && uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER);
3978*8d741a5dSApple OSS Distributions }
3979*8d741a5dSApple OSS Distributions 
3980*8d741a5dSApple OSS Distributions /* Called with workq lock held. */
3981*8d741a5dSApple OSS Distributions static uint32_t
workq_constrained_allowance(struct workqueue * wq,thread_qos_t at_qos,struct uthread * uth,bool may_start_timer,bool record_failed_allowance)3982*8d741a5dSApple OSS Distributions workq_constrained_allowance(struct workqueue *wq, thread_qos_t at_qos,
3983*8d741a5dSApple OSS Distributions     struct uthread *uth, bool may_start_timer, bool record_failed_allowance)
3984*8d741a5dSApple OSS Distributions {
3985*8d741a5dSApple OSS Distributions 	assert(at_qos != WORKQ_THREAD_QOS_MANAGER);
3986*8d741a5dSApple OSS Distributions 	uint32_t allowance_passed = 0;
3987*8d741a5dSApple OSS Distributions 	uint32_t count = 0;
3988*8d741a5dSApple OSS Distributions 
3989*8d741a5dSApple OSS Distributions 	uint32_t max_count = wq->wq_constrained_threads_scheduled;
3990*8d741a5dSApple OSS Distributions 	if (uth && workq_thread_is_nonovercommit(uth)) {
3991*8d741a5dSApple OSS Distributions 		/*
3992*8d741a5dSApple OSS Distributions 		 * don't count the current thread as scheduled
3993*8d741a5dSApple OSS Distributions 		 */
3994*8d741a5dSApple OSS Distributions 		assert(max_count > 0);
3995*8d741a5dSApple OSS Distributions 		max_count--;
3996*8d741a5dSApple OSS Distributions 	}
3997*8d741a5dSApple OSS Distributions 	if (max_count >= wq_max_constrained_threads) {
3998*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_constrained_admission | DBG_FUNC_NONE, wq, 1,
3999*8d741a5dSApple OSS Distributions 		    wq->wq_constrained_threads_scheduled,
4000*8d741a5dSApple OSS Distributions 		    wq_max_constrained_threads);
4001*8d741a5dSApple OSS Distributions 		/*
4002*8d741a5dSApple OSS Distributions 		 * we need 1 or more constrained threads to return to the kernel before
4003*8d741a5dSApple OSS Distributions 		 * we can dispatch additional work
4004*8d741a5dSApple OSS Distributions 		 */
4005*8d741a5dSApple OSS Distributions 		allowance_passed = 0;
4006*8d741a5dSApple OSS Distributions 		goto out;
4007*8d741a5dSApple OSS Distributions 	}
4008*8d741a5dSApple OSS Distributions 	max_count -= wq_max_constrained_threads;
4009*8d741a5dSApple OSS Distributions 
4010*8d741a5dSApple OSS Distributions 	/*
4011*8d741a5dSApple OSS Distributions 	 * Compute a metric for many how many threads are active.  We find the
4012*8d741a5dSApple OSS Distributions 	 * highest priority request outstanding and then add up the number of active
4013*8d741a5dSApple OSS Distributions 	 * threads in that and all higher-priority buckets.  We'll also add any
4014*8d741a5dSApple OSS Distributions 	 * "busy" threads which are not currently active but blocked recently enough
4015*8d741a5dSApple OSS Distributions 	 * that we can't be sure that they won't be unblocked soon and start
4016*8d741a5dSApple OSS Distributions 	 * being active again.
4017*8d741a5dSApple OSS Distributions 	 *
4018*8d741a5dSApple OSS Distributions 	 * We'll then compare this metric to our max concurrency to decide whether
4019*8d741a5dSApple OSS Distributions 	 * to add a new thread.
4020*8d741a5dSApple OSS Distributions 	 */
4021*8d741a5dSApple OSS Distributions 
4022*8d741a5dSApple OSS Distributions 	uint32_t busycount, thactive_count;
4023*8d741a5dSApple OSS Distributions 
4024*8d741a5dSApple OSS Distributions 	thactive_count = _wq_thactive_aggregate_downto_qos(wq, _wq_thactive(wq),
4025*8d741a5dSApple OSS Distributions 	    at_qos, &busycount, NULL);
4026*8d741a5dSApple OSS Distributions 
4027*8d741a5dSApple OSS Distributions 	if (uth && uth->uu_workq_pri.qos_bucket != WORKQ_THREAD_QOS_MANAGER &&
4028*8d741a5dSApple OSS Distributions 	    at_qos <= uth->uu_workq_pri.qos_bucket) {
4029*8d741a5dSApple OSS Distributions 		/*
4030*8d741a5dSApple OSS Distributions 		 * Don't count this thread as currently active, but only if it's not
4031*8d741a5dSApple OSS Distributions 		 * a manager thread, as _wq_thactive_aggregate_downto_qos ignores active
4032*8d741a5dSApple OSS Distributions 		 * managers.
4033*8d741a5dSApple OSS Distributions 		 */
4034*8d741a5dSApple OSS Distributions 		assert(thactive_count > 0);
4035*8d741a5dSApple OSS Distributions 		thactive_count--;
4036*8d741a5dSApple OSS Distributions 	}
4037*8d741a5dSApple OSS Distributions 
4038*8d741a5dSApple OSS Distributions 	count = wq_max_parallelism[_wq_bucket(at_qos)];
4039*8d741a5dSApple OSS Distributions 	if (count > thactive_count + busycount) {
4040*8d741a5dSApple OSS Distributions 		count -= thactive_count + busycount;
4041*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_constrained_admission | DBG_FUNC_NONE, wq, 2,
4042*8d741a5dSApple OSS Distributions 		    thactive_count, busycount);
4043*8d741a5dSApple OSS Distributions 		allowance_passed = MIN(count, max_count);
4044*8d741a5dSApple OSS Distributions 		goto out;
4045*8d741a5dSApple OSS Distributions 	} else {
4046*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_constrained_admission | DBG_FUNC_NONE, wq, 3,
4047*8d741a5dSApple OSS Distributions 		    thactive_count, busycount);
4048*8d741a5dSApple OSS Distributions 		allowance_passed = 0;
4049*8d741a5dSApple OSS Distributions 	}
4050*8d741a5dSApple OSS Distributions 
4051*8d741a5dSApple OSS Distributions 	if (may_start_timer) {
4052*8d741a5dSApple OSS Distributions 		/*
4053*8d741a5dSApple OSS Distributions 		 * If this is called from the add timer, we won't have another timer
4054*8d741a5dSApple OSS Distributions 		 * fire when the thread exits the "busy" state, so rearm the timer.
4055*8d741a5dSApple OSS Distributions 		 */
4056*8d741a5dSApple OSS Distributions 		workq_schedule_delayed_thread_creation(wq, 0);
4057*8d741a5dSApple OSS Distributions 	}
4058*8d741a5dSApple OSS Distributions 
4059*8d741a5dSApple OSS Distributions out:
4060*8d741a5dSApple OSS Distributions 	if (record_failed_allowance) {
4061*8d741a5dSApple OSS Distributions 		wq->wq_exceeded_active_constrained_thread_limit = !allowance_passed;
4062*8d741a5dSApple OSS Distributions 	}
4063*8d741a5dSApple OSS Distributions 	return allowance_passed;
4064*8d741a5dSApple OSS Distributions }
4065*8d741a5dSApple OSS Distributions 
4066*8d741a5dSApple OSS Distributions static bool
workq_threadreq_admissible(struct workqueue * wq,struct uthread * uth,workq_threadreq_t req)4067*8d741a5dSApple OSS Distributions workq_threadreq_admissible(struct workqueue *wq, struct uthread *uth,
4068*8d741a5dSApple OSS Distributions     workq_threadreq_t req)
4069*8d741a5dSApple OSS Distributions {
4070*8d741a5dSApple OSS Distributions 	if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
4071*8d741a5dSApple OSS Distributions 		return workq_may_start_event_mgr_thread(wq, uth);
4072*8d741a5dSApple OSS Distributions 	}
4073*8d741a5dSApple OSS Distributions 	if (workq_threadreq_is_cooperative(req)) {
4074*8d741a5dSApple OSS Distributions 		return workq_cooperative_allowance(wq, req->tr_qos, uth, true);
4075*8d741a5dSApple OSS Distributions 	}
4076*8d741a5dSApple OSS Distributions 	if (workq_threadreq_is_nonovercommit(req)) {
4077*8d741a5dSApple OSS Distributions 		return workq_constrained_allowance(wq, req->tr_qos, uth, true, true);
4078*8d741a5dSApple OSS Distributions 	}
4079*8d741a5dSApple OSS Distributions 
4080*8d741a5dSApple OSS Distributions 	return true;
4081*8d741a5dSApple OSS Distributions }
4082*8d741a5dSApple OSS Distributions 
4083*8d741a5dSApple OSS Distributions /*
4084*8d741a5dSApple OSS Distributions  * Called from the context of selecting thread requests for threads returning
4085*8d741a5dSApple OSS Distributions  * from userspace or creator thread
4086*8d741a5dSApple OSS Distributions  */
4087*8d741a5dSApple OSS Distributions static workq_threadreq_t
workq_cooperative_queue_best_req(struct workqueue * wq,struct uthread * uth)4088*8d741a5dSApple OSS Distributions workq_cooperative_queue_best_req(struct workqueue *wq, struct uthread *uth)
4089*8d741a5dSApple OSS Distributions {
4090*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
4091*8d741a5dSApple OSS Distributions 
4092*8d741a5dSApple OSS Distributions 	/*
4093*8d741a5dSApple OSS Distributions 	 * If the current thread is cooperative, we need to exclude it as part of
4094*8d741a5dSApple OSS Distributions 	 * cooperative schedule count since this thread is looking for a new
4095*8d741a5dSApple OSS Distributions 	 * request. Change in the schedule count for cooperative pool therefore
4096*8d741a5dSApple OSS Distributions 	 * requires us to reeevaluate the next best request for it.
4097*8d741a5dSApple OSS Distributions 	 */
4098*8d741a5dSApple OSS Distributions 	if (uth && workq_thread_is_cooperative(uth)) {
4099*8d741a5dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_dec(wq, uth->uu_workq_pri.qos_req);
4100*8d741a5dSApple OSS Distributions 
4101*8d741a5dSApple OSS Distributions 		(void) _wq_cooperative_queue_refresh_best_req_qos(wq);
4102*8d741a5dSApple OSS Distributions 
4103*8d741a5dSApple OSS Distributions 		_wq_cooperative_queue_scheduled_count_inc(wq, uth->uu_workq_pri.qos_req);
4104*8d741a5dSApple OSS Distributions 	} else {
4105*8d741a5dSApple OSS Distributions 		/*
4106*8d741a5dSApple OSS Distributions 		 * The old value that was already precomputed should be safe to use -
4107*8d741a5dSApple OSS Distributions 		 * add an assert that asserts that the best req QoS doesn't change in
4108*8d741a5dSApple OSS Distributions 		 * this case
4109*8d741a5dSApple OSS Distributions 		 */
4110*8d741a5dSApple OSS Distributions 		assert(_wq_cooperative_queue_refresh_best_req_qos(wq) == false);
4111*8d741a5dSApple OSS Distributions 	}
4112*8d741a5dSApple OSS Distributions 
4113*8d741a5dSApple OSS Distributions 	thread_qos_t qos = wq->wq_cooperative_queue_best_req_qos;
4114*8d741a5dSApple OSS Distributions 
4115*8d741a5dSApple OSS Distributions 	/* There are no eligible requests in the cooperative pool */
4116*8d741a5dSApple OSS Distributions 	if (qos == THREAD_QOS_UNSPECIFIED) {
4117*8d741a5dSApple OSS Distributions 		return NULL;
4118*8d741a5dSApple OSS Distributions 	}
4119*8d741a5dSApple OSS Distributions 	assert(qos != WORKQ_THREAD_QOS_ABOVEUI);
4120*8d741a5dSApple OSS Distributions 	assert(qos != WORKQ_THREAD_QOS_MANAGER);
4121*8d741a5dSApple OSS Distributions 
4122*8d741a5dSApple OSS Distributions 	uint8_t bucket = _wq_bucket(qos);
4123*8d741a5dSApple OSS Distributions 	assert(!STAILQ_EMPTY(&wq->wq_cooperative_queue[bucket]));
4124*8d741a5dSApple OSS Distributions 
4125*8d741a5dSApple OSS Distributions 	return STAILQ_FIRST(&wq->wq_cooperative_queue[bucket]);
4126*8d741a5dSApple OSS Distributions }
4127*8d741a5dSApple OSS Distributions 
4128*8d741a5dSApple OSS Distributions static workq_threadreq_t
workq_threadreq_select_for_creator(struct workqueue * wq)4129*8d741a5dSApple OSS Distributions workq_threadreq_select_for_creator(struct workqueue *wq)
4130*8d741a5dSApple OSS Distributions {
4131*8d741a5dSApple OSS Distributions 	workq_threadreq_t req_qos, req_pri, req_tmp, req_mgr;
4132*8d741a5dSApple OSS Distributions 	thread_qos_t qos = THREAD_QOS_UNSPECIFIED;
4133*8d741a5dSApple OSS Distributions 	uint8_t pri = 0;
4134*8d741a5dSApple OSS Distributions 
4135*8d741a5dSApple OSS Distributions 	/*
4136*8d741a5dSApple OSS Distributions 	 * Compute the best priority request, and ignore the turnstile for now
4137*8d741a5dSApple OSS Distributions 	 */
4138*8d741a5dSApple OSS Distributions 
4139*8d741a5dSApple OSS Distributions 	req_pri = priority_queue_max(&wq->wq_special_queue,
4140*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4141*8d741a5dSApple OSS Distributions 	if (req_pri) {
4142*8d741a5dSApple OSS Distributions 		pri = (uint8_t)priority_queue_entry_sched_pri(&wq->wq_special_queue,
4143*8d741a5dSApple OSS Distributions 		    &req_pri->tr_entry);
4144*8d741a5dSApple OSS Distributions 	}
4145*8d741a5dSApple OSS Distributions 
4146*8d741a5dSApple OSS Distributions 	/*
4147*8d741a5dSApple OSS Distributions 	 * Handle the manager thread request. The special queue might yield
4148*8d741a5dSApple OSS Distributions 	 * a higher priority, but the manager always beats the QoS world.
4149*8d741a5dSApple OSS Distributions 	 */
4150*8d741a5dSApple OSS Distributions 
4151*8d741a5dSApple OSS Distributions 	req_mgr = wq->wq_event_manager_threadreq;
4152*8d741a5dSApple OSS Distributions 	if (req_mgr && workq_may_start_event_mgr_thread(wq, NULL)) {
4153*8d741a5dSApple OSS Distributions 		uint32_t mgr_pri = wq->wq_event_manager_priority;
4154*8d741a5dSApple OSS Distributions 
4155*8d741a5dSApple OSS Distributions 		if (mgr_pri & _PTHREAD_PRIORITY_SCHED_PRI_FLAG) {
4156*8d741a5dSApple OSS Distributions 			mgr_pri &= _PTHREAD_PRIORITY_SCHED_PRI_MASK;
4157*8d741a5dSApple OSS Distributions 		} else {
4158*8d741a5dSApple OSS Distributions 			mgr_pri = thread_workq_pri_for_qos(
4159*8d741a5dSApple OSS Distributions 				_pthread_priority_thread_qos(mgr_pri));
4160*8d741a5dSApple OSS Distributions 		}
4161*8d741a5dSApple OSS Distributions 
4162*8d741a5dSApple OSS Distributions 		return mgr_pri >= pri ? req_mgr : req_pri;
4163*8d741a5dSApple OSS Distributions 	}
4164*8d741a5dSApple OSS Distributions 
4165*8d741a5dSApple OSS Distributions 	/*
4166*8d741a5dSApple OSS Distributions 	 * Compute the best QoS Request, and check whether it beats the "pri" one
4167*8d741a5dSApple OSS Distributions 	 *
4168*8d741a5dSApple OSS Distributions 	 * Start by comparing the overcommit and the cooperative pool
4169*8d741a5dSApple OSS Distributions 	 */
4170*8d741a5dSApple OSS Distributions 	req_qos = priority_queue_max(&wq->wq_overcommit_queue,
4171*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4172*8d741a5dSApple OSS Distributions 	if (req_qos) {
4173*8d741a5dSApple OSS Distributions 		qos = req_qos->tr_qos;
4174*8d741a5dSApple OSS Distributions 	}
4175*8d741a5dSApple OSS Distributions 
4176*8d741a5dSApple OSS Distributions 	req_tmp = workq_cooperative_queue_best_req(wq, NULL);
4177*8d741a5dSApple OSS Distributions 	if (req_tmp && qos <= req_tmp->tr_qos) {
4178*8d741a5dSApple OSS Distributions 		/*
4179*8d741a5dSApple OSS Distributions 		 * Cooperative TR is better between overcommit and cooperative.  Note
4180*8d741a5dSApple OSS Distributions 		 * that if qos is same between overcommit and cooperative, we choose
4181*8d741a5dSApple OSS Distributions 		 * cooperative.
4182*8d741a5dSApple OSS Distributions 		 *
4183*8d741a5dSApple OSS Distributions 		 * Pick cooperative pool if it passes the admissions check
4184*8d741a5dSApple OSS Distributions 		 */
4185*8d741a5dSApple OSS Distributions 		if (workq_cooperative_allowance(wq, req_tmp->tr_qos, NULL, true)) {
4186*8d741a5dSApple OSS Distributions 			req_qos = req_tmp;
4187*8d741a5dSApple OSS Distributions 			qos = req_qos->tr_qos;
4188*8d741a5dSApple OSS Distributions 		}
4189*8d741a5dSApple OSS Distributions 	}
4190*8d741a5dSApple OSS Distributions 
4191*8d741a5dSApple OSS Distributions 	/*
4192*8d741a5dSApple OSS Distributions 	 * Compare the best QoS so far - either from overcommit or from cooperative
4193*8d741a5dSApple OSS Distributions 	 * pool - and compare it with the constrained pool
4194*8d741a5dSApple OSS Distributions 	 */
4195*8d741a5dSApple OSS Distributions 	req_tmp = priority_queue_max(&wq->wq_constrained_queue,
4196*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4197*8d741a5dSApple OSS Distributions 
4198*8d741a5dSApple OSS Distributions 	if (req_tmp && qos < req_tmp->tr_qos) {
4199*8d741a5dSApple OSS Distributions 		/*
4200*8d741a5dSApple OSS Distributions 		 * Constrained pool is best in QoS between overcommit, cooperative
4201*8d741a5dSApple OSS Distributions 		 * and constrained. Now check how it fares against the priority case
4202*8d741a5dSApple OSS Distributions 		 */
4203*8d741a5dSApple OSS Distributions 		if (pri && pri >= thread_workq_pri_for_qos(req_tmp->tr_qos)) {
4204*8d741a5dSApple OSS Distributions 			return req_pri;
4205*8d741a5dSApple OSS Distributions 		}
4206*8d741a5dSApple OSS Distributions 
4207*8d741a5dSApple OSS Distributions 		if (workq_constrained_allowance(wq, req_tmp->tr_qos, NULL, true, true)) {
4208*8d741a5dSApple OSS Distributions 			/*
4209*8d741a5dSApple OSS Distributions 			 * If the constrained thread request is the best one and passes
4210*8d741a5dSApple OSS Distributions 			 * the admission check, pick it.
4211*8d741a5dSApple OSS Distributions 			 */
4212*8d741a5dSApple OSS Distributions 			return req_tmp;
4213*8d741a5dSApple OSS Distributions 		}
4214*8d741a5dSApple OSS Distributions 	}
4215*8d741a5dSApple OSS Distributions 
4216*8d741a5dSApple OSS Distributions 	/*
4217*8d741a5dSApple OSS Distributions 	 * Compare the best of the QoS world with the priority
4218*8d741a5dSApple OSS Distributions 	 */
4219*8d741a5dSApple OSS Distributions 	if (pri && (!qos || pri >= thread_workq_pri_for_qos(qos))) {
4220*8d741a5dSApple OSS Distributions 		return req_pri;
4221*8d741a5dSApple OSS Distributions 	}
4222*8d741a5dSApple OSS Distributions 
4223*8d741a5dSApple OSS Distributions 	if (req_qos) {
4224*8d741a5dSApple OSS Distributions 		return req_qos;
4225*8d741a5dSApple OSS Distributions 	}
4226*8d741a5dSApple OSS Distributions 
4227*8d741a5dSApple OSS Distributions 	/*
4228*8d741a5dSApple OSS Distributions 	 * If we had no eligible request but we have a turnstile push,
4229*8d741a5dSApple OSS Distributions 	 * it must be a non overcommit thread request that failed
4230*8d741a5dSApple OSS Distributions 	 * the admission check.
4231*8d741a5dSApple OSS Distributions 	 *
4232*8d741a5dSApple OSS Distributions 	 * Just fake a BG thread request so that if the push stops the creator
4233*8d741a5dSApple OSS Distributions 	 * priority just drops to 4.
4234*8d741a5dSApple OSS Distributions 	 */
4235*8d741a5dSApple OSS Distributions 	if (turnstile_workq_proprietor_of_max_turnstile(wq->wq_turnstile, NULL)) {
4236*8d741a5dSApple OSS Distributions 		static struct workq_threadreq_s workq_sync_push_fake_req = {
4237*8d741a5dSApple OSS Distributions 			.tr_qos = THREAD_QOS_BACKGROUND,
4238*8d741a5dSApple OSS Distributions 		};
4239*8d741a5dSApple OSS Distributions 
4240*8d741a5dSApple OSS Distributions 		return &workq_sync_push_fake_req;
4241*8d741a5dSApple OSS Distributions 	}
4242*8d741a5dSApple OSS Distributions 
4243*8d741a5dSApple OSS Distributions 	return NULL;
4244*8d741a5dSApple OSS Distributions }
4245*8d741a5dSApple OSS Distributions 
4246*8d741a5dSApple OSS Distributions /*
 * Rebalance the pool-specific scheduled-thread counters when thread `uth`
 * takes on a thread request whose type is described by `tr_flags`.
 *
 * wq:             workqueue whose wq_constrained_threads_scheduled counter
 *                 and cooperative per-QoS scheduled counts are adjusted.
 * uth:            thread changing role; its current type is queried with
 *                 workq_thread_is_overcommit()/workq_thread_is_cooperative()
 *                 and its new QoS is read from uth->uu_workq_pri.qos_req.
 * old_thread_qos: QoS passed to the cooperative count decrement when the
 *                 thread currently is a cooperative thread.
 * tr_flags:       flags of the thread request being picked up.
 *
4247*8d741a5dSApple OSS Distributions  * Returns true if this caused a change in the schedule counts of the
4248*8d741a5dSApple OSS Distributions  * cooperative pool
4249*8d741a5dSApple OSS Distributions  */
4250*8d741a5dSApple OSS Distributions static bool
workq_adjust_cooperative_constrained_schedule_counts(struct workqueue * wq,struct uthread * uth,thread_qos_t old_thread_qos,workq_tr_flags_t tr_flags)4251*8d741a5dSApple OSS Distributions workq_adjust_cooperative_constrained_schedule_counts(struct workqueue *wq,
4252*8d741a5dSApple OSS Distributions     struct uthread *uth, thread_qos_t old_thread_qos, workq_tr_flags_t tr_flags)
4253*8d741a5dSApple OSS Distributions {
	/* NOTE(review): presumably asserts the workqueue lock is owned - confirm */
4254*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
4255*8d741a5dSApple OSS Distributions 
4256*8d741a5dSApple OSS Distributions 	/*
4257*8d741a5dSApple OSS Distributions 	 * Row: thread type
4258*8d741a5dSApple OSS Distributions 	 * Column: Request type
4259*8d741a5dSApple OSS Distributions 	 *
4260*8d741a5dSApple OSS Distributions 	 *					overcommit		non-overcommit		cooperative
4261*8d741a5dSApple OSS Distributions 	 * overcommit			X				case 1				case 2
4262*8d741a5dSApple OSS Distributions 	 * cooperative		case 3				case 4				case 5
4263*8d741a5dSApple OSS Distributions 	 * non-overcommit	case 6					X				case 7
4264*8d741a5dSApple OSS Distributions 	 *
4265*8d741a5dSApple OSS Distributions 	 * Move the thread to the right bucket depending on what state it currently
4266*8d741a5dSApple OSS Distributions 	 * has and what state the thread req it picks, is going to have.
4267*8d741a5dSApple OSS Distributions 	 *
4268*8d741a5dSApple OSS Distributions 	 * Note that the creator thread is an overcommit thread.
	 *
	 * The two combinations marked X match no branch below: no counter is
	 * touched and the function returns false.
4269*8d741a5dSApple OSS Distributions 	 */
4270*8d741a5dSApple OSS Distributions 	thread_qos_t new_thread_qos = uth->uu_workq_pri.qos_req;
4271*8d741a5dSApple OSS Distributions 
4272*8d741a5dSApple OSS Distributions 	/*
4273*8d741a5dSApple OSS Distributions 	 * Anytime a cooperative bucket's schedule count changes, we need to
4274*8d741a5dSApple OSS Distributions 	 * potentially refresh the next best QoS for that pool when we determine
4275*8d741a5dSApple OSS Distributions 	 * the next request for the creator
4276*8d741a5dSApple OSS Distributions 	 */
4277*8d741a5dSApple OSS Distributions 	bool cooperative_pool_sched_count_changed = false;
4278*8d741a5dSApple OSS Distributions 
4279*8d741a5dSApple OSS Distributions 	if (workq_thread_is_overcommit(uth)) {
4280*8d741a5dSApple OSS Distributions 		if (workq_tr_is_nonovercommit(tr_flags)) {
4281*8d741a5dSApple OSS Distributions 			// Case 1: thread is overcommit, req is non-overcommit
4282*8d741a5dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled++;
4283*8d741a5dSApple OSS Distributions 		} else if (workq_tr_is_cooperative(tr_flags)) {
4284*8d741a5dSApple OSS Distributions 			// Case 2: thread is overcommit, req is cooperative
4285*8d741a5dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_inc(wq, new_thread_qos);
4286*8d741a5dSApple OSS Distributions 			cooperative_pool_sched_count_changed = true;
4287*8d741a5dSApple OSS Distributions 		}
4288*8d741a5dSApple OSS Distributions 	} else if (workq_thread_is_cooperative(uth)) {
4289*8d741a5dSApple OSS Distributions 		if (workq_tr_is_overcommit(tr_flags)) {
4290*8d741a5dSApple OSS Distributions 			// Case 3: thread is cooperative, req is overcommit
4291*8d741a5dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_dec(wq, old_thread_qos);
4292*8d741a5dSApple OSS Distributions 		} else if (workq_tr_is_nonovercommit(tr_flags)) {
4293*8d741a5dSApple OSS Distributions 			// Case 4: thread is cooperative, req is non-overcommit
4294*8d741a5dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_dec(wq, old_thread_qos);
4295*8d741a5dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled++;
4296*8d741a5dSApple OSS Distributions 		} else {
4297*8d741a5dSApple OSS Distributions 			// Case 5: thread is cooperative, req is also cooperative
4298*8d741a5dSApple OSS Distributions 			assert(workq_tr_is_cooperative(tr_flags));
			// The count moves from the old QoS to the new QoS
4299*8d741a5dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_dec(wq, old_thread_qos);
4300*8d741a5dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_inc(wq, new_thread_qos);
4301*8d741a5dSApple OSS Distributions 		}
		// Cases 3, 4 and 5 all touched a cooperative count, so the flag is
		// set once for the whole branch
4302*8d741a5dSApple OSS Distributions 		cooperative_pool_sched_count_changed = true;
4303*8d741a5dSApple OSS Distributions 	} else {
		// Neither overcommit nor cooperative: the thread is handled as a
		// non-overcommit one
4304*8d741a5dSApple OSS Distributions 		if (workq_tr_is_overcommit(tr_flags)) {
4305*8d741a5dSApple OSS Distributions 			// Case 6: Thread is non-overcommit, req is overcommit
4306*8d741a5dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled--;
4307*8d741a5dSApple OSS Distributions 		} else if (workq_tr_is_cooperative(tr_flags)) {
4308*8d741a5dSApple OSS Distributions 			// Case 7: Thread is non-overcommit, req is cooperative
4309*8d741a5dSApple OSS Distributions 			wq->wq_constrained_threads_scheduled--;
4310*8d741a5dSApple OSS Distributions 			_wq_cooperative_queue_scheduled_count_inc(wq, new_thread_qos);
4311*8d741a5dSApple OSS Distributions 			cooperative_pool_sched_count_changed = true;
4312*8d741a5dSApple OSS Distributions 		}
4313*8d741a5dSApple OSS Distributions 	}
4314*8d741a5dSApple OSS Distributions 
4315*8d741a5dSApple OSS Distributions 	return cooperative_pool_sched_count_changed;
4316*8d741a5dSApple OSS Distributions }
4317*8d741a5dSApple OSS Distributions 
/*
 * Pick the thread request that `uth` should service next.
 *
 * Candidates are weighed in this order:
 *  1. the best "priority" request: the kqworkloop request of the proprietor
 *     reported by turnstile_workq_proprietor_of_max_turnstile(), or the head
 *     of wq_special_queue when its scheduler priority is strictly higher;
 *  2. the event manager request: when it exists and may be started, it is
 *     compared only against the priority request from step 1 (the manager
 *     wins ties) and the QoS queues are not consulted;
 *  3. the best QoS request among the overcommit, cooperative and constrained
 *     queues, the latter two being subject to their admission checks.
 *
 * When `uth` is the workqueue's current creator, NULL is passed to the
 * helper routines in its place.
 *
 * Returns the selected request, or NULL when there is no priority request
 * and no QoS request could be picked.
 */
4318*8d741a5dSApple OSS Distributions static workq_threadreq_t
workq_threadreq_select(struct workqueue * wq,struct uthread * uth)4319*8d741a5dSApple OSS Distributions workq_threadreq_select(struct workqueue *wq, struct uthread *uth)
4320*8d741a5dSApple OSS Distributions {
4321*8d741a5dSApple OSS Distributions 	workq_threadreq_t req_qos, req_pri, req_tmp, req_mgr;
4322*8d741a5dSApple OSS Distributions 	uintptr_t proprietor;
4323*8d741a5dSApple OSS Distributions 	thread_qos_t qos = THREAD_QOS_UNSPECIFIED;
4324*8d741a5dSApple OSS Distributions 	uint8_t pri = 0;
4325*8d741a5dSApple OSS Distributions 
4326*8d741a5dSApple OSS Distributions 	if (uth == wq->wq_creator) {
4327*8d741a5dSApple OSS Distributions 		uth = NULL;
4328*8d741a5dSApple OSS Distributions 	}
4329*8d741a5dSApple OSS Distributions 
4330*8d741a5dSApple OSS Distributions 	/*
4331*8d741a5dSApple OSS Distributions 	 * Compute the best priority request (special or turnstile)
4332*8d741a5dSApple OSS Distributions 	 */
4333*8d741a5dSApple OSS Distributions 
4334*8d741a5dSApple OSS Distributions 	pri = (uint8_t)turnstile_workq_proprietor_of_max_turnstile(wq->wq_turnstile,
4335*8d741a5dSApple OSS Distributions 	    &proprietor);
4336*8d741a5dSApple OSS Distributions 	if (pri) {
		/*
		 * The proprietor is interpreted as a kqworkloop whose embedded
		 * thread request must still be in the QUEUED state.
		 */
4337*8d741a5dSApple OSS Distributions 		struct kqworkloop *kqwl = (struct kqworkloop *)proprietor;
4338*8d741a5dSApple OSS Distributions 		req_pri = &kqwl->kqwl_request;
4339*8d741a5dSApple OSS Distributions 		if (req_pri->tr_state != WORKQ_TR_STATE_QUEUED) {
4340*8d741a5dSApple OSS Distributions 			panic("Invalid thread request (%p) state %d",
4341*8d741a5dSApple OSS Distributions 			    req_pri, req_pri->tr_state);
4342*8d741a5dSApple OSS Distributions 		}
4343*8d741a5dSApple OSS Distributions 	} else {
4344*8d741a5dSApple OSS Distributions 		req_pri = NULL;
4345*8d741a5dSApple OSS Distributions 	}
4346*8d741a5dSApple OSS Distributions 
	/*
	 * The special queue head replaces the turnstile candidate only when
	 * its scheduler priority is strictly higher.
	 */
4347*8d741a5dSApple OSS Distributions 	req_tmp = priority_queue_max(&wq->wq_special_queue,
4348*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4349*8d741a5dSApple OSS Distributions 	if (req_tmp && pri < priority_queue_entry_sched_pri(&wq->wq_special_queue,
4350*8d741a5dSApple OSS Distributions 	    &req_tmp->tr_entry)) {
4351*8d741a5dSApple OSS Distributions 		req_pri = req_tmp;
4352*8d741a5dSApple OSS Distributions 		pri = (uint8_t)priority_queue_entry_sched_pri(&wq->wq_special_queue,
4353*8d741a5dSApple OSS Distributions 		    &req_tmp->tr_entry);
4354*8d741a5dSApple OSS Distributions 	}
4355*8d741a5dSApple OSS Distributions 
4356*8d741a5dSApple OSS Distributions 	/*
4357*8d741a5dSApple OSS Distributions 	 * Handle the manager thread request. The special queue might yield
4358*8d741a5dSApple OSS Distributions 	 * a higher priority, but the manager always beats the QoS world.
4359*8d741a5dSApple OSS Distributions 	 */
4360*8d741a5dSApple OSS Distributions 
4361*8d741a5dSApple OSS Distributions 	req_mgr = wq->wq_event_manager_threadreq;
4362*8d741a5dSApple OSS Distributions 	if (req_mgr && workq_may_start_event_mgr_thread(wq, uth)) {
4363*8d741a5dSApple OSS Distributions 		uint32_t mgr_pri = wq->wq_event_manager_priority;
4364*8d741a5dSApple OSS Distributions 
		/*
		 * The stored manager priority is either a raw scheduler priority
		 * (flag set) or a QoS that gets converted to a scheduler priority.
		 */
4365*8d741a5dSApple OSS Distributions 		if (mgr_pri & _PTHREAD_PRIORITY_SCHED_PRI_FLAG) {
4366*8d741a5dSApple OSS Distributions 			mgr_pri &= _PTHREAD_PRIORITY_SCHED_PRI_MASK;
4367*8d741a5dSApple OSS Distributions 		} else {
4368*8d741a5dSApple OSS Distributions 			mgr_pri = thread_workq_pri_for_qos(
4369*8d741a5dSApple OSS Distributions 				_pthread_priority_thread_qos(mgr_pri));
4370*8d741a5dSApple OSS Distributions 		}
4371*8d741a5dSApple OSS Distributions 
		/* When pri is 0 (no priority request) the manager is returned */
4372*8d741a5dSApple OSS Distributions 		return mgr_pri >= pri ? req_mgr : req_pri;
4373*8d741a5dSApple OSS Distributions 	}
4374*8d741a5dSApple OSS Distributions 
4375*8d741a5dSApple OSS Distributions 	/*
4376*8d741a5dSApple OSS Distributions 	 * Compute the best QoS Request, and check whether it beats the "pri" one
4377*8d741a5dSApple OSS Distributions 	 */
4378*8d741a5dSApple OSS Distributions 
4379*8d741a5dSApple OSS Distributions 	req_qos = priority_queue_max(&wq->wq_overcommit_queue,
4380*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4381*8d741a5dSApple OSS Distributions 	if (req_qos) {
4382*8d741a5dSApple OSS Distributions 		qos = req_qos->tr_qos;
4383*8d741a5dSApple OSS Distributions 	}
4384*8d741a5dSApple OSS Distributions 
4385*8d741a5dSApple OSS Distributions 	req_tmp = workq_cooperative_queue_best_req(wq, uth);
4386*8d741a5dSApple OSS Distributions 	if (req_tmp && qos <= req_tmp->tr_qos) {
4387*8d741a5dSApple OSS Distributions 		/*
4388*8d741a5dSApple OSS Distributions 		 * Cooperative TR is better between overcommit and cooperative.  Note
4389*8d741a5dSApple OSS Distributions 		 * that if qos is same between overcommit and cooperative, we choose
4390*8d741a5dSApple OSS Distributions 		 * cooperative.
4391*8d741a5dSApple OSS Distributions 		 *
4392*8d741a5dSApple OSS Distributions 		 * Pick cooperative pool if it passes the admissions check
4393*8d741a5dSApple OSS Distributions 		 */
4394*8d741a5dSApple OSS Distributions 		if (workq_cooperative_allowance(wq, req_tmp->tr_qos, uth, true)) {
4395*8d741a5dSApple OSS Distributions 			req_qos = req_tmp;
4396*8d741a5dSApple OSS Distributions 			qos = req_qos->tr_qos;
4397*8d741a5dSApple OSS Distributions 		}
4398*8d741a5dSApple OSS Distributions 	}
4399*8d741a5dSApple OSS Distributions 
4400*8d741a5dSApple OSS Distributions 	/*
4401*8d741a5dSApple OSS Distributions 	 * Compare the best QoS so far - either from overcommit or from cooperative
4402*8d741a5dSApple OSS Distributions 	 * pool - and compare it with the constrained pool
	 *
	 * The comparison is strict: at equal QoS the overcommit/cooperative
	 * candidate is kept.
4403*8d741a5dSApple OSS Distributions 	 */
4404*8d741a5dSApple OSS Distributions 	req_tmp = priority_queue_max(&wq->wq_constrained_queue,
4405*8d741a5dSApple OSS Distributions 	    struct workq_threadreq_s, tr_entry);
4406*8d741a5dSApple OSS Distributions 
4407*8d741a5dSApple OSS Distributions 	if (req_tmp && qos < req_tmp->tr_qos) {
4408*8d741a5dSApple OSS Distributions 		/*
4409*8d741a5dSApple OSS Distributions 		 * Constrained pool is best in QoS between overcommit, cooperative
4410*8d741a5dSApple OSS Distributions 		 * and constrained. Now check how it fares against the priority case
4411*8d741a5dSApple OSS Distributions 		 */
4412*8d741a5dSApple OSS Distributions 		if (pri && pri >= thread_workq_pri_for_qos(req_tmp->tr_qos)) {
4413*8d741a5dSApple OSS Distributions 			return req_pri;
4414*8d741a5dSApple OSS Distributions 		}
4415*8d741a5dSApple OSS Distributions 
4416*8d741a5dSApple OSS Distributions 		if (workq_constrained_allowance(wq, req_tmp->tr_qos, uth, true, true)) {
4417*8d741a5dSApple OSS Distributions 			/*
4418*8d741a5dSApple OSS Distributions 			 * If the constrained thread request is the best one and passes
4419*8d741a5dSApple OSS Distributions 			 * the admission check, pick it.
4420*8d741a5dSApple OSS Distributions 			 */
4421*8d741a5dSApple OSS Distributions 			return req_tmp;
4422*8d741a5dSApple OSS Distributions 		}
4423*8d741a5dSApple OSS Distributions 	}
4424*8d741a5dSApple OSS Distributions 
	/*
	 * Reached when the constrained head was not strictly better or failed
	 * its admission check: the priority request wins if there is no QoS
	 * candidate, or if its priority is at least the scheduler priority of
	 * the best remaining QoS.
	 */
4425*8d741a5dSApple OSS Distributions 	if (req_pri && (!qos || pri >= thread_workq_pri_for_qos(qos))) {
4426*8d741a5dSApple OSS Distributions 		return req_pri;
4427*8d741a5dSApple OSS Distributions 	}
4428*8d741a5dSApple OSS Distributions 
4429*8d741a5dSApple OSS Distributions 	return req_qos;
4430*8d741a5dSApple OSS Distributions }
4431*8d741a5dSApple OSS Distributions 
4432*8d741a5dSApple OSS Distributions /*
4433*8d741a5dSApple OSS Distributions  * The creator is an anonymous thread that is counted as scheduled,
4434*8d741a5dSApple OSS Distributions  * but otherwise without its scheduler callback set or tracked as active
4435*8d741a5dSApple OSS Distributions  * that is used to make other threads.
4436*8d741a5dSApple OSS Distributions  *
4437*8d741a5dSApple OSS Distributions  * When more requests are added or an existing one is hurried along,
4438*8d741a5dSApple OSS Distributions  * a creator is elected and setup, or the existing one overridden accordingly.
4439*8d741a5dSApple OSS Distributions  *
4440*8d741a5dSApple OSS Distributions  * While this creator is in flight, because no request has been dequeued,
4441*8d741a5dSApple OSS Distributions  * already running threads have a chance at stealing thread requests avoiding
4442*8d741a5dSApple OSS Distributions  * useless context switches, and the creator once scheduled may not find any
4443*8d741a5dSApple OSS Distributions  * work to do and will then just park again.
4444*8d741a5dSApple OSS Distributions  *
4445*8d741a5dSApple OSS Distributions  * The creator serves the dual purpose of informing the scheduler of work that
4446*8d741a5dSApple OSS Distributions  * hasn't been materialized as threads yet, and also as a natural pacing mechanism
4447*8d741a5dSApple OSS Distributions  * for thread creation.
4448*8d741a5dSApple OSS Distributions  *
4449*8d741a5dSApple OSS Distributions  * By being anonymous (and not bound to anything) it means that thread requests
4450*8d741a5dSApple OSS Distributions  * can be stolen from this creator by threads already on core yielding more
4451*8d741a5dSApple OSS Distributions  * efficient scheduling and reduced context switches.
 *
 * p:     process handed to workq_add_new_idle_thread(); the assertion below
 *        only allows it to be NULL when WORKQ_THREADREQ_CAN_CREATE_THREADS
 *        is not set in `flags`.
 * wq:    workqueue to elect or update a creator for.
 * flags: WORKQ_THREADREQ_* flags selecting what to do when no creator and no
 *        idle thread exist (set a redrive AST, create a thread inline, or
 *        defer creation).
4452*8d741a5dSApple OSS Distributions  */
4453*8d741a5dSApple OSS Distributions static void
workq_schedule_creator(proc_t p,struct workqueue * wq,workq_kern_threadreq_flags_t flags)4454*8d741a5dSApple OSS Distributions workq_schedule_creator(proc_t p, struct workqueue *wq,
4455*8d741a5dSApple OSS Distributions     workq_kern_threadreq_flags_t flags)
4456*8d741a5dSApple OSS Distributions {
4457*8d741a5dSApple OSS Distributions 	workq_threadreq_t req;
4458*8d741a5dSApple OSS Distributions 	struct uthread *uth;
4459*8d741a5dSApple OSS Distributions 	bool needs_wakeup;
4460*8d741a5dSApple OSS Distributions 
4461*8d741a5dSApple OSS Distributions 	workq_lock_held(wq);
4462*8d741a5dSApple OSS Distributions 	assert(p || (flags & WORKQ_THREADREQ_CAN_CREATE_THREADS) == 0);
4463*8d741a5dSApple OSS Distributions 
	/*
	 * Also re-entered after a new idle thread was successfully added, so
	 * that the creator, request count and best request are all re-read.
	 */
4464*8d741a5dSApple OSS Distributions again:
4465*8d741a5dSApple OSS Distributions 	uth = wq->wq_creator;
4466*8d741a5dSApple OSS Distributions 
4467*8d741a5dSApple OSS Distributions 	if (!wq->wq_reqcount) {
4468*8d741a5dSApple OSS Distributions 		/*
4469*8d741a5dSApple OSS Distributions 		 * There is no thread request left.
4470*8d741a5dSApple OSS Distributions 		 *
4471*8d741a5dSApple OSS Distributions 		 * If there is a creator, leave everything in place, so that it cleans
4472*8d741a5dSApple OSS Distributions 		 * up itself in workq_push_idle_thread().
4473*8d741a5dSApple OSS Distributions 		 *
4474*8d741a5dSApple OSS Distributions 		 * Else, make sure the turnstile state is reset to no inheritor.
4475*8d741a5dSApple OSS Distributions 		 */
4476*8d741a5dSApple OSS Distributions 		if (uth == NULL) {
4477*8d741a5dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
4478*8d741a5dSApple OSS Distributions 		}
4479*8d741a5dSApple OSS Distributions 		return;
4480*8d741a5dSApple OSS Distributions 	}
4481*8d741a5dSApple OSS Distributions 
4482*8d741a5dSApple OSS Distributions 	req = workq_threadreq_select_for_creator(wq);
4483*8d741a5dSApple OSS Distributions 	if (req == NULL) {
4484*8d741a5dSApple OSS Distributions 		/*
4485*8d741a5dSApple OSS Distributions 		 * There isn't a thread request that passes the admission check.
4486*8d741a5dSApple OSS Distributions 		 *
4487*8d741a5dSApple OSS Distributions 		 * If there is a creator, do not touch anything, the creator will sort
4488*8d741a5dSApple OSS Distributions 		 * it out when it runs.
4489*8d741a5dSApple OSS Distributions 		 *
4490*8d741a5dSApple OSS Distributions 		 * Else, set the inheritor to "WORKQ" so that the turnstile propagation
4491*8d741a5dSApple OSS Distributions 		 * code calls us if anything changes.
4492*8d741a5dSApple OSS Distributions 		 */
4493*8d741a5dSApple OSS Distributions 		if (uth == NULL) {
4494*8d741a5dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, wq, TURNSTILE_INHERITOR_WORKQ);
4495*8d741a5dSApple OSS Distributions 		}
4496*8d741a5dSApple OSS Distributions 		return;
4497*8d741a5dSApple OSS Distributions 	}
4498*8d741a5dSApple OSS Distributions 
4499*8d741a5dSApple OSS Distributions 
4500*8d741a5dSApple OSS Distributions 	if (uth) {
4501*8d741a5dSApple OSS Distributions 		/*
4502*8d741a5dSApple OSS Distributions 		 * We need to maybe override the creator we already have
4503*8d741a5dSApple OSS Distributions 		 */
4504*8d741a5dSApple OSS Distributions 		if (workq_thread_needs_priority_change(req, uth)) {
4505*8d741a5dSApple OSS Distributions 			WQ_TRACE_WQ(TRACE_wq_creator_select | DBG_FUNC_NONE,
4506*8d741a5dSApple OSS Distributions 			    wq, 1, uthread_tid(uth), req->tr_qos);
4507*8d741a5dSApple OSS Distributions 			workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
4508*8d741a5dSApple OSS Distributions 		}
		/* An existing creator is expected to already be the inheritor */
4509*8d741a5dSApple OSS Distributions 		assert(wq->wq_inheritor == get_machthread(uth));
4510*8d741a5dSApple OSS Distributions 	} else if (wq->wq_thidlecount) {
4511*8d741a5dSApple OSS Distributions 		/*
4512*8d741a5dSApple OSS Distributions 		 * We need to unpark a creator thread
4513*8d741a5dSApple OSS Distributions 		 */
4514*8d741a5dSApple OSS Distributions 		wq->wq_creator = uth = workq_pop_idle_thread(wq, UT_WORKQ_OVERCOMMIT,
4515*8d741a5dSApple OSS Distributions 		    &needs_wakeup);
4516*8d741a5dSApple OSS Distributions 		/* Always reset the priorities on the newly chosen creator */
4517*8d741a5dSApple OSS Distributions 		workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
4518*8d741a5dSApple OSS Distributions 		workq_turnstile_update_inheritor(wq, get_machthread(uth),
4519*8d741a5dSApple OSS Distributions 		    TURNSTILE_INHERITOR_THREAD);
4520*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_select | DBG_FUNC_NONE,
4521*8d741a5dSApple OSS Distributions 		    wq, 2, uthread_tid(uth), req->tr_qos);
		/* Start the new creator's park data from the current state */
4522*8d741a5dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.fulfilled_snapshot = wq->wq_fulfilled;
4523*8d741a5dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.yields = 0;
4524*8d741a5dSApple OSS Distributions 		if (needs_wakeup) {
4525*8d741a5dSApple OSS Distributions 			workq_thread_wakeup(uth);
4526*8d741a5dSApple OSS Distributions 		}
4527*8d741a5dSApple OSS Distributions 	} else {
4528*8d741a5dSApple OSS Distributions 		/*
4529*8d741a5dSApple OSS Distributions 		 * We need to allocate a thread...
4530*8d741a5dSApple OSS Distributions 		 */
4531*8d741a5dSApple OSS Distributions 		if (__improbable(wq->wq_nthreads >= wq_max_threads)) {
4532*8d741a5dSApple OSS Distributions 			/* out of threads, just go away */
			/*
			 * NOTE(review): presumably WORKQ_THREADREQ_NONE has no flag
			 * bits set, so the inheritor check at the end of this branch
			 * sees SET_AST_ON_FAILURE as clear - confirm.
			 */
4533*8d741a5dSApple OSS Distributions 			flags = WORKQ_THREADREQ_NONE;
4534*8d741a5dSApple OSS Distributions 		} else if (flags & WORKQ_THREADREQ_SET_AST_ON_FAILURE) {
4535*8d741a5dSApple OSS Distributions 			act_set_astkevent(current_thread(), AST_KEVENT_REDRIVE_THREADREQ);
4536*8d741a5dSApple OSS Distributions 		} else if (!(flags & WORKQ_THREADREQ_CAN_CREATE_THREADS)) {
4537*8d741a5dSApple OSS Distributions 			/* This can drop the workqueue lock, and take it again */
4538*8d741a5dSApple OSS Distributions 			workq_schedule_immediate_thread_creation(wq);
4539*8d741a5dSApple OSS Distributions 		} else if ((workq_add_new_idle_thread(p, wq,
4540*8d741a5dSApple OSS Distributions 		    workq_unpark_continue, false, NULL) == KERN_SUCCESS)) {
			/* A thread was added: retry from the top to elect it */
4541*8d741a5dSApple OSS Distributions 			goto again;
4542*8d741a5dSApple OSS Distributions 		} else {
			/* Inline creation failed: fall back to delayed creation */
4543*8d741a5dSApple OSS Distributions 			workq_schedule_delayed_thread_creation(wq, 0);
4544*8d741a5dSApple OSS Distributions 		}
4545*8d741a5dSApple OSS Distributions 
4546*8d741a5dSApple OSS Distributions 		/*
4547*8d741a5dSApple OSS Distributions 		 * If the current thread is the inheritor:
4548*8d741a5dSApple OSS Distributions 		 *
4549*8d741a5dSApple OSS Distributions 		 * If we set the AST, then the thread will stay the inheritor until
4550*8d741a5dSApple OSS Distributions 		 * either the AST calls workq_kern_threadreq_redrive(), or it parks
4551*8d741a5dSApple OSS Distributions 		 * and calls workq_push_idle_thread().
4552*8d741a5dSApple OSS Distributions 		 *
4553*8d741a5dSApple OSS Distributions 		 * Else, the responsibility of the thread creation is with a thread-call
4554*8d741a5dSApple OSS Distributions 		 * and we need to clear the inheritor.
4555*8d741a5dSApple OSS Distributions 		 */
4556*8d741a5dSApple OSS Distributions 		if ((flags & WORKQ_THREADREQ_SET_AST_ON_FAILURE) == 0 &&
4557*8d741a5dSApple OSS Distributions 		    wq->wq_inheritor == current_thread()) {
4558*8d741a5dSApple OSS Distributions 			workq_turnstile_update_inheritor(wq, TURNSTILE_INHERITOR_NULL, 0);
4559*8d741a5dSApple OSS Distributions 		}
4560*8d741a5dSApple OSS Distributions 	}
4561*8d741a5dSApple OSS Distributions }
4562*8d741a5dSApple OSS Distributions 
4563*8d741a5dSApple OSS Distributions /**
4564*8d741a5dSApple OSS Distributions  * Same as workq_unpark_select_threadreq_or_park_and_unlock,
4565*8d741a5dSApple OSS Distributions  * but do not allow early binds.
4566*8d741a5dSApple OSS Distributions  *
4567*8d741a5dSApple OSS Distributions  * Called with the base pri frozen, will unfreeze it.
4568*8d741a5dSApple OSS Distributions  */
4569*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
4570*8d741a5dSApple OSS Distributions static void
workq_select_threadreq_or_park_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)4571*8d741a5dSApple OSS Distributions workq_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
4572*8d741a5dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags)
4573*8d741a5dSApple OSS Distributions {
4574*8d741a5dSApple OSS Distributions 	workq_threadreq_t req = NULL;
4575*8d741a5dSApple OSS Distributions 	bool is_creator = (wq->wq_creator == uth);
4576*8d741a5dSApple OSS Distributions 	bool schedule_creator = false;
4577*8d741a5dSApple OSS Distributions 
4578*8d741a5dSApple OSS Distributions 	if (__improbable(_wq_exiting(wq))) {
4579*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 0, 0, 0);
4580*8d741a5dSApple OSS Distributions 		goto park;
4581*8d741a5dSApple OSS Distributions 	}
4582*8d741a5dSApple OSS Distributions 
4583*8d741a5dSApple OSS Distributions 	if (wq->wq_reqcount == 0) {
4584*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 1, 0, 0);
4585*8d741a5dSApple OSS Distributions 		goto park;
4586*8d741a5dSApple OSS Distributions 	}
4587*8d741a5dSApple OSS Distributions 
4588*8d741a5dSApple OSS Distributions 	req = workq_threadreq_select(wq, uth);
4589*8d741a5dSApple OSS Distributions 	if (__improbable(req == NULL)) {
4590*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 2, 0, 0);
4591*8d741a5dSApple OSS Distributions 		goto park;
4592*8d741a5dSApple OSS Distributions 	}
4593*8d741a5dSApple OSS Distributions 
4594*8d741a5dSApple OSS Distributions 	struct uu_workq_policy old_pri = uth->uu_workq_pri;
4595*8d741a5dSApple OSS Distributions 	uint8_t tr_flags = req->tr_flags;
4596*8d741a5dSApple OSS Distributions 	struct turnstile *req_ts = kqueue_threadreq_get_turnstile(req);
4597*8d741a5dSApple OSS Distributions 
4598*8d741a5dSApple OSS Distributions 	/*
4599*8d741a5dSApple OSS Distributions 	 * Attempt to setup ourselves as the new thing to run, moving all priority
4600*8d741a5dSApple OSS Distributions 	 * pushes to ourselves.
4601*8d741a5dSApple OSS Distributions 	 *
4602*8d741a5dSApple OSS Distributions 	 * If the current thread is the creator, then the fact that we are presently
4603*8d741a5dSApple OSS Distributions 	 * running is proof that we'll do something useful, so keep going.
4604*8d741a5dSApple OSS Distributions 	 *
4605*8d741a5dSApple OSS Distributions 	 * For other cases, peek at the AST to know whether the scheduler wants
4606*8d741a5dSApple OSS Distributions 	 * to preempt us, if yes, park instead, and move the thread request
4607*8d741a5dSApple OSS Distributions 	 * turnstile back to the workqueue.
4608*8d741a5dSApple OSS Distributions 	 */
4609*8d741a5dSApple OSS Distributions 	if (req_ts) {
4610*8d741a5dSApple OSS Distributions 		workq_perform_turnstile_operation_locked(wq, ^{
4611*8d741a5dSApple OSS Distributions 			turnstile_update_inheritor(req_ts, get_machthread(uth),
4612*8d741a5dSApple OSS Distributions 			TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_THREAD);
4613*8d741a5dSApple OSS Distributions 			turnstile_update_inheritor_complete(req_ts,
4614*8d741a5dSApple OSS Distributions 			TURNSTILE_INTERLOCK_HELD);
4615*8d741a5dSApple OSS Distributions 		});
4616*8d741a5dSApple OSS Distributions 	}
4617*8d741a5dSApple OSS Distributions 
4618*8d741a5dSApple OSS Distributions 	/* accounting changes of aggregate thscheduled_count and thactive which has
4619*8d741a5dSApple OSS Distributions 	 * to be paired with the workq_thread_reset_pri below so that we have
4620*8d741a5dSApple OSS Distributions 	 * uth->uu_workq_pri match with thactive.
4621*8d741a5dSApple OSS Distributions 	 *
4622*8d741a5dSApple OSS Distributions 	 * This is undone when the thread parks */
4623*8d741a5dSApple OSS Distributions 	if (is_creator) {
4624*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_select, wq, 4, 0,
4625*8d741a5dSApple OSS Distributions 		    uth->uu_save.uus_workq_park_data.yields);
4626*8d741a5dSApple OSS Distributions 		wq->wq_creator = NULL;
4627*8d741a5dSApple OSS Distributions 		_wq_thactive_inc(wq, req->tr_qos);
4628*8d741a5dSApple OSS Distributions 		wq->wq_thscheduled_count[_wq_bucket(req->tr_qos)]++;
4629*8d741a5dSApple OSS Distributions 	} else if (old_pri.qos_bucket != req->tr_qos) {
4630*8d741a5dSApple OSS Distributions 		_wq_thactive_move(wq, old_pri.qos_bucket, req->tr_qos);
4631*8d741a5dSApple OSS Distributions 	}
4632*8d741a5dSApple OSS Distributions 	workq_thread_reset_pri(wq, uth, req, /*unpark*/ true);
4633*8d741a5dSApple OSS Distributions 
4634*8d741a5dSApple OSS Distributions 	/*
4635*8d741a5dSApple OSS Distributions 	 * Make relevant accounting changes for pool specific counts.
4636*8d741a5dSApple OSS Distributions 	 *
4637*8d741a5dSApple OSS Distributions 	 * The schedule counts changing can affect what the next best request
4638*8d741a5dSApple OSS Distributions 	 * for cooperative thread pool is if this request is dequeued.
4639*8d741a5dSApple OSS Distributions 	 */
4640*8d741a5dSApple OSS Distributions 	bool cooperative_sched_count_changed =
4641*8d741a5dSApple OSS Distributions 	    workq_adjust_cooperative_constrained_schedule_counts(wq, uth,
4642*8d741a5dSApple OSS Distributions 	    old_pri.qos_req, tr_flags);
4643*8d741a5dSApple OSS Distributions 
4644*8d741a5dSApple OSS Distributions 	if (workq_tr_is_overcommit(tr_flags)) {
4645*8d741a5dSApple OSS Distributions 		workq_thread_set_type(uth, UT_WORKQ_OVERCOMMIT);
4646*8d741a5dSApple OSS Distributions 	} else if (workq_tr_is_cooperative(tr_flags)) {
4647*8d741a5dSApple OSS Distributions 		workq_thread_set_type(uth, UT_WORKQ_COOPERATIVE);
4648*8d741a5dSApple OSS Distributions 	} else {
4649*8d741a5dSApple OSS Distributions 		workq_thread_set_type(uth, 0);
4650*8d741a5dSApple OSS Distributions 	}
4651*8d741a5dSApple OSS Distributions 
4652*8d741a5dSApple OSS Distributions 	if (__improbable(thread_unfreeze_base_pri(get_machthread(uth)) && !is_creator)) {
4653*8d741a5dSApple OSS Distributions 		if (req_ts) {
4654*8d741a5dSApple OSS Distributions 			workq_perform_turnstile_operation_locked(wq, ^{
4655*8d741a5dSApple OSS Distributions 				turnstile_update_inheritor(req_ts, wq->wq_turnstile,
4656*8d741a5dSApple OSS Distributions 				TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_TURNSTILE);
4657*8d741a5dSApple OSS Distributions 				turnstile_update_inheritor_complete(req_ts,
4658*8d741a5dSApple OSS Distributions 				TURNSTILE_INTERLOCK_HELD);
4659*8d741a5dSApple OSS Distributions 			});
4660*8d741a5dSApple OSS Distributions 		}
4661*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_select_threadreq | DBG_FUNC_NONE, wq, 3, 0, 0);
4662*8d741a5dSApple OSS Distributions 
4663*8d741a5dSApple OSS Distributions 		/*
4664*8d741a5dSApple OSS Distributions 		 * If a cooperative thread was the one which picked up the manager
4665*8d741a5dSApple OSS Distributions 		 * thread request, we need to reevaluate the cooperative pool before
4666*8d741a5dSApple OSS Distributions 		 * it goes and parks.
4667*8d741a5dSApple OSS Distributions 		 *
4668*8d741a5dSApple OSS Distributions 		 * For every other of thread request that it picks up, the logic in
4669*8d741a5dSApple OSS Distributions 		 * workq_threadreq_select should have done this refresh.
4670*8d741a5dSApple OSS Distributions 		 * See workq_push_idle_thread.
4671*8d741a5dSApple OSS Distributions 		 */
4672*8d741a5dSApple OSS Distributions 		if (cooperative_sched_count_changed) {
4673*8d741a5dSApple OSS Distributions 			if (req->tr_qos == WORKQ_THREAD_QOS_MANAGER) {
4674*8d741a5dSApple OSS Distributions 				_wq_cooperative_queue_refresh_best_req_qos(wq);
4675*8d741a5dSApple OSS Distributions 			}
4676*8d741a5dSApple OSS Distributions 		}
4677*8d741a5dSApple OSS Distributions 		goto park_thawed;
4678*8d741a5dSApple OSS Distributions 	}
4679*8d741a5dSApple OSS Distributions 
4680*8d741a5dSApple OSS Distributions 	/*
4681*8d741a5dSApple OSS Distributions 	 * We passed all checks, dequeue the request, bind to it, and set it up
4682*8d741a5dSApple OSS Distributions 	 * to return to user.
4683*8d741a5dSApple OSS Distributions 	 */
4684*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_START, wq,
4685*8d741a5dSApple OSS Distributions 	    workq_trace_req_id(req), tr_flags, 0);
4686*8d741a5dSApple OSS Distributions 	wq->wq_fulfilled++;
4687*8d741a5dSApple OSS Distributions 	schedule_creator = workq_threadreq_dequeue(wq, req,
4688*8d741a5dSApple OSS Distributions 	    cooperative_sched_count_changed);
4689*8d741a5dSApple OSS Distributions 
4690*8d741a5dSApple OSS Distributions 	workq_thread_reset_cpupercent(req, uth);
4691*8d741a5dSApple OSS Distributions 
4692*8d741a5dSApple OSS Distributions 	if (tr_flags & (WORKQ_TR_FLAG_KEVENT | WORKQ_TR_FLAG_WORKLOOP)) {
4693*8d741a5dSApple OSS Distributions 		kqueue_threadreq_bind_prepost(p, req, uth);
4694*8d741a5dSApple OSS Distributions 		req = NULL;
4695*8d741a5dSApple OSS Distributions 	} else if (req->tr_count > 0) {
4696*8d741a5dSApple OSS Distributions 		req = NULL;
4697*8d741a5dSApple OSS Distributions 	}
4698*8d741a5dSApple OSS Distributions 
4699*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_NEW) {
4700*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags ^= UT_WORKQ_NEW;
4701*8d741a5dSApple OSS Distributions 		setup_flags |= WQ_SETUP_FIRST_USE;
4702*8d741a5dSApple OSS Distributions 	}
4703*8d741a5dSApple OSS Distributions 
4704*8d741a5dSApple OSS Distributions 	/* If one of the following is true, call workq_schedule_creator (which also
4705*8d741a5dSApple OSS Distributions 	 * adjusts priority of existing creator):
4706*8d741a5dSApple OSS Distributions 	 *
4707*8d741a5dSApple OSS Distributions 	 *	  - We are the creator currently so the wq may need a new creator
4708*8d741a5dSApple OSS Distributions 	 *	  - The request we're binding to is the highest priority one, existing
4709*8d741a5dSApple OSS Distributions 	 *	  creator's priority might need to be adjusted to reflect the next
4710*8d741a5dSApple OSS Distributions 	 *	  highest TR
4711*8d741a5dSApple OSS Distributions 	 */
4712*8d741a5dSApple OSS Distributions 	if (is_creator || schedule_creator) {
4713*8d741a5dSApple OSS Distributions 		/* This can drop the workqueue lock, and take it again */
4714*8d741a5dSApple OSS Distributions 		workq_schedule_creator(p, wq, WORKQ_THREADREQ_CAN_CREATE_THREADS);
4715*8d741a5dSApple OSS Distributions 	}
4716*8d741a5dSApple OSS Distributions 
4717*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
4718*8d741a5dSApple OSS Distributions 
4719*8d741a5dSApple OSS Distributions 	if (req) {
4720*8d741a5dSApple OSS Distributions 		zfree(workq_zone_threadreq, req);
4721*8d741a5dSApple OSS Distributions 	}
4722*8d741a5dSApple OSS Distributions 
4723*8d741a5dSApple OSS Distributions 	/*
4724*8d741a5dSApple OSS Distributions 	 * Run Thread, Run!
4725*8d741a5dSApple OSS Distributions 	 */
4726*8d741a5dSApple OSS Distributions 	uint32_t upcall_flags = WQ_FLAG_THREAD_NEWSPI;
4727*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_pri.qos_bucket == WORKQ_THREAD_QOS_MANAGER) {
4728*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_EVENT_MANAGER;
4729*8d741a5dSApple OSS Distributions 	} else if (workq_tr_is_overcommit(tr_flags)) {
4730*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
4731*8d741a5dSApple OSS Distributions 	} else if (workq_tr_is_cooperative(tr_flags)) {
4732*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_COOPERATIVE;
4733*8d741a5dSApple OSS Distributions 	}
4734*8d741a5dSApple OSS Distributions 	if (tr_flags & WORKQ_TR_FLAG_KEVENT) {
4735*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_KEVENT;
4736*8d741a5dSApple OSS Distributions 		assert((upcall_flags & WQ_FLAG_THREAD_COOPERATIVE) == 0);
4737*8d741a5dSApple OSS Distributions 	}
4738*8d741a5dSApple OSS Distributions 
4739*8d741a5dSApple OSS Distributions 	if (tr_flags & WORKQ_TR_FLAG_WORKLOOP) {
4740*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_WORKLOOP | WQ_FLAG_THREAD_KEVENT;
4741*8d741a5dSApple OSS Distributions 	}
4742*8d741a5dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.upcall_flags = upcall_flags;
4743*8d741a5dSApple OSS Distributions 
4744*8d741a5dSApple OSS Distributions 	if (tr_flags & (WORKQ_TR_FLAG_KEVENT | WORKQ_TR_FLAG_WORKLOOP)) {
4745*8d741a5dSApple OSS Distributions 		kqueue_threadreq_bind_commit(p, get_machthread(uth));
4746*8d741a5dSApple OSS Distributions 	} else {
4747*8d741a5dSApple OSS Distributions #if CONFIG_PREADOPT_TG
4748*8d741a5dSApple OSS Distributions 		/*
4749*8d741a5dSApple OSS Distributions 		 * The thread may have a preadopt thread group on it already because it
4750*8d741a5dSApple OSS Distributions 		 * got tagged with it as a creator thread. So we need to make sure to
4751*8d741a5dSApple OSS Distributions 		 * clear that since we don't have preadoption for anonymous thread
4752*8d741a5dSApple OSS Distributions 		 * requests
4753*8d741a5dSApple OSS Distributions 		 */
4754*8d741a5dSApple OSS Distributions 		thread_set_preadopt_thread_group(get_machthread(uth), NULL);
4755*8d741a5dSApple OSS Distributions #endif
4756*8d741a5dSApple OSS Distributions 	}
4757*8d741a5dSApple OSS Distributions 
4758*8d741a5dSApple OSS Distributions 	workq_setup_and_run(p, uth, setup_flags);
4759*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
4760*8d741a5dSApple OSS Distributions 
4761*8d741a5dSApple OSS Distributions park:
4762*8d741a5dSApple OSS Distributions 	thread_unfreeze_base_pri(get_machthread(uth));
4763*8d741a5dSApple OSS Distributions park_thawed:
4764*8d741a5dSApple OSS Distributions 	workq_park_and_unlock(p, wq, uth, setup_flags);
4765*8d741a5dSApple OSS Distributions }
4766*8d741a5dSApple OSS Distributions 
4767*8d741a5dSApple OSS Distributions /**
4768*8d741a5dSApple OSS Distributions  * Runs a thread request on a thread
4769*8d741a5dSApple OSS Distributions  *
4770*8d741a5dSApple OSS Distributions  * - if thread is THREAD_NULL, will find a thread and run the request there.
4771*8d741a5dSApple OSS Distributions  *   Otherwise, the thread must be the current thread.
4772*8d741a5dSApple OSS Distributions  *
4773*8d741a5dSApple OSS Distributions  * - if req is NULL, will find the highest priority request and run that.  If
4774*8d741a5dSApple OSS Distributions  *   it is not NULL, it must be a threadreq object in state NEW.  If it can not
4775*8d741a5dSApple OSS Distributions  *   be run immediately, it will be enqueued and moved to state QUEUED.
4776*8d741a5dSApple OSS Distributions  *
4777*8d741a5dSApple OSS Distributions  *   Either way, the thread request object serviced will be moved to state
4778*8d741a5dSApple OSS Distributions  *   BINDING and attached to the uthread.
4779*8d741a5dSApple OSS Distributions  *
4780*8d741a5dSApple OSS Distributions  * Should be called with the workqueue lock held.  Will drop it.
4781*8d741a5dSApple OSS Distributions  * Should be called with the base pri not frozen.
4782*8d741a5dSApple OSS Distributions  */
4783*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
4784*8d741a5dSApple OSS Distributions static void
workq_unpark_select_threadreq_or_park_and_unlock(proc_t p,struct workqueue * wq,struct uthread * uth,uint32_t setup_flags)4785*8d741a5dSApple OSS Distributions workq_unpark_select_threadreq_or_park_and_unlock(proc_t p, struct workqueue *wq,
4786*8d741a5dSApple OSS Distributions     struct uthread *uth, uint32_t setup_flags)
4787*8d741a5dSApple OSS Distributions {
4788*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_EARLY_BOUND) {
4789*8d741a5dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_NEW) {
4790*8d741a5dSApple OSS Distributions 			setup_flags |= WQ_SETUP_FIRST_USE;
4791*8d741a5dSApple OSS Distributions 		}
4792*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags &= ~(UT_WORKQ_NEW | UT_WORKQ_EARLY_BOUND);
4793*8d741a5dSApple OSS Distributions 		/*
4794*8d741a5dSApple OSS Distributions 		 * This pointer is possibly freed and only used for tracing purposes.
4795*8d741a5dSApple OSS Distributions 		 */
4796*8d741a5dSApple OSS Distributions 		workq_threadreq_t req = uth->uu_save.uus_workq_park_data.thread_request;
4797*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
4798*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_thread_logical_run | DBG_FUNC_START, wq,
4799*8d741a5dSApple OSS Distributions 		    VM_KERNEL_ADDRHIDE(req), 0, 0);
4800*8d741a5dSApple OSS Distributions 		(void)req;
4801*8d741a5dSApple OSS Distributions 
4802*8d741a5dSApple OSS Distributions 		workq_setup_and_run(p, uth, setup_flags);
4803*8d741a5dSApple OSS Distributions 		__builtin_unreachable();
4804*8d741a5dSApple OSS Distributions 	}
4805*8d741a5dSApple OSS Distributions 
4806*8d741a5dSApple OSS Distributions 	thread_freeze_base_pri(get_machthread(uth));
4807*8d741a5dSApple OSS Distributions 	workq_select_threadreq_or_park_and_unlock(p, wq, uth, setup_flags);
4808*8d741a5dSApple OSS Distributions }
4809*8d741a5dSApple OSS Distributions 
4810*8d741a5dSApple OSS Distributions static bool
workq_creator_should_yield(struct workqueue * wq,struct uthread * uth)4811*8d741a5dSApple OSS Distributions workq_creator_should_yield(struct workqueue *wq, struct uthread *uth)
4812*8d741a5dSApple OSS Distributions {
4813*8d741a5dSApple OSS Distributions 	thread_qos_t qos = workq_pri_override(uth->uu_workq_pri);
4814*8d741a5dSApple OSS Distributions 
4815*8d741a5dSApple OSS Distributions 	if (qos >= THREAD_QOS_USER_INTERACTIVE) {
4816*8d741a5dSApple OSS Distributions 		return false;
4817*8d741a5dSApple OSS Distributions 	}
4818*8d741a5dSApple OSS Distributions 
4819*8d741a5dSApple OSS Distributions 	uint32_t snapshot = uth->uu_save.uus_workq_park_data.fulfilled_snapshot;
4820*8d741a5dSApple OSS Distributions 	if (wq->wq_fulfilled == snapshot) {
4821*8d741a5dSApple OSS Distributions 		return false;
4822*8d741a5dSApple OSS Distributions 	}
4823*8d741a5dSApple OSS Distributions 
4824*8d741a5dSApple OSS Distributions 	uint32_t cnt = 0, conc = wq_max_parallelism[_wq_bucket(qos)];
4825*8d741a5dSApple OSS Distributions 	if (wq->wq_fulfilled - snapshot > conc) {
4826*8d741a5dSApple OSS Distributions 		/* we fulfilled more than NCPU requests since being dispatched */
4827*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_yield, wq, 1,
4828*8d741a5dSApple OSS Distributions 		    wq->wq_fulfilled, snapshot);
4829*8d741a5dSApple OSS Distributions 		return true;
4830*8d741a5dSApple OSS Distributions 	}
4831*8d741a5dSApple OSS Distributions 
4832*8d741a5dSApple OSS Distributions 	for (uint8_t i = _wq_bucket(qos); i < WORKQ_NUM_QOS_BUCKETS; i++) {
4833*8d741a5dSApple OSS Distributions 		cnt += wq->wq_thscheduled_count[i];
4834*8d741a5dSApple OSS Distributions 	}
4835*8d741a5dSApple OSS Distributions 	if (conc <= cnt) {
4836*8d741a5dSApple OSS Distributions 		/* We fulfilled requests and have more than NCPU scheduled threads */
4837*8d741a5dSApple OSS Distributions 		WQ_TRACE_WQ(TRACE_wq_creator_yield, wq, 2,
4838*8d741a5dSApple OSS Distributions 		    wq->wq_fulfilled, snapshot);
4839*8d741a5dSApple OSS Distributions 		return true;
4840*8d741a5dSApple OSS Distributions 	}
4841*8d741a5dSApple OSS Distributions 
4842*8d741a5dSApple OSS Distributions 	return false;
4843*8d741a5dSApple OSS Distributions }
4844*8d741a5dSApple OSS Distributions 
4845*8d741a5dSApple OSS Distributions /**
4846*8d741a5dSApple OSS Distributions  * parked idle thread wakes up
4847*8d741a5dSApple OSS Distributions  */
4848*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
4849*8d741a5dSApple OSS Distributions static void
workq_unpark_continue(void * parameter __unused,wait_result_t wr __unused)4850*8d741a5dSApple OSS Distributions workq_unpark_continue(void *parameter __unused, wait_result_t wr __unused)
4851*8d741a5dSApple OSS Distributions {
4852*8d741a5dSApple OSS Distributions 	thread_t th = current_thread();
4853*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(th);
4854*8d741a5dSApple OSS Distributions 	proc_t p = current_proc();
4855*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr_fast(p);
4856*8d741a5dSApple OSS Distributions 
4857*8d741a5dSApple OSS Distributions 	workq_lock_spin(wq);
4858*8d741a5dSApple OSS Distributions 
4859*8d741a5dSApple OSS Distributions 	if (wq->wq_creator == uth && workq_creator_should_yield(wq, uth)) {
4860*8d741a5dSApple OSS Distributions 		/*
4861*8d741a5dSApple OSS Distributions 		 * If the number of threads we have out are able to keep up with the
4862*8d741a5dSApple OSS Distributions 		 * demand, then we should avoid sending this creator thread to
4863*8d741a5dSApple OSS Distributions 		 * userspace.
4864*8d741a5dSApple OSS Distributions 		 */
4865*8d741a5dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.fulfilled_snapshot = wq->wq_fulfilled;
4866*8d741a5dSApple OSS Distributions 		uth->uu_save.uus_workq_park_data.yields++;
4867*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
4868*8d741a5dSApple OSS Distributions 		thread_yield_with_continuation(workq_unpark_continue, NULL);
4869*8d741a5dSApple OSS Distributions 		__builtin_unreachable();
4870*8d741a5dSApple OSS Distributions 	}
4871*8d741a5dSApple OSS Distributions 
4872*8d741a5dSApple OSS Distributions 	if (__probable(uth->uu_workq_flags & UT_WORKQ_RUNNING)) {
4873*8d741a5dSApple OSS Distributions 		workq_unpark_select_threadreq_or_park_and_unlock(p, wq, uth, WQ_SETUP_NONE);
4874*8d741a5dSApple OSS Distributions 		__builtin_unreachable();
4875*8d741a5dSApple OSS Distributions 	}
4876*8d741a5dSApple OSS Distributions 
4877*8d741a5dSApple OSS Distributions 	if (__probable(wr == THREAD_AWAKENED)) {
4878*8d741a5dSApple OSS Distributions 		/*
4879*8d741a5dSApple OSS Distributions 		 * We were set running, but for the purposes of dying.
4880*8d741a5dSApple OSS Distributions 		 */
4881*8d741a5dSApple OSS Distributions 		assert(uth->uu_workq_flags & UT_WORKQ_DYING);
4882*8d741a5dSApple OSS Distributions 		assert((uth->uu_workq_flags & UT_WORKQ_NEW) == 0);
4883*8d741a5dSApple OSS Distributions 	} else {
4884*8d741a5dSApple OSS Distributions 		/*
4885*8d741a5dSApple OSS Distributions 		 * workaround for <rdar://problem/38647347>,
4886*8d741a5dSApple OSS Distributions 		 * in case we do hit userspace, make sure calling
4887*8d741a5dSApple OSS Distributions 		 * workq_thread_terminate() does the right thing here,
4888*8d741a5dSApple OSS Distributions 		 * and if we never call it, that workq_exit() will too because it sees
4889*8d741a5dSApple OSS Distributions 		 * this thread on the runlist.
4890*8d741a5dSApple OSS Distributions 		 */
4891*8d741a5dSApple OSS Distributions 		assert(wr == THREAD_INTERRUPTED);
4892*8d741a5dSApple OSS Distributions 		wq->wq_thdying_count++;
4893*8d741a5dSApple OSS Distributions 		uth->uu_workq_flags |= UT_WORKQ_DYING;
4894*8d741a5dSApple OSS Distributions 	}
4895*8d741a5dSApple OSS Distributions 
4896*8d741a5dSApple OSS Distributions 	workq_unpark_for_death_and_unlock(p, wq, uth,
4897*8d741a5dSApple OSS Distributions 	    WORKQ_UNPARK_FOR_DEATH_WAS_IDLE, WQ_SETUP_NONE);
4898*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
4899*8d741a5dSApple OSS Distributions }
4900*8d741a5dSApple OSS Distributions 
4901*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
4902*8d741a5dSApple OSS Distributions static void
workq_setup_and_run(proc_t p,struct uthread * uth,int setup_flags)4903*8d741a5dSApple OSS Distributions workq_setup_and_run(proc_t p, struct uthread *uth, int setup_flags)
4904*8d741a5dSApple OSS Distributions {
4905*8d741a5dSApple OSS Distributions 	thread_t th = get_machthread(uth);
4906*8d741a5dSApple OSS Distributions 	vm_map_t vmap = get_task_map(proc_task(p));
4907*8d741a5dSApple OSS Distributions 
4908*8d741a5dSApple OSS Distributions 	if (setup_flags & WQ_SETUP_CLEAR_VOUCHER) {
4909*8d741a5dSApple OSS Distributions 		/*
4910*8d741a5dSApple OSS Distributions 		 * For preemption reasons, we want to reset the voucher as late as
4911*8d741a5dSApple OSS Distributions 		 * possible, so we do it in two places:
4912*8d741a5dSApple OSS Distributions 		 *   - Just before parking (i.e. in workq_park_and_unlock())
4913*8d741a5dSApple OSS Distributions 		 *   - Prior to doing the setup for the next workitem (i.e. here)
4914*8d741a5dSApple OSS Distributions 		 *
4915*8d741a5dSApple OSS Distributions 		 * Those two places are sufficient to ensure we always reset it before
4916*8d741a5dSApple OSS Distributions 		 * it goes back out to user space, but be careful to not break that
4917*8d741a5dSApple OSS Distributions 		 * guarantee.
4918*8d741a5dSApple OSS Distributions 		 *
4919*8d741a5dSApple OSS Distributions 		 * Note that setting the voucher to NULL will not clear the preadoption
4920*8d741a5dSApple OSS Distributions 		 * thread group on this thread
4921*8d741a5dSApple OSS Distributions 		 */
4922*8d741a5dSApple OSS Distributions 		__assert_only kern_return_t kr;
4923*8d741a5dSApple OSS Distributions 		kr = thread_set_voucher_name(MACH_PORT_NULL);
4924*8d741a5dSApple OSS Distributions 		assert(kr == KERN_SUCCESS);
4925*8d741a5dSApple OSS Distributions 	}
4926*8d741a5dSApple OSS Distributions 
4927*8d741a5dSApple OSS Distributions 	uint32_t upcall_flags = uth->uu_save.uus_workq_park_data.upcall_flags;
4928*8d741a5dSApple OSS Distributions 	if (!(setup_flags & WQ_SETUP_FIRST_USE)) {
4929*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_REUSE;
4930*8d741a5dSApple OSS Distributions 	}
4931*8d741a5dSApple OSS Distributions 
4932*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_flags & UT_WORKQ_OUTSIDE_QOS) {
4933*8d741a5dSApple OSS Distributions 		/*
4934*8d741a5dSApple OSS Distributions 		 * For threads that have an outside-of-QoS thread priority, indicate
4935*8d741a5dSApple OSS Distributions 		 * to userspace that setting QoS should only affect the TSD and not
4936*8d741a5dSApple OSS Distributions 		 * change QOS in the kernel.
4937*8d741a5dSApple OSS Distributions 		 */
4938*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OUTSIDEQOS;
4939*8d741a5dSApple OSS Distributions 	} else {
4940*8d741a5dSApple OSS Distributions 		/*
4941*8d741a5dSApple OSS Distributions 		 * Put the QoS class value into the lower bits of the reuse_thread
4942*8d741a5dSApple OSS Distributions 		 * register, this is where the thread priority used to be stored
4943*8d741a5dSApple OSS Distributions 		 * anyway.
4944*8d741a5dSApple OSS Distributions 		 */
4945*8d741a5dSApple OSS Distributions 		upcall_flags |= uth->uu_save.uus_workq_park_data.qos |
4946*8d741a5dSApple OSS Distributions 		    WQ_FLAG_THREAD_PRIO_QOS;
4947*8d741a5dSApple OSS Distributions 	}
4948*8d741a5dSApple OSS Distributions 
4949*8d741a5dSApple OSS Distributions 	if (uth->uu_workq_thport == MACH_PORT_NULL) {
4950*8d741a5dSApple OSS Distributions 		/* convert_thread_to_port_pinned() consumes a reference */
4951*8d741a5dSApple OSS Distributions 		thread_reference(th);
4952*8d741a5dSApple OSS Distributions 		/* Convert to immovable/pinned thread port, but port is not pinned yet */
4953*8d741a5dSApple OSS Distributions 		ipc_port_t port = convert_thread_to_port_pinned(th);
4954*8d741a5dSApple OSS Distributions 		/* Atomically, pin and copy out the port */
4955*8d741a5dSApple OSS Distributions 		uth->uu_workq_thport = ipc_port_copyout_send_pinned(port, get_task_ipcspace(proc_task(p)));
4956*8d741a5dSApple OSS Distributions 	}
4957*8d741a5dSApple OSS Distributions 
4958*8d741a5dSApple OSS Distributions 	/* Thread has been set up to run, arm its next workqueue quantum or disarm
4959*8d741a5dSApple OSS Distributions 	 * if it is no longer supporting that */
4960*8d741a5dSApple OSS Distributions 	if (thread_supports_cooperative_workqueue(th)) {
4961*8d741a5dSApple OSS Distributions 		thread_arm_workqueue_quantum(th);
4962*8d741a5dSApple OSS Distributions 	} else {
4963*8d741a5dSApple OSS Distributions 		thread_disarm_workqueue_quantum(th);
4964*8d741a5dSApple OSS Distributions 	}
4965*8d741a5dSApple OSS Distributions 
4966*8d741a5dSApple OSS Distributions 	/*
4967*8d741a5dSApple OSS Distributions 	 * Call out to pthread, this sets up the thread, pulls in kevent structs
4968*8d741a5dSApple OSS Distributions 	 * onto the stack, sets up the thread state and then returns to userspace.
4969*8d741a5dSApple OSS Distributions 	 */
4970*8d741a5dSApple OSS Distributions 	WQ_TRACE_WQ(TRACE_wq_runthread | DBG_FUNC_START,
4971*8d741a5dSApple OSS Distributions 	    proc_get_wqptr_fast(p), 0, 0, 0);
4972*8d741a5dSApple OSS Distributions 
4973*8d741a5dSApple OSS Distributions 	if (workq_thread_is_cooperative(uth) || workq_thread_is_permanently_bound(uth)) {
4974*8d741a5dSApple OSS Distributions 		thread_sched_call(th, NULL);
4975*8d741a5dSApple OSS Distributions 	} else {
4976*8d741a5dSApple OSS Distributions 		thread_sched_call(th, workq_sched_callback);
4977*8d741a5dSApple OSS Distributions 	}
4978*8d741a5dSApple OSS Distributions 
4979*8d741a5dSApple OSS Distributions 	pthread_functions->workq_setup_thread(p, th, vmap, uth->uu_workq_stackaddr,
4980*8d741a5dSApple OSS Distributions 	    uth->uu_workq_thport, 0, setup_flags, upcall_flags);
4981*8d741a5dSApple OSS Distributions 
4982*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
4983*8d741a5dSApple OSS Distributions }
4984*8d741a5dSApple OSS Distributions 
4985*8d741a5dSApple OSS Distributions /**
4986*8d741a5dSApple OSS Distributions  * A wrapper around workq_setup_and_run for permanently bound thread.
4987*8d741a5dSApple OSS Distributions  */
4988*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
4989*8d741a5dSApple OSS Distributions static void
workq_bound_thread_setup_and_run(struct uthread * uth,int setup_flags)4990*8d741a5dSApple OSS Distributions workq_bound_thread_setup_and_run(struct uthread *uth, int setup_flags)
4991*8d741a5dSApple OSS Distributions {
4992*8d741a5dSApple OSS Distributions 	struct workq_threadreq_s * kqr = uth->uu_kqr_bound;
4993*8d741a5dSApple OSS Distributions 
4994*8d741a5dSApple OSS Distributions 	uint32_t upcall_flags = (WQ_FLAG_THREAD_NEWSPI |
4995*8d741a5dSApple OSS Distributions 	    WQ_FLAG_THREAD_WORKLOOP | WQ_FLAG_THREAD_KEVENT);
4996*8d741a5dSApple OSS Distributions 	if (workq_tr_is_overcommit(kqr->tr_flags)) {
4997*8d741a5dSApple OSS Distributions 		workq_thread_set_type(uth, UT_WORKQ_OVERCOMMIT);
4998*8d741a5dSApple OSS Distributions 		upcall_flags |= WQ_FLAG_THREAD_OVERCOMMIT;
4999*8d741a5dSApple OSS Distributions 	}
5000*8d741a5dSApple OSS Distributions 	uth->uu_save.uus_workq_park_data.upcall_flags = upcall_flags;
5001*8d741a5dSApple OSS Distributions 	workq_setup_and_run(current_proc(), uth, setup_flags);
5002*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
5003*8d741a5dSApple OSS Distributions }
5004*8d741a5dSApple OSS Distributions 
5005*8d741a5dSApple OSS Distributions /**
5006*8d741a5dSApple OSS Distributions  * A parked bound thread wakes up for the first time.
5007*8d741a5dSApple OSS Distributions  */
5008*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
5009*8d741a5dSApple OSS Distributions static void
workq_bound_thread_initialize_and_unpark_continue(void * parameter __unused,wait_result_t wr)5010*8d741a5dSApple OSS Distributions workq_bound_thread_initialize_and_unpark_continue(void *parameter __unused,
5011*8d741a5dSApple OSS Distributions     wait_result_t wr)
5012*8d741a5dSApple OSS Distributions {
5013*8d741a5dSApple OSS Distributions 	/*
5014*8d741a5dSApple OSS Distributions 	 * Locking model for accessing uu_workq_flags :
5015*8d741a5dSApple OSS Distributions 	 *
5016*8d741a5dSApple OSS Distributions 	 * The concurrent access to uu_workq_flags is synchronized with workq lock
5017*8d741a5dSApple OSS Distributions 	 * until a thread gets permanently bound to a kqwl. Post that, kqlock
5018*8d741a5dSApple OSS Distributions 	 * is used for subsequent synchronizations. This gives us a significant
5019*8d741a5dSApple OSS Distributions 	 * benefit by avoiding having to take a process wide workq lock on every
5020*8d741a5dSApple OSS Distributions 	 * wakeup of the bound thread.
5021*8d741a5dSApple OSS Distributions 	 * This flip in locking model is tracked with UT_WORKQ_PERMANENT_BIND flag.
5022*8d741a5dSApple OSS Distributions 	 *
5023*8d741a5dSApple OSS Distributions 	 * There is one more optimization we can perform for when the thread is
5024*8d741a5dSApple OSS Distributions 	 * awakened for running (i.e THREAD_AWAKENED) until it parks.
5025*8d741a5dSApple OSS Distributions 	 * During this window, we know KQ_SLEEP bit is reset so there should not
5026*8d741a5dSApple OSS Distributions 	 * be any concurrent attempts to modify uu_workq_flags by
5027*8d741a5dSApple OSS Distributions 	 * kqworkloop_bound_thread_wakeup because the thread is already "awake".
5028*8d741a5dSApple OSS Distributions 	 * So we can safely access uu_workq_flags within this window without having
5029*8d741a5dSApple OSS Distributions 	 * to take kqlock. This KQ_SLEEP is later set by the bound thread under
5030*8d741a5dSApple OSS Distributions 	 * kqlock on its way to parking.
5031*8d741a5dSApple OSS Distributions 	 */
5032*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(current_thread());
5033*8d741a5dSApple OSS Distributions 
5034*8d741a5dSApple OSS Distributions 	if (__probable(wr == THREAD_AWAKENED)) {
5035*8d741a5dSApple OSS Distributions 		/* At most one flag. */
5036*8d741a5dSApple OSS Distributions 		assert((uth->uu_workq_flags & (UT_WORKQ_RUNNING | UT_WORKQ_DYING))
5037*8d741a5dSApple OSS Distributions 		    != (UT_WORKQ_RUNNING | UT_WORKQ_DYING));
5038*8d741a5dSApple OSS Distributions 
5039*8d741a5dSApple OSS Distributions 		assert(workq_thread_is_permanently_bound(uth));
5040*8d741a5dSApple OSS Distributions 
5041*8d741a5dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_RUNNING) {
5042*8d741a5dSApple OSS Distributions 			assert(uth->uu_workq_flags & UT_WORKQ_NEW);
5043*8d741a5dSApple OSS Distributions 			uth->uu_workq_flags &= ~UT_WORKQ_NEW;
5044*8d741a5dSApple OSS Distributions 
5045*8d741a5dSApple OSS Distributions 			struct workq_threadreq_s * kqr = uth->uu_kqr_bound;
5046*8d741a5dSApple OSS Distributions 			if (kqr->tr_work_interval) {
5047*8d741a5dSApple OSS Distributions 				kern_return_t kr;
5048*8d741a5dSApple OSS Distributions 				kr = kern_work_interval_explicit_join(get_machthread(uth),
5049*8d741a5dSApple OSS Distributions 				    kqr->tr_work_interval);
5050*8d741a5dSApple OSS Distributions 				/*
5051*8d741a5dSApple OSS Distributions 				 * The work interval functions requires to be called on the
5052*8d741a5dSApple OSS Distributions 				 * current thread. If we fail here, we record the fact and
5053*8d741a5dSApple OSS Distributions 				 * continue.
5054*8d741a5dSApple OSS Distributions 				 * In the future, we can preflight checking that this join will
5055*8d741a5dSApple OSS Distributions 				 * always be successful when the paird kqwl is configured; but,
5056*8d741a5dSApple OSS Distributions 				 * for now, this should be a rare case (e.g. if you have passed
5057*8d741a5dSApple OSS Distributions 				 * invalid arguments to the join).
5058*8d741a5dSApple OSS Distributions 				 */
5059*8d741a5dSApple OSS Distributions 				if (kr == KERN_SUCCESS) {
5060*8d741a5dSApple OSS Distributions 					uth->uu_workq_flags |= UT_WORKQ_WORK_INTERVAL_JOINED;
5061*8d741a5dSApple OSS Distributions 					/* Thread and kqwl both have +1 ref on the work interval. */
5062*8d741a5dSApple OSS Distributions 				} else {
5063*8d741a5dSApple OSS Distributions 					uth->uu_workq_flags |= UT_WORKQ_WORK_INTERVAL_FAILED;
5064*8d741a5dSApple OSS Distributions 				}
5065*8d741a5dSApple OSS Distributions 			}
5066*8d741a5dSApple OSS Distributions 			workq_thread_reset_cpupercent(kqr, uth);
5067*8d741a5dSApple OSS Distributions 			workq_bound_thread_setup_and_run(uth, WQ_SETUP_FIRST_USE);
5068*8d741a5dSApple OSS Distributions 			__builtin_unreachable();
5069*8d741a5dSApple OSS Distributions 		} else {
5070*8d741a5dSApple OSS Distributions 			/*
5071*8d741a5dSApple OSS Distributions 			 * The permanently bound kqworkloop is getting destroyed so we
5072*8d741a5dSApple OSS Distributions 			 * are woken up to cleanly unbind ourselves from it and terminate.
5073*8d741a5dSApple OSS Distributions 			 * See KQ_WORKLOOP_DESTROY -> workq_kern_bound_thread_wakeup.
5074*8d741a5dSApple OSS Distributions 			 *
5075*8d741a5dSApple OSS Distributions 			 * The actual full unbind happens from
5076*8d741a5dSApple OSS Distributions 			 * uthread_cleanup -> kqueue_threadreq_unbind.
5077*8d741a5dSApple OSS Distributions 			 */
5078*8d741a5dSApple OSS Distributions 			assert(uth->uu_workq_flags & UT_WORKQ_DYING);
5079*8d741a5dSApple OSS Distributions 		}
5080*8d741a5dSApple OSS Distributions 	} else {
5081*8d741a5dSApple OSS Distributions 		/*
5082*8d741a5dSApple OSS Distributions 		 * The process is getting terminated so we are woken up to die.
5083*8d741a5dSApple OSS Distributions 		 * E.g. SIGKILL'd.
5084*8d741a5dSApple OSS Distributions 		 */
5085*8d741a5dSApple OSS Distributions 		assert(wr == THREAD_INTERRUPTED);
5086*8d741a5dSApple OSS Distributions 		/*
5087*8d741a5dSApple OSS Distributions 		 * It is possible we started running as the process is aborted
5088*8d741a5dSApple OSS Distributions 		 * due to termination; but, workq_kern_threadreq_permanent_bind
5089*8d741a5dSApple OSS Distributions 		 * has not had a chance to bind us to the kqwl yet.
5090*8d741a5dSApple OSS Distributions 		 *
5091*8d741a5dSApple OSS Distributions 		 * We synchronize with it using workq lock.
5092*8d741a5dSApple OSS Distributions 		 */
5093*8d741a5dSApple OSS Distributions 		proc_t p = current_proc();
5094*8d741a5dSApple OSS Distributions 		struct workqueue *wq = proc_get_wqptr_fast(p);
5095*8d741a5dSApple OSS Distributions 		workq_lock_spin(wq);
5096*8d741a5dSApple OSS Distributions 		assert(workq_thread_is_permanently_bound(uth));
5097*8d741a5dSApple OSS Distributions 		workq_unlock(wq);
5098*8d741a5dSApple OSS Distributions 
5099*8d741a5dSApple OSS Distributions 		/*
5100*8d741a5dSApple OSS Distributions 		 * We do the bind commit ourselves if workq_kern_threadreq_permanent_bind
5101*8d741a5dSApple OSS Distributions 		 * has not done it for us yet so our state is aligned with what the
5102*8d741a5dSApple OSS Distributions 		 * termination path below expects.
5103*8d741a5dSApple OSS Distributions 		 */
5104*8d741a5dSApple OSS Distributions 		kqueue_threadreq_bind_commit(p, get_machthread(uth));
5105*8d741a5dSApple OSS Distributions 	}
5106*8d741a5dSApple OSS Distributions 	workq_kern_bound_thread_terminate(uth->uu_kqr_bound);
5107*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
5108*8d741a5dSApple OSS Distributions }
5109*8d741a5dSApple OSS Distributions 
5110*8d741a5dSApple OSS Distributions /**
5111*8d741a5dSApple OSS Distributions  * A parked bound thread wakes up. Not the first time.
5112*8d741a5dSApple OSS Distributions  */
5113*8d741a5dSApple OSS Distributions __attribute__((noreturn, noinline))
5114*8d741a5dSApple OSS Distributions static void
workq_bound_thread_unpark_continue(void * parameter __unused,wait_result_t wr)5115*8d741a5dSApple OSS Distributions workq_bound_thread_unpark_continue(void *parameter __unused, wait_result_t wr)
5116*8d741a5dSApple OSS Distributions {
5117*8d741a5dSApple OSS Distributions 	struct uthread *uth = get_bsdthread_info(current_thread());
5118*8d741a5dSApple OSS Distributions 	assert(workq_thread_is_permanently_bound(uth));
5119*8d741a5dSApple OSS Distributions 
5120*8d741a5dSApple OSS Distributions 	if (__probable(wr == THREAD_AWAKENED)) {
5121*8d741a5dSApple OSS Distributions 		/* At most one flag. */
5122*8d741a5dSApple OSS Distributions 		assert((uth->uu_workq_flags & (UT_WORKQ_RUNNING | UT_WORKQ_DYING))
5123*8d741a5dSApple OSS Distributions 		    != (UT_WORKQ_RUNNING | UT_WORKQ_DYING));
5124*8d741a5dSApple OSS Distributions 		if (uth->uu_workq_flags & UT_WORKQ_RUNNING) {
5125*8d741a5dSApple OSS Distributions 			workq_bound_thread_setup_and_run(uth, WQ_SETUP_NONE);
5126*8d741a5dSApple OSS Distributions 		} else {
5127*8d741a5dSApple OSS Distributions 			assert(uth->uu_workq_flags & UT_WORKQ_DYING);
5128*8d741a5dSApple OSS Distributions 		}
5129*8d741a5dSApple OSS Distributions 	} else {
5130*8d741a5dSApple OSS Distributions 		assert(wr == THREAD_INTERRUPTED);
5131*8d741a5dSApple OSS Distributions 	}
5132*8d741a5dSApple OSS Distributions 	workq_kern_bound_thread_terminate(uth->uu_kqr_bound);
5133*8d741a5dSApple OSS Distributions 	__builtin_unreachable();
5134*8d741a5dSApple OSS Distributions }
5135*8d741a5dSApple OSS Distributions 
5136*8d741a5dSApple OSS Distributions #pragma mark misc
5137*8d741a5dSApple OSS Distributions 
5138*8d741a5dSApple OSS Distributions int
fill_procworkqueue(proc_t p,struct proc_workqueueinfo * pwqinfo)5139*8d741a5dSApple OSS Distributions fill_procworkqueue(proc_t p, struct proc_workqueueinfo * pwqinfo)
5140*8d741a5dSApple OSS Distributions {
5141*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
5142*8d741a5dSApple OSS Distributions 	int error = 0;
5143*8d741a5dSApple OSS Distributions 	int     activecount;
5144*8d741a5dSApple OSS Distributions 
5145*8d741a5dSApple OSS Distributions 	if (wq == NULL) {
5146*8d741a5dSApple OSS Distributions 		return EINVAL;
5147*8d741a5dSApple OSS Distributions 	}
5148*8d741a5dSApple OSS Distributions 
5149*8d741a5dSApple OSS Distributions 	/*
5150*8d741a5dSApple OSS Distributions 	 * This is sometimes called from interrupt context by the kperf sampler.
5151*8d741a5dSApple OSS Distributions 	 * In that case, it's not safe to spin trying to take the lock since we
5152*8d741a5dSApple OSS Distributions 	 * might already hold it.  So, we just try-lock it and error out if it's
5153*8d741a5dSApple OSS Distributions 	 * already held.  Since this is just a debugging aid, and all our callers
5154*8d741a5dSApple OSS Distributions 	 * are able to handle an error, that's fine.
5155*8d741a5dSApple OSS Distributions 	 */
5156*8d741a5dSApple OSS Distributions 	bool locked = workq_lock_try(wq);
5157*8d741a5dSApple OSS Distributions 	if (!locked) {
5158*8d741a5dSApple OSS Distributions 		return EBUSY;
5159*8d741a5dSApple OSS Distributions 	}
5160*8d741a5dSApple OSS Distributions 
5161*8d741a5dSApple OSS Distributions 	wq_thactive_t act = _wq_thactive(wq);
5162*8d741a5dSApple OSS Distributions 	activecount = _wq_thactive_aggregate_downto_qos(wq, act,
5163*8d741a5dSApple OSS Distributions 	    WORKQ_THREAD_QOS_MIN, NULL, NULL);
5164*8d741a5dSApple OSS Distributions 	if (act & _wq_thactive_offset_for_qos(WORKQ_THREAD_QOS_MANAGER)) {
5165*8d741a5dSApple OSS Distributions 		activecount++;
5166*8d741a5dSApple OSS Distributions 	}
5167*8d741a5dSApple OSS Distributions 	pwqinfo->pwq_nthreads = wq->wq_nthreads;
5168*8d741a5dSApple OSS Distributions 	pwqinfo->pwq_runthreads = activecount;
5169*8d741a5dSApple OSS Distributions 	pwqinfo->pwq_blockedthreads = wq->wq_threads_scheduled - activecount;
5170*8d741a5dSApple OSS Distributions 	pwqinfo->pwq_state = 0;
5171*8d741a5dSApple OSS Distributions 
5172*8d741a5dSApple OSS Distributions 	if (wq->wq_constrained_threads_scheduled >= wq_max_constrained_threads) {
5173*8d741a5dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT;
5174*8d741a5dSApple OSS Distributions 	}
5175*8d741a5dSApple OSS Distributions 
5176*8d741a5dSApple OSS Distributions 	if (wq->wq_nthreads >= wq_max_threads) {
5177*8d741a5dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_TOTAL_THREAD_LIMIT;
5178*8d741a5dSApple OSS Distributions 	}
5179*8d741a5dSApple OSS Distributions 
5180*8d741a5dSApple OSS Distributions 	uint64_t total_cooperative_threads;
5181*8d741a5dSApple OSS Distributions 	total_cooperative_threads = workq_num_cooperative_threads_scheduled_total(wq);
5182*8d741a5dSApple OSS Distributions 	if ((total_cooperative_threads == wq_cooperative_queue_max_size(wq)) &&
5183*8d741a5dSApple OSS Distributions 	    workq_has_cooperative_thread_requests(wq)) {
5184*8d741a5dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_COOPERATIVE_THREAD_LIMIT;
5185*8d741a5dSApple OSS Distributions 	}
5186*8d741a5dSApple OSS Distributions 
5187*8d741a5dSApple OSS Distributions 	if (wq->wq_exceeded_active_constrained_thread_limit) {
5188*8d741a5dSApple OSS Distributions 		pwqinfo->pwq_state |= WQ_EXCEEDED_ACTIVE_CONSTRAINED_THREAD_LIMIT;
5189*8d741a5dSApple OSS Distributions 	}
5190*8d741a5dSApple OSS Distributions 
5191*8d741a5dSApple OSS Distributions 	workq_unlock(wq);
5192*8d741a5dSApple OSS Distributions 	return error;
5193*8d741a5dSApple OSS Distributions }
5194*8d741a5dSApple OSS Distributions 
5195*8d741a5dSApple OSS Distributions boolean_t
workqueue_get_pwq_exceeded(void * v,boolean_t * exceeded_total,boolean_t * exceeded_constrained)5196*8d741a5dSApple OSS Distributions workqueue_get_pwq_exceeded(void *v, boolean_t *exceeded_total,
5197*8d741a5dSApple OSS Distributions     boolean_t *exceeded_constrained)
5198*8d741a5dSApple OSS Distributions {
5199*8d741a5dSApple OSS Distributions 	proc_t p = v;
5200*8d741a5dSApple OSS Distributions 	struct proc_workqueueinfo pwqinfo;
5201*8d741a5dSApple OSS Distributions 	int err;
5202*8d741a5dSApple OSS Distributions 
5203*8d741a5dSApple OSS Distributions 	assert(p != NULL);
5204*8d741a5dSApple OSS Distributions 	assert(exceeded_total != NULL);
5205*8d741a5dSApple OSS Distributions 	assert(exceeded_constrained != NULL);
5206*8d741a5dSApple OSS Distributions 
5207*8d741a5dSApple OSS Distributions 	err = fill_procworkqueue(p, &pwqinfo);
5208*8d741a5dSApple OSS Distributions 	if (err) {
5209*8d741a5dSApple OSS Distributions 		return FALSE;
5210*8d741a5dSApple OSS Distributions 	}
5211*8d741a5dSApple OSS Distributions 	if (!(pwqinfo.pwq_state & WQ_FLAGS_AVAILABLE)) {
5212*8d741a5dSApple OSS Distributions 		return FALSE;
5213*8d741a5dSApple OSS Distributions 	}
5214*8d741a5dSApple OSS Distributions 
5215*8d741a5dSApple OSS Distributions 	*exceeded_total = (pwqinfo.pwq_state & WQ_EXCEEDED_TOTAL_THREAD_LIMIT);
5216*8d741a5dSApple OSS Distributions 	*exceeded_constrained = (pwqinfo.pwq_state & WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT);
5217*8d741a5dSApple OSS Distributions 
5218*8d741a5dSApple OSS Distributions 	return TRUE;
5219*8d741a5dSApple OSS Distributions }
5220*8d741a5dSApple OSS Distributions 
5221*8d741a5dSApple OSS Distributions uint64_t
workqueue_get_task_ss_flags_from_pwq_state_kdp(void * v)5222*8d741a5dSApple OSS Distributions workqueue_get_task_ss_flags_from_pwq_state_kdp(void * v)
5223*8d741a5dSApple OSS Distributions {
5224*8d741a5dSApple OSS Distributions 	static_assert((WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT << 17) ==
5225*8d741a5dSApple OSS Distributions 	    kTaskWqExceededConstrainedThreadLimit);
5226*8d741a5dSApple OSS Distributions 	static_assert((WQ_EXCEEDED_TOTAL_THREAD_LIMIT << 17) ==
5227*8d741a5dSApple OSS Distributions 	    kTaskWqExceededTotalThreadLimit);
5228*8d741a5dSApple OSS Distributions 	static_assert((WQ_FLAGS_AVAILABLE << 17) == kTaskWqFlagsAvailable);
5229*8d741a5dSApple OSS Distributions 	static_assert(((uint64_t)WQ_EXCEEDED_COOPERATIVE_THREAD_LIMIT << 34) ==
5230*8d741a5dSApple OSS Distributions 	    (uint64_t)kTaskWqExceededCooperativeThreadLimit);
5231*8d741a5dSApple OSS Distributions 	static_assert(((uint64_t)WQ_EXCEEDED_ACTIVE_CONSTRAINED_THREAD_LIMIT << 34) ==
5232*8d741a5dSApple OSS Distributions 	    (uint64_t)kTaskWqExceededActiveConstrainedThreadLimit);
5233*8d741a5dSApple OSS Distributions 	static_assert((WQ_FLAGS_AVAILABLE | WQ_EXCEEDED_TOTAL_THREAD_LIMIT |
5234*8d741a5dSApple OSS Distributions 	    WQ_EXCEEDED_CONSTRAINED_THREAD_LIMIT |
5235*8d741a5dSApple OSS Distributions 	    WQ_EXCEEDED_COOPERATIVE_THREAD_LIMIT |
5236*8d741a5dSApple OSS Distributions 	    WQ_EXCEEDED_ACTIVE_CONSTRAINED_THREAD_LIMIT) == 0x1F);
5237*8d741a5dSApple OSS Distributions 
5238*8d741a5dSApple OSS Distributions 	if (v == NULL) {
5239*8d741a5dSApple OSS Distributions 		return 0;
5240*8d741a5dSApple OSS Distributions 	}
5241*8d741a5dSApple OSS Distributions 
5242*8d741a5dSApple OSS Distributions 	proc_t p = v;
5243*8d741a5dSApple OSS Distributions 	struct workqueue *wq = proc_get_wqptr(p);
5244*8d741a5dSApple OSS Distributions 
5245*8d741a5dSApple OSS Distributions 	if (wq == NULL || workq_lock_is_acquired_kdp(wq)) {
5246*8d741a5dSApple OSS Distributions 		return 0;
5247*8d741a5dSApple OSS Distributions 	}
5248*8d741a5dSApple OSS Distributions 
5249*8d741a5dSApple OSS Distributions 	uint64_t ss_flags = kTaskWqFlagsAvailable;
5250*8d741a5dSApple OSS Distributions 
5251*8d741a5dSApple OSS Distributions 	if (wq->wq_constrained_threads_scheduled >= wq_max_constrained_threads) {
5252*8d741a5dSApple OSS Distributions 		ss_flags |= kTaskWqExceededConstrainedThreadLimit;
5253*8d741a5dSApple OSS Distributions 	}
5254*8d741a5dSApple OSS Distributions 
5255*8d741a5dSApple OSS Distributions 	if (wq->wq_nthreads >= wq_max_threads) {
5256*8d741a5dSApple OSS Distributions 		ss_flags |= kTaskWqExceededTotalThreadLimit;
5257*8d741a5dSApple OSS Distributions 	}
5258*8d741a5dSApple OSS Distributions 
5259*8d741a5dSApple OSS Distributions 	uint64_t total_cooperative_threads;
5260*8d741a5dSApple OSS Distributions 	total_cooperative_threads = workq_num_cooperative_threads_scheduled_to_qos_internal(wq,
5261*8d741a5dSApple OSS Distributions 	    WORKQ_THREAD_QOS_MIN);
5262*8d741a5dSApple OSS Distributions 	if ((total_cooperative_threads == wq_cooperative_queue_max_size(wq)) &&
5263*8d741a5dSApple OSS Distributions 	    workq_has_cooperative_thread_requests(wq)) {
5264*8d741a5dSApple OSS Distributions 		ss_flags |= kTaskWqExceededCooperativeThreadLimit;
5265*8d741a5dSApple OSS Distributions 	}
5266*8d741a5dSApple OSS Distributions 
5267*8d741a5dSApple OSS Distributions 	if (wq->wq_exceeded_active_constrained_thread_limit) {
5268*8d741a5dSApple OSS Distributions 		ss_flags |= kTaskWqExceededActiveConstrainedThreadLimit;
5269*8d741a5dSApple OSS Distributions 	}
5270*8d741a5dSApple OSS Distributions 
5271*8d741a5dSApple OSS Distributions 	return ss_flags;
5272*8d741a5dSApple OSS Distributions }
5273*8d741a5dSApple OSS Distributions 
5274*8d741a5dSApple OSS Distributions void
workq_init(void)5275*8d741a5dSApple OSS Distributions workq_init(void)
5276*8d741a5dSApple OSS Distributions {
5277*8d741a5dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(wq_stalled_window.usecs,
5278*8d741a5dSApple OSS Distributions 	    NSEC_PER_USEC, &wq_stalled_window.abstime);
5279*8d741a5dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(wq_reduce_pool_window.usecs,
5280*8d741a5dSApple OSS Distributions 	    NSEC_PER_USEC, &wq_reduce_pool_window.abstime);
5281*8d741a5dSApple OSS Distributions 	clock_interval_to_absolutetime_interval(wq_max_timer_interval.usecs,
5282*8d741a5dSApple OSS Distributions 	    NSEC_PER_USEC, &wq_max_timer_interval.abstime);
5283*8d741a5dSApple OSS Distributions 
5284*8d741a5dSApple OSS Distributions 	thread_deallocate_daemon_register_queue(&workq_deallocate_queue,
5285*8d741a5dSApple OSS Distributions 	    workq_deallocate_queue_invoke);
5286*8d741a5dSApple OSS Distributions }
5287