1 /*
2 * Copyright (c) 2000-2023 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29 /*-
30 * Copyright (c) 1982, 1986, 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 *
33 * This code is derived from software contributed to Berkeley by
34 * Mike Karels at Berkeley Software Design, Inc.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
51 *
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
63 *
64 * @(#)kern_sysctl.c 8.4 (Berkeley) 4/14/94
65 */
66 /*
67 * NOTICE: This file was modified by SPARTA, Inc. in 2005 to introduce
68 * support for mandatory and extensible security protections. This notice
69 * is included in support of clause 2.2 (b) of the Apple Public License,
70 * Version 2.0.
71 */
72
73 /*
74 * DEPRECATED sysctl system call code
75 *
76 * Everything in this file is deprecated. Sysctls should be handled
77 * by the code in kern_newsysctl.c.
78 * The remaining "case" sections are supposed to be converted into
79 * SYSCTL_*-style definitions, and as soon as all of them are gone,
80 * this source file is supposed to die.
81 *
82 * DO NOT ADD ANY MORE "case" SECTIONS TO THIS FILE, instead define
83 * your sysctl with SYSCTL_INT, SYSCTL_PROC etc. in your source file.
84 */
85
86 #include <sys/param.h>
87 #include <sys/systm.h>
88 #include <sys/kernel.h>
89 #include <sys/malloc.h>
90 #include <sys/proc_internal.h>
91 #include <sys/kauth.h>
92 #include <sys/file_internal.h>
93 #include <sys/vnode_internal.h>
94 #include <sys/unistd.h>
95 #include <sys/buf.h>
96 #include <sys/ioctl.h>
97 #include <sys/namei.h>
98 #include <sys/tty.h>
99 #include <sys/disklabel.h>
100 #include <sys/vm.h>
101 #include <sys/sysctl.h>
102 #include <sys/user.h>
103 #include <sys/aio_kern.h>
104 #include <sys/reboot.h>
105 #include <sys/memory_maintenance.h>
106 #include <sys/priv.h>
107 #include <stdatomic.h>
108 #include <uuid/uuid.h>
109
110 #include <security/audit/audit.h>
111 #include <kern/kalloc.h>
112
113 #include <machine/smp.h>
114 #include <machine/atomic.h>
115 #include <machine/config.h>
116 #include <mach/machine.h>
117 #include <mach/mach_host.h>
118 #include <mach/mach_types.h>
119 #include <mach/processor_info.h>
120 #include <mach/vm_param.h>
121 #include <kern/debug.h>
122 #include <kern/mach_param.h>
123 #include <kern/task.h>
124 #include <kern/thread.h>
125 #include <kern/thread_group.h>
126 #include <kern/processor.h>
127 #include <kern/cpu_number.h>
128 #include <kern/sched_prim.h>
129 #include <kern/workload_config.h>
130 #include <kern/iotrace.h>
131 #include <vm/vm_kern.h>
132 #include <vm/vm_map.h>
133 #include <mach/host_info.h>
134 #include <mach/exclaves.h>
135 #include <kern/hvg_hypercall.h>
136
137 #if DEVELOPMENT || DEBUG
138 #include <kern/ext_paniclog.h>
139 #endif
140
141 #include <sys/mount_internal.h>
142 #include <sys/kdebug.h>
143 #include <sys/kern_debug.h>
144 #include <sys/kern_sysctl.h>
145 #include <sys/variant_internal.h>
146
147 #include <IOKit/IOPlatformExpert.h>
148 #include <pexpert/pexpert.h>
149
150 #include <machine/machine_routines.h>
151 #include <machine/exec.h>
152
153 #include <nfs/nfs_conf.h>
154
155 #include <vm/vm_protos.h>
156 #include <vm/vm_pageout.h>
157 #include <vm/vm_compressor_algorithms.h>
158 #include <sys/imgsrc.h>
159 #include <kern/timer_call.h>
160 #include <sys/codesign.h>
161 #include <IOKit/IOBSD.h>
162 #if CONFIG_CSR
163 #include <sys/csr.h>
164 #endif
165
166 #if defined(__i386__) || defined(__x86_64__)
167 #include <i386/cpuid.h>
168 #endif
169
170 #if CONFIG_FREEZE
171 #include <sys/kern_memorystatus.h>
172 #endif
173
174 #if KPERF
175 #include <kperf/kperf.h>
176 #endif
177
178 #if HYPERVISOR
179 #include <kern/hv_support.h>
180 #endif
181
182
183 #include <corecrypto/ccsha2.h>
184
185 /*
186 * deliberately setting max requests to really high number
187 * so that runaway settings do not cause MALLOC overflows
188 */
189 #define AIO_MAX_REQUESTS (128 * CONFIG_AIO_MAX)
190
191 extern int aio_max_requests;
192 extern int aio_max_requests_per_process;
193 extern int aio_worker_threads;
194 extern int lowpri_IO_window_msecs;
195 extern int lowpri_IO_delay_msecs;
196 #if DEVELOPMENT || DEBUG
197 extern int nx_enabled;
198 #endif
199 extern int speculative_reads_disabled;
200 extern unsigned int speculative_prefetch_max;
201 extern unsigned int speculative_prefetch_max_iosize;
202 extern unsigned int preheat_max_bytes;
203 extern unsigned int preheat_min_bytes;
204 extern long numvnodes;
205 extern long freevnodes;
206 extern long num_recycledvnodes;
207
208 extern uuid_string_t bootsessionuuid_string;
209
210 extern unsigned int vm_max_delayed_work_limit;
211 extern unsigned int vm_max_batch;
212
213 extern unsigned int vm_page_free_min;
214 extern unsigned int vm_page_free_target;
215 extern unsigned int vm_page_free_reserved;
216
217 #if (DEVELOPMENT || DEBUG)
218 extern uint32_t vm_page_creation_throttled_hard;
219 extern uint32_t vm_page_creation_throttled_soft;
220 #endif /* DEVELOPMENT || DEBUG */
221
222 #if DEVELOPMENT || DEBUG
223 extern bool bootarg_hide_process_traced;
224 #endif
225
226 /*
227 * Conditionally allow dtrace to see these functions for debugging purposes.
228 */
229 #ifdef STATIC
230 #undef STATIC
231 #endif
232 #if 0
233 #define STATIC
234 #else
235 #define STATIC static
236 #endif
237
238 extern boolean_t mach_timer_coalescing_enabled;
239
240 extern uint64_t timer_deadline_tracking_bin_1, timer_deadline_tracking_bin_2;
241
242 STATIC void
243 fill_user32_eproc(proc_t, struct user32_eproc *__restrict);
244 STATIC void
245 fill_user32_externproc(proc_t, struct user32_extern_proc *__restrict);
246 STATIC void
247 fill_user64_eproc(proc_t, struct user64_eproc *__restrict);
248 STATIC void
249 fill_user64_proc(proc_t, struct user64_kinfo_proc *__restrict);
250 STATIC void
251 fill_user64_externproc(proc_t, struct user64_extern_proc *__restrict);
252 STATIC void
253 fill_user32_proc(proc_t, struct user32_kinfo_proc *__restrict);
254
255 #if CONFIG_NETBOOT
256 extern int
257 netboot_root(void);
258 #endif
259 int
260 sysctl_procargs(int *name, u_int namelen, user_addr_t where,
261 size_t *sizep, proc_t cur_proc);
262 STATIC int
263 sysctl_procargsx(int *name, u_int namelen, user_addr_t where, size_t *sizep,
264 proc_t cur_proc, int argc_yes);
265 int
266 sysctl_struct(user_addr_t oldp, size_t *oldlenp, user_addr_t newp,
267 size_t newlen, void *sp, int len);
268
269 STATIC int sysdoproc_filt_KERN_PROC_PID(proc_t p, void * arg);
270 STATIC int sysdoproc_filt_KERN_PROC_PGRP(proc_t p, void * arg);
271 STATIC int sysdoproc_filt_KERN_PROC_TTY(proc_t p, void * arg);
272 STATIC int sysdoproc_filt_KERN_PROC_UID(proc_t p, void * arg);
273 STATIC int sysdoproc_filt_KERN_PROC_RUID(proc_t p, void * arg);
274 int sysdoproc_callback(proc_t p, void *arg);
275
276 #if CONFIG_THREAD_GROUPS && (DEVELOPMENT || DEBUG)
277 STATIC int sysctl_get_thread_group_id SYSCTL_HANDLER_ARGS;
278 #endif
279
280 /* forward declarations for non-static STATIC */
281 STATIC void fill_loadavg64(struct loadavg *la, struct user64_loadavg *la64);
282 STATIC void fill_loadavg32(struct loadavg *la, struct user32_loadavg *la32);
283 STATIC int sysctl_handle_kern_threadname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
284 STATIC int sysctl_sched_stats(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
285 STATIC int sysctl_sched_stats_enable(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
286 #if COUNT_SYSCALLS
287 STATIC int sysctl_docountsyscalls SYSCTL_HANDLER_ARGS;
288 #endif /* COUNT_SYSCALLS */
289 #if defined(XNU_TARGET_OS_OSX)
290 STATIC int sysctl_doprocargs SYSCTL_HANDLER_ARGS;
291 #endif /* defined(XNU_TARGET_OS_OSX) */
292 STATIC int sysctl_doprocargs2 SYSCTL_HANDLER_ARGS;
293 STATIC int sysctl_prochandle SYSCTL_HANDLER_ARGS;
294 STATIC int sysctl_aiomax(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
295 STATIC int sysctl_aioprocmax(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
296 STATIC int sysctl_aiothreads(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
297 STATIC int sysctl_maxproc(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
298 STATIC int sysctl_osversion(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
299 STATIC int sysctl_sysctl_bootargs(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
300 STATIC int sysctl_maxvnodes(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
301 STATIC int sysctl_securelvl(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
302 STATIC int sysctl_domainname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
303 STATIC int sysctl_hostname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
304 STATIC int sysctl_procname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
305 STATIC int sysctl_boottime(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
306 STATIC int sysctl_bootuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
307 STATIC int sysctl_symfile(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
308 #if CONFIG_NETBOOT
309 STATIC int sysctl_netboot(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
310 #endif
311 #ifdef CONFIG_IMGSRC_ACCESS
312 STATIC int sysctl_imgsrcdev(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
313 #endif
314 STATIC int sysctl_usrstack(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
315 STATIC int sysctl_usrstack64(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
316 #if CONFIG_COREDUMP
317 STATIC int sysctl_coredump(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
318 STATIC int sysctl_suid_coredump(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
319 #endif
320 STATIC int sysctl_delayterm(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
321 STATIC int sysctl_rage_vnode(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
322 STATIC int sysctl_kern_check_openevt(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
323 #if DEVELOPMENT || DEBUG
324 STATIC int sysctl_nx(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
325 #endif
326 STATIC int sysctl_loadavg(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
327 STATIC int sysctl_vm_toggle_address_reuse(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
328 STATIC int sysctl_swapusage(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
329 STATIC int fetch_process_cputype( proc_t cur_proc, int *name, u_int namelen, cpu_type_t *cputype);
330 STATIC int sysctl_sysctl_native(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
331 STATIC int sysctl_sysctl_cputype(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
332 STATIC int sysctl_safeboot(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
333 STATIC int sysctl_singleuser(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
334 STATIC int sysctl_minimalboot(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
335 STATIC int sysctl_slide(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
336
337 #ifdef CONFIG_XNUPOST
338 #include <tests/xnupost.h>
339
340 STATIC int sysctl_debug_test_oslog_ctl(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
341 STATIC int sysctl_debug_test_stackshot_mutex_owner(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
342 STATIC int sysctl_debug_test_stackshot_rwlck_owner(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
343 #endif
344
345 extern void IORegistrySetOSBuildVersion(char * build_version);
346 extern int IOParseWorkloadConfig(workload_config_ctx_t *ctx, const char * buffer, size_t size);
347 extern int IOUnparseWorkloadConfig(char *buffer, size_t *size);
348
349 STATIC void
fill_loadavg64(struct loadavg * la,struct user64_loadavg * la64)350 fill_loadavg64(struct loadavg *la, struct user64_loadavg *la64)
351 {
352 la64->ldavg[0] = la->ldavg[0];
353 la64->ldavg[1] = la->ldavg[1];
354 la64->ldavg[2] = la->ldavg[2];
355 la64->fscale = (user64_long_t)la->fscale;
356 }
357
358 STATIC void
fill_loadavg32(struct loadavg * la,struct user32_loadavg * la32)359 fill_loadavg32(struct loadavg *la, struct user32_loadavg *la32)
360 {
361 la32->ldavg[0] = la->ldavg[0];
362 la32->ldavg[1] = la->ldavg[1];
363 la32->ldavg[2] = la->ldavg[2];
364 la32->fscale = (user32_long_t)la->fscale;
365 }
366
367 #if COUNT_SYSCALLS
368 extern int do_count_syscalls;
369 #endif
370
/*
 * System security level.  Builds that define INSECURE start at -1;
 * all other builds leave the variable without an explicit initializer.
 */
#ifndef INSECURE
int securelevel;
#else
int securelevel = -1;
#endif
376
377 STATIC int
sysctl_handle_kern_threadname(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)378 sysctl_handle_kern_threadname( __unused struct sysctl_oid *oidp, __unused void *arg1,
379 __unused int arg2, struct sysctl_req *req)
380 {
381 int error;
382 struct uthread *ut = current_uthread();
383 user_addr_t oldp = 0, newp = 0;
384 size_t *oldlenp = NULL;
385 size_t newlen = 0;
386
387 oldp = req->oldptr;
388 oldlenp = &(req->oldlen);
389 newp = req->newptr;
390 newlen = req->newlen;
391
392 /* We want the current length, and maybe the string itself */
393 if (oldlenp) {
394 /* if we have no thread name yet tell'em we want MAXTHREADNAMESIZE - 1 */
395 size_t currlen = MAXTHREADNAMESIZE - 1;
396
397 if (ut->pth_name) {
398 /* use length of current thread name */
399 currlen = strlen(ut->pth_name);
400 }
401 if (oldp) {
402 if (*oldlenp < currlen) {
403 return ENOMEM;
404 }
405 /* NOTE - we do not copy the NULL terminator */
406 if (ut->pth_name) {
407 error = copyout(ut->pth_name, oldp, currlen);
408 if (error) {
409 return error;
410 }
411 }
412 }
413 /* return length of thread name minus NULL terminator (just like strlen) */
414 req->oldidx = currlen;
415 }
416
417 /* We want to set the name to something */
418 if (newp) {
419 if (newlen > (MAXTHREADNAMESIZE - 1)) {
420 return ENAMETOOLONG;
421 }
422 if (!ut->pth_name) {
423 char *tmp_pth_name = (char *)kalloc_data(MAXTHREADNAMESIZE,
424 Z_WAITOK | Z_ZERO);
425 if (!tmp_pth_name) {
426 return ENOMEM;
427 }
428 if (!OSCompareAndSwapPtr(NULL, tmp_pth_name, &ut->pth_name)) {
429 kfree_data(tmp_pth_name, MAXTHREADNAMESIZE);
430 return EBUSY;
431 }
432 } else {
433 kernel_debug_string_simple(TRACE_STRING_THREADNAME_PREV, ut->pth_name);
434 bzero(ut->pth_name, MAXTHREADNAMESIZE);
435 }
436 error = copyin(newp, ut->pth_name, newlen);
437 if (error) {
438 return error;
439 }
440
441 kernel_debug_string_simple(TRACE_STRING_THREADNAME, ut->pth_name);
442 }
443
444 return 0;
445 }
446
447 SYSCTL_PROC(_kern, KERN_THREADNAME, threadname, CTLFLAG_ANYBODY | CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, sysctl_handle_kern_threadname, "A", "");
448
449 #define WORKLOAD_CONFIG_MAX_SIZE (128 * 1024 * 1024)
450
451 /* Called locked - sysctl defined without CTLFLAG_LOCKED. */
452 static int
453 sysctl_workload_config SYSCTL_HANDLER_ARGS
454 {
455 #pragma unused(arg1, arg2)
456
457 char *plist_blob = NULL;
458 kern_return_t ret = KERN_FAILURE;
459 int error = -1;
460
461 /* Only allow reading of workload config on non-RELEASE kernels. */
462 #if DEVELOPMENT || DEBUG
463
464 const size_t buf_size = req->oldlen;
465
466 if (!req->oldptr) {
467 /* Just looking for the size to allocate. */
468 size_t size = 0;
469 ret = IOUnparseWorkloadConfig(NULL, &size);
470 if (ret != KERN_SUCCESS) {
471 return ENOMEM;
472 }
473
474 error = SYSCTL_OUT(req, NULL, size);
475 if (error) {
476 return error;
477 }
478 } else {
479 if (buf_size > (WORKLOAD_CONFIG_MAX_SIZE - 1) ||
480 buf_size == 0) {
481 return EINVAL;
482 }
483
484 plist_blob = kalloc_data(buf_size, Z_WAITOK | Z_ZERO);
485 if (!plist_blob) {
486 return ENOMEM;
487 }
488
489 size_t size = buf_size;
490 ret = IOUnparseWorkloadConfig(plist_blob, &size);
491 if (ret != KERN_SUCCESS) {
492 kfree_data(plist_blob, buf_size);
493 return ENOMEM;
494 }
495
496 error = SYSCTL_OUT(req, plist_blob, MIN(buf_size, size));
497
498 /* If the buffer was too small to fit the entire config. */
499 if (buf_size < size) {
500 error = ENOMEM;
501 }
502
503 kfree_data(plist_blob, buf_size);
504 if (error) {
505 return error;
506 }
507 }
508 #endif /* DEVELOPMENT || DEBUG */
509
510 if (req->newptr) {
511 size_t newlen = req->newlen;
512 if (newlen > (WORKLOAD_CONFIG_MAX_SIZE - 1)) {
513 return EINVAL;
514 }
515
516
517 workload_config_ctx_t *ctx = NULL;
518 /*
519 * Only allow workload_config_boot to be loaded once at boot by launchd.
520 */
521 if (current_proc() == initproc &&
522 !workload_config_initialized(&workload_config_boot)) {
523 ctx = &workload_config_boot;
524 } else {
525 #if DEVELOPMENT || DEBUG
526 /*
527 * Use the devel config context otherwise. If a devel config has been
528 * initialized it will be used for lookups in place of the boot config.
529 */
530 ctx = &workload_config_devel;
531 if (workload_config_initialized(ctx)) {
532 workload_config_free(ctx);
533 }
534
535 /* The devel context can be explicitly cleared by an empty string. */
536 if (newlen == 1) {
537 return 0;
538 }
539 #else
540 return EINVAL;
541 #endif
542 }
543
544 plist_blob = kalloc_data(newlen + 1, Z_WAITOK | Z_ZERO);
545 if (!plist_blob) {
546 return ENOMEM;
547 }
548 error = copyin(req->newptr, plist_blob, newlen);
549 if (error) {
550 kfree_data(plist_blob, newlen + 1);
551 return error;
552 }
553 plist_blob[newlen] = '\0';
554 ret = IOParseWorkloadConfig(ctx, plist_blob, newlen + 1);
555
556 kfree_data(plist_blob, newlen + 1);
557 return ret == KERN_SUCCESS ? 0 : EINVAL;
558 }
559
560 return 0;
561 }
562
563 SYSCTL_PROC(_kern, OID_AUTO, workload_config, CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_MASKED,
564 0, 0, sysctl_workload_config, "A", "global workgroup configuration plist load/unload");
565
566 #define BSD_HOST 1
567 STATIC int
sysctl_sched_stats(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)568 sysctl_sched_stats(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
569 {
570 host_basic_info_data_t hinfo;
571 kern_return_t kret;
572 uint32_t size;
573 uint32_t buf_size = 0;
574 int changed;
575 mach_msg_type_number_t count = HOST_BASIC_INFO_COUNT;
576 struct _processor_statistics_np *buf;
577 int error;
578
579 kret = host_info((host_t)BSD_HOST, HOST_BASIC_INFO, (host_info_t)&hinfo, &count);
580 if (kret != KERN_SUCCESS) {
581 return EINVAL;
582 }
583
584 size = sizeof(struct _processor_statistics_np) * (hinfo.logical_cpu_max + 2); /* One for RT Queue, One for Fair Share Queue */
585
586 if (req->oldlen < size) {
587 return EINVAL;
588 }
589
590 buf_size = size;
591 buf = (struct _processor_statistics_np *)kalloc_data(buf_size, Z_ZERO | Z_WAITOK);
592
593 kret = get_sched_statistics(buf, &size);
594 if (kret != KERN_SUCCESS) {
595 error = EINVAL;
596 goto out;
597 }
598
599 error = sysctl_io_opaque(req, buf, size, &changed);
600 if (error) {
601 goto out;
602 }
603
604 if (changed) {
605 panic("Sched info changed?!");
606 }
607 out:
608 kfree_data(buf, buf_size);
609 return error;
610 }
611
612 SYSCTL_PROC(_kern, OID_AUTO, sched_stats, CTLFLAG_LOCKED, 0, 0, sysctl_sched_stats, "-", "");
613
614 STATIC int
sysctl_sched_stats_enable(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,__unused struct sysctl_req * req)615 sysctl_sched_stats_enable(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, __unused struct sysctl_req *req)
616 {
617 boolean_t active;
618 int res;
619
620 if (req->newlen != sizeof(active)) {
621 return EINVAL;
622 }
623
624 res = copyin(req->newptr, &active, sizeof(active));
625 if (res != 0) {
626 return res;
627 }
628
629 return set_sched_stats_active(active);
630 }
631
632 SYSCTL_PROC(_kern, OID_AUTO, sched_stats_enable, CTLFLAG_LOCKED | CTLFLAG_WR, 0, 0, sysctl_sched_stats_enable, "-", "");
633
634 extern uint32_t sched_debug_flags;
635 SYSCTL_INT(_debug, OID_AUTO, sched, CTLFLAG_RW | CTLFLAG_LOCKED, &sched_debug_flags, 0, "scheduler debug");
636
637 #if (DEBUG || DEVELOPMENT)
638 extern boolean_t doprnt_hide_pointers;
639 SYSCTL_INT(_debug, OID_AUTO, hide_kernel_pointers, CTLFLAG_RW | CTLFLAG_LOCKED, &doprnt_hide_pointers, 0, "hide kernel pointers from log");
640 #endif
641
642
643 extern int get_kernel_symfile(proc_t, char **);
644
645 #if COUNT_SYSCALLS
646 #define KERN_COUNT_SYSCALLS (KERN_OSTYPE + 1000)
647
648 extern const unsigned int nsysent;
649 extern int syscalls_log[];
650 extern const char *syscallnames[];
651
652 STATIC int
653 sysctl_docountsyscalls SYSCTL_HANDLER_ARGS
654 {
655 __unused int cmd = oidp->oid_arg2; /* subcommand*/
656 __unused int *name = arg1; /* oid element argument vector */
657 __unused int namelen = arg2; /* number of oid element arguments */
658 int error, changed;
659
660 int tmp;
661
662 /* valid values passed in:
663 * = 0 means don't keep called counts for each bsd syscall
664 * > 0 means keep called counts for each bsd syscall
665 * = 2 means dump current counts to the system log
666 * = 3 means reset all counts
667 * for example, to dump current counts:
668 * sysctl -w kern.count_calls=2
669 */
670 error = sysctl_io_number(req, do_count_syscalls,
671 sizeof(do_count_syscalls), &tmp, &changed);
672
673 if (error != 0 || !changed) {
674 return error;
675 }
676
677 if (tmp == 1) {
678 do_count_syscalls = 1;
679 } else if (tmp == 0 || tmp == 2 || tmp == 3) {
680 for (int i = 0; i < nsysent; i++) {
681 if (syscalls_log[i] != 0) {
682 if (tmp == 2) {
683 printf("%d calls - name %s \n", syscalls_log[i], syscallnames[i]);
684 } else {
685 syscalls_log[i] = 0;
686 }
687 }
688 }
689 do_count_syscalls = (tmp != 0);
690 }
691
692 return error;
693 }
694 SYSCTL_PROC(_kern, KERN_COUNT_SYSCALLS, count_syscalls, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
695 0, /* Pointer argument (arg1) */
696 0, /* Integer argument (arg2) */
697 sysctl_docountsyscalls, /* Handler function */
698 NULL, /* Data pointer */
699 "");
700 #endif /* COUNT_SYSCALLS */
701
702 /*
703 * The following sysctl_* functions should not be used
704 * any more, as they can only cope with callers in
705 * user mode: Use new-style
706 * sysctl_io_number()
707 * sysctl_io_string()
708 * sysctl_io_opaque()
709 * instead.
710 */
711
712 STATIC int
sysdoproc_filt_KERN_PROC_PID(proc_t p,void * arg)713 sysdoproc_filt_KERN_PROC_PID(proc_t p, void * arg)
714 {
715 if (proc_getpid(p) != (pid_t)*(int*)arg) {
716 return 0;
717 } else {
718 return 1;
719 }
720 }
721
722 STATIC int
sysdoproc_filt_KERN_PROC_PGRP(proc_t p,void * arg)723 sysdoproc_filt_KERN_PROC_PGRP(proc_t p, void * arg)
724 {
725 if (p->p_pgrpid != (pid_t)*(int*)arg) {
726 return 0;
727 } else {
728 return 1;
729 }
730 }
731
732 STATIC int
sysdoproc_filt_KERN_PROC_TTY(proc_t p,void * arg)733 sysdoproc_filt_KERN_PROC_TTY(proc_t p, void * arg)
734 {
735 struct pgrp *pg;
736 dev_t dev = NODEV;
737
738 if ((p->p_flag & P_CONTROLT) && (pg = proc_pgrp(p, NULL)) != PGRP_NULL) {
739 dev = os_atomic_load(&pg->pg_session->s_ttydev, relaxed);
740 pgrp_rele(pg);
741 }
742
743 return dev != NODEV && dev == (dev_t)*(int *)arg;
744 }
745
746 STATIC int
sysdoproc_filt_KERN_PROC_UID(proc_t p,void * arg)747 sysdoproc_filt_KERN_PROC_UID(proc_t p, void * arg)
748 {
749 uid_t uid;
750
751 smr_proc_task_enter();
752 uid = kauth_cred_getuid(proc_ucred_smr(p));
753 smr_proc_task_leave();
754
755 if (uid != (uid_t)*(int*)arg) {
756 return 0;
757 } else {
758 return 1;
759 }
760 }
761
762
763 STATIC int
sysdoproc_filt_KERN_PROC_RUID(proc_t p,void * arg)764 sysdoproc_filt_KERN_PROC_RUID(proc_t p, void * arg)
765 {
766 uid_t ruid;
767
768 smr_proc_task_enter();
769 ruid = kauth_cred_getruid(proc_ucred_smr(p));
770 smr_proc_task_leave();
771
772 if (ruid != (uid_t)*(int*)arg) {
773 return 0;
774 } else {
775 return 1;
776 }
777 }
778
779 /*
780 * try over estimating by 5 procs
781 */
782 #define KERN_PROCSLOP (5 * sizeof(struct kinfo_proc))
783 struct sysdoproc_args {
784 size_t buflen;
785 void *kprocp;
786 boolean_t is_64_bit;
787 user_addr_t dp;
788 size_t needed;
789 unsigned int sizeof_kproc;
790 int *errorp;
791 int uidcheck;
792 int ruidcheck;
793 int ttycheck;
794 int uidval;
795 };
796
797 int
sysdoproc_callback(proc_t p,void * arg)798 sysdoproc_callback(proc_t p, void *arg)
799 {
800 struct sysdoproc_args *args = arg;
801
802 if (args->buflen >= args->sizeof_kproc) {
803 if ((args->ruidcheck != 0) && (sysdoproc_filt_KERN_PROC_RUID(p, &args->uidval) == 0)) {
804 return PROC_RETURNED;
805 }
806 if ((args->uidcheck != 0) && (sysdoproc_filt_KERN_PROC_UID(p, &args->uidval) == 0)) {
807 return PROC_RETURNED;
808 }
809 if ((args->ttycheck != 0) && (sysdoproc_filt_KERN_PROC_TTY(p, &args->uidval) == 0)) {
810 return PROC_RETURNED;
811 }
812
813 bzero(args->kprocp, args->sizeof_kproc);
814 if (args->is_64_bit) {
815 fill_user64_proc(p, args->kprocp);
816 } else {
817 fill_user32_proc(p, args->kprocp);
818 }
819 int error = copyout(args->kprocp, args->dp, args->sizeof_kproc);
820 if (error) {
821 *args->errorp = error;
822 return PROC_RETURNED_DONE;
823 }
824 args->dp += args->sizeof_kproc;
825 args->buflen -= args->sizeof_kproc;
826 }
827 args->needed += args->sizeof_kproc;
828 return PROC_RETURNED;
829 }
830
831 SYSCTL_NODE(_kern, KERN_PROC, proc, CTLFLAG_RD | CTLFLAG_LOCKED, 0, "");
832 STATIC int
833 sysctl_prochandle SYSCTL_HANDLER_ARGS
834 {
835 int cmd = oidp->oid_arg2; /* subcommand for multiple nodes */
836 int *name = arg1; /* oid element argument vector */
837 int namelen = arg2; /* number of oid element arguments */
838 user_addr_t where = req->oldptr;/* user buffer copy out address */
839
840 user_addr_t dp = where;
841 size_t needed = 0;
842 size_t buflen = where != USER_ADDR_NULL ? req->oldlen : 0;
843 int error = 0;
844 boolean_t is_64_bit = proc_is64bit(current_proc());
845 struct user32_kinfo_proc user32_kproc;
846 struct user64_kinfo_proc user_kproc;
847 int sizeof_kproc;
848 void *kprocp;
849 int (*filterfn)(proc_t, void *) = 0;
850 struct sysdoproc_args args;
851 int uidcheck = 0;
852 int ruidcheck = 0;
853 int ttycheck = 0;
854
855 if (namelen != 1 && !(namelen == 0 && cmd == KERN_PROC_ALL)) {
856 return EINVAL;
857 }
858
859 if (is_64_bit) {
860 sizeof_kproc = sizeof(user_kproc);
861 kprocp = &user_kproc;
862 } else {
863 sizeof_kproc = sizeof(user32_kproc);
864 kprocp = &user32_kproc;
865 }
866
867 switch (cmd) {
868 case KERN_PROC_PID:
869 filterfn = sysdoproc_filt_KERN_PROC_PID;
870 break;
871
872 case KERN_PROC_PGRP:
873 filterfn = sysdoproc_filt_KERN_PROC_PGRP;
874 break;
875
876 case KERN_PROC_TTY:
877 ttycheck = 1;
878 break;
879
880 case KERN_PROC_UID:
881 uidcheck = 1;
882 break;
883
884 case KERN_PROC_RUID:
885 ruidcheck = 1;
886 break;
887
888 case KERN_PROC_ALL:
889 break;
890
891 default:
892 /* must be kern.proc.<unknown> */
893 return ENOTSUP;
894 }
895
896 error = 0;
897 args.buflen = buflen;
898 args.kprocp = kprocp;
899 args.is_64_bit = is_64_bit;
900 args.dp = dp;
901 args.needed = needed;
902 args.errorp = &error;
903 args.uidcheck = uidcheck;
904 args.ruidcheck = ruidcheck;
905 args.ttycheck = ttycheck;
906 args.sizeof_kproc = sizeof_kproc;
907 if (namelen) {
908 args.uidval = name[0];
909 }
910
911 proc_iterate((PROC_ALLPROCLIST | PROC_ZOMBPROCLIST),
912 sysdoproc_callback, &args, filterfn, name);
913
914 if (error) {
915 return error;
916 }
917
918 dp = args.dp;
919 needed = args.needed;
920
921 if (where != USER_ADDR_NULL) {
922 req->oldlen = dp - where;
923 if (needed > req->oldlen) {
924 return ENOMEM;
925 }
926 } else {
927 needed += KERN_PROCSLOP;
928 req->oldlen = needed;
929 }
930 /* adjust index so we return the right required/consumed amount */
931 req->oldidx += req->oldlen;
932 return 0;
933 }
934
935
936 /*
937 * We specify the subcommand code for multiple nodes as the 'req->arg2' value
938 * in the sysctl declaration itself, which comes into the handler function
939 * as 'oidp->oid_arg2'.
940 *
941 * For these particular sysctls, since they have well known OIDs, we could
942 * have just obtained it from the '((int *)arg1)[0]' parameter, but that would
943 * not demonstrate how to handle multiple sysctls that used OID_AUTO instead
944 * of a well known value with a common handler function. This is desirable,
945 * because we want well known values to "go away" at some future date.
946 *
 * It should be noted that the value of '((int *)arg1)[1]' is used as
 * an integer parameter to the subcommand for many of these sysctls; we'd
 * rather have used '((int *)arg1)[0]' for that, or even better, an element
 * in a structure passed in as the 'newp' argument to sysctlbyname(3),
951 * and then use leaf-node permissions enforcement, but that would have
952 * necessitated modifying user space code to correspond to the interface
953 * change, and we are striving for binary backward compatibility here; even
954 * though these are SPI, and not intended for use by user space applications
955 * which are not themselves system tools or libraries, some applications
956 * have erroneously used them.
957 */
958 SYSCTL_PROC(_kern_proc, KERN_PROC_ALL, all, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
959 0, /* Pointer argument (arg1) */
960 KERN_PROC_ALL, /* Integer argument (arg2) */
961 sysctl_prochandle, /* Handler function */
962 NULL, /* Data is size variant on ILP32/LP64 */
963 "");
964 SYSCTL_PROC(_kern_proc, KERN_PROC_PID, pid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
965 0, /* Pointer argument (arg1) */
966 KERN_PROC_PID, /* Integer argument (arg2) */
967 sysctl_prochandle, /* Handler function */
968 NULL, /* Data is size variant on ILP32/LP64 */
969 "");
970 SYSCTL_PROC(_kern_proc, KERN_PROC_TTY, tty, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
971 0, /* Pointer argument (arg1) */
972 KERN_PROC_TTY, /* Integer argument (arg2) */
973 sysctl_prochandle, /* Handler function */
974 NULL, /* Data is size variant on ILP32/LP64 */
975 "");
976 SYSCTL_PROC(_kern_proc, KERN_PROC_PGRP, pgrp, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
977 0, /* Pointer argument (arg1) */
978 KERN_PROC_PGRP, /* Integer argument (arg2) */
979 sysctl_prochandle, /* Handler function */
980 NULL, /* Data is size variant on ILP32/LP64 */
981 "");
982 SYSCTL_PROC(_kern_proc, KERN_PROC_UID, uid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
983 0, /* Pointer argument (arg1) */
984 KERN_PROC_UID, /* Integer argument (arg2) */
985 sysctl_prochandle, /* Handler function */
986 NULL, /* Data is size variant on ILP32/LP64 */
987 "");
988 SYSCTL_PROC(_kern_proc, KERN_PROC_RUID, ruid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
989 0, /* Pointer argument (arg1) */
990 KERN_PROC_RUID, /* Integer argument (arg2) */
991 sysctl_prochandle, /* Handler function */
992 NULL, /* Data is size variant on ILP32/LP64 */
993 "");
994 SYSCTL_PROC(_kern_proc, KERN_PROC_LCID, lcid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
995 0, /* Pointer argument (arg1) */
996 KERN_PROC_LCID, /* Integer argument (arg2) */
997 sysctl_prochandle, /* Handler function */
998 NULL, /* Data is size variant on ILP32/LP64 */
999 "");
1000
1001
1002 /*
1003 * Fill in non-zero fields of an eproc structure for the specified process.
1004 */
1005 STATIC void
fill_user32_eproc(proc_t p,struct user32_eproc * __restrict ep)1006 fill_user32_eproc(proc_t p, struct user32_eproc *__restrict ep)
1007 {
1008 struct pgrp *pg;
1009 struct session *sessp;
1010 kauth_cred_t my_cred;
1011
1012 pg = proc_pgrp(p, &sessp);
1013
1014 if (pg != PGRP_NULL) {
1015 ep->e_pgid = p->p_pgrpid;
1016 ep->e_jobc = pg->pg_jobc;
1017 if (sessp->s_ttyvp) {
1018 ep->e_flag = EPROC_CTTY;
1019 }
1020 }
1021
1022 ep->e_ppid = p->p_ppid;
1023
1024 smr_proc_task_enter();
1025 my_cred = proc_ucred_smr(p);
1026
1027 /* A fake historical pcred */
1028 ep->e_pcred.p_ruid = kauth_cred_getruid(my_cred);
1029 ep->e_pcred.p_svuid = kauth_cred_getsvuid(my_cred);
1030 ep->e_pcred.p_rgid = kauth_cred_getrgid(my_cred);
1031 ep->e_pcred.p_svgid = kauth_cred_getsvgid(my_cred);
1032
1033 /* A fake historical *kauth_cred_t */
1034 unsigned long refcnt = os_atomic_load(&my_cred->cr_ref, relaxed);
1035 ep->e_ucred.cr_ref = (uint32_t)MIN(refcnt, UINT32_MAX);
1036 ep->e_ucred.cr_uid = kauth_cred_getuid(my_cred);
1037 ep->e_ucred.cr_ngroups = (short)posix_cred_get(my_cred)->cr_ngroups;
1038 bcopy(posix_cred_get(my_cred)->cr_groups,
1039 ep->e_ucred.cr_groups, NGROUPS * sizeof(gid_t));
1040
1041 my_cred = NOCRED;
1042 smr_proc_task_leave();
1043
1044 ep->e_tdev = NODEV;
1045 if (pg != PGRP_NULL) {
1046 if (p->p_flag & P_CONTROLT) {
1047 session_lock(sessp);
1048 ep->e_tdev = os_atomic_load(&sessp->s_ttydev, relaxed);
1049 ep->e_tpgid = sessp->s_ttypgrpid;
1050 session_unlock(sessp);
1051 }
1052 if (SESS_LEADER(p, sessp)) {
1053 ep->e_flag |= EPROC_SLEADER;
1054 }
1055 pgrp_rele(pg);
1056 }
1057 }
1058
1059 /*
1060 * Fill in non-zero fields of an LP64 eproc structure for the specified process.
1061 */
1062 STATIC void
fill_user64_eproc(proc_t p,struct user64_eproc * __restrict ep)1063 fill_user64_eproc(proc_t p, struct user64_eproc *__restrict ep)
1064 {
1065 struct pgrp *pg;
1066 struct session *sessp;
1067 kauth_cred_t my_cred;
1068
1069 pg = proc_pgrp(p, &sessp);
1070
1071 if (pg != PGRP_NULL) {
1072 ep->e_pgid = p->p_pgrpid;
1073 ep->e_jobc = pg->pg_jobc;
1074 if (sessp->s_ttyvp) {
1075 ep->e_flag = EPROC_CTTY;
1076 }
1077 }
1078
1079 ep->e_ppid = p->p_ppid;
1080
1081 smr_proc_task_enter();
1082 my_cred = proc_ucred_smr(p);
1083
1084 /* A fake historical pcred */
1085 ep->e_pcred.p_ruid = kauth_cred_getruid(my_cred);
1086 ep->e_pcred.p_svuid = kauth_cred_getsvuid(my_cred);
1087 ep->e_pcred.p_rgid = kauth_cred_getrgid(my_cred);
1088 ep->e_pcred.p_svgid = kauth_cred_getsvgid(my_cred);
1089
1090 /* A fake historical *kauth_cred_t */
1091 unsigned long refcnt = os_atomic_load(&my_cred->cr_ref, relaxed);
1092 ep->e_ucred.cr_ref = (uint32_t)MIN(refcnt, UINT32_MAX);
1093 ep->e_ucred.cr_uid = kauth_cred_getuid(my_cred);
1094 ep->e_ucred.cr_ngroups = (short)posix_cred_get(my_cred)->cr_ngroups;
1095 bcopy(posix_cred_get(my_cred)->cr_groups,
1096 ep->e_ucred.cr_groups, NGROUPS * sizeof(gid_t));
1097
1098 my_cred = NOCRED;
1099 smr_proc_task_leave();
1100
1101 ep->e_tdev = NODEV;
1102 if (pg != PGRP_NULL) {
1103 if (p->p_flag & P_CONTROLT) {
1104 session_lock(sessp);
1105 ep->e_tdev = os_atomic_load(&sessp->s_ttydev, relaxed);
1106 ep->e_tpgid = sessp->s_ttypgrpid;
1107 session_unlock(sessp);
1108 }
1109 if (SESS_LEADER(p, sessp)) {
1110 ep->e_flag |= EPROC_SLEADER;
1111 }
1112 pgrp_rele(pg);
1113 }
1114 }
1115
1116 /*
1117 * Fill in an eproc structure for the specified process.
1118 * bzeroed by our caller, so only set non-zero fields.
1119 */
1120 STATIC void
fill_user32_externproc(proc_t p,struct user32_extern_proc * __restrict exp)1121 fill_user32_externproc(proc_t p, struct user32_extern_proc *__restrict exp)
1122 {
1123 exp->p_starttime.tv_sec = (user32_time_t)p->p_start.tv_sec;
1124 exp->p_starttime.tv_usec = p->p_start.tv_usec;
1125 exp->p_flag = p->p_flag;
1126 #if DEVELOPMENT || DEBUG
1127 if (p->p_lflag & P_LTRACED && !bootarg_hide_process_traced) {
1128 #else
1129 if (p->p_lflag & P_LTRACED) {
1130 #endif
1131 exp->p_flag |= P_TRACED;
1132 }
1133 if (p->p_lflag & P_LPPWAIT) {
1134 exp->p_flag |= P_PPWAIT;
1135 }
1136 if (p->p_lflag & P_LEXIT) {
1137 exp->p_flag |= P_WEXIT;
1138 }
1139 exp->p_stat = p->p_stat;
1140 exp->p_pid = proc_getpid(p);
1141 #if DEVELOPMENT || DEBUG
1142 if (bootarg_hide_process_traced) {
1143 exp->p_oppid = 0;
1144 } else
1145 #endif
1146 {
1147 exp->p_oppid = p->p_oppid;
1148 }
1149 /* Mach related */
1150 exp->p_debugger = p->p_debugger;
1151 exp->sigwait = p->sigwait;
1152 /* scheduling */
1153 #ifdef _PROC_HAS_SCHEDINFO_
1154 exp->p_estcpu = p->p_estcpu;
1155 exp->p_pctcpu = p->p_pctcpu;
1156 exp->p_slptime = p->p_slptime;
1157 #endif
1158 exp->p_realtimer.it_interval.tv_sec =
1159 (user32_time_t)p->p_realtimer.it_interval.tv_sec;
1160 exp->p_realtimer.it_interval.tv_usec =
1161 (__int32_t)p->p_realtimer.it_interval.tv_usec;
1162
1163 exp->p_realtimer.it_value.tv_sec =
1164 (user32_time_t)p->p_realtimer.it_value.tv_sec;
1165 exp->p_realtimer.it_value.tv_usec =
1166 (__int32_t)p->p_realtimer.it_value.tv_usec;
1167
1168 exp->p_rtime.tv_sec = (user32_time_t)p->p_rtime.tv_sec;
1169 exp->p_rtime.tv_usec = (__int32_t)p->p_rtime.tv_usec;
1170
1171 exp->p_sigignore = p->p_sigignore;
1172 exp->p_sigcatch = p->p_sigcatch;
1173 exp->p_priority = p->p_priority;
1174 exp->p_nice = p->p_nice;
1175 bcopy(&p->p_comm, &exp->p_comm, MAXCOMLEN);
1176 exp->p_xstat = (u_short)MIN(p->p_xstat, USHRT_MAX);
1177 exp->p_acflag = p->p_acflag;
1178 }
1179
1180 /*
1181 * Fill in an LP64 version of extern_proc structure for the specified process.
1182 */
1183 STATIC void
1184 fill_user64_externproc(proc_t p, struct user64_extern_proc *__restrict exp)
1185 {
1186 exp->p_starttime.tv_sec = p->p_start.tv_sec;
1187 exp->p_starttime.tv_usec = p->p_start.tv_usec;
1188 exp->p_flag = p->p_flag;
1189 #if DEVELOPMENT || DEBUG
1190 if (p->p_lflag & P_LTRACED && !bootarg_hide_process_traced) {
1191 #else
1192 if (p->p_lflag & P_LTRACED) {
1193 #endif
1194 exp->p_flag |= P_TRACED;
1195 }
1196 if (p->p_lflag & P_LPPWAIT) {
1197 exp->p_flag |= P_PPWAIT;
1198 }
1199 if (p->p_lflag & P_LEXIT) {
1200 exp->p_flag |= P_WEXIT;
1201 }
1202 exp->p_stat = p->p_stat;
1203 exp->p_pid = proc_getpid(p);
1204 #if DEVELOPMENT || DEBUG
1205 if (bootarg_hide_process_traced) {
1206 exp->p_oppid = 0;
1207 } else
1208 #endif
1209 {
1210 exp->p_oppid = p->p_oppid;
1211 }
1212 /* Mach related */
1213 exp->p_debugger = p->p_debugger;
1214 exp->sigwait = p->sigwait;
1215 /* scheduling */
1216 #ifdef _PROC_HAS_SCHEDINFO_
1217 exp->p_estcpu = p->p_estcpu;
1218 exp->p_pctcpu = p->p_pctcpu;
1219 exp->p_slptime = p->p_slptime;
1220 #endif
1221 exp->p_realtimer.it_interval.tv_sec = p->p_realtimer.it_interval.tv_sec;
1222 exp->p_realtimer.it_interval.tv_usec = p->p_realtimer.it_interval.tv_usec;
1223
1224 exp->p_realtimer.it_value.tv_sec = p->p_realtimer.it_value.tv_sec;
1225 exp->p_realtimer.it_value.tv_usec = p->p_realtimer.it_value.tv_usec;
1226
1227 exp->p_rtime.tv_sec = p->p_rtime.tv_sec;
1228 exp->p_rtime.tv_usec = p->p_rtime.tv_usec;
1229
1230 exp->p_sigignore = p->p_sigignore;
1231 exp->p_sigcatch = p->p_sigcatch;
1232 exp->p_priority = p->p_priority;
1233 exp->p_nice = p->p_nice;
1234 bcopy(&p->p_comm, &exp->p_comm, MAXCOMLEN);
1235 exp->p_xstat = (u_short)MIN(p->p_xstat, USHRT_MAX);
1236 exp->p_acflag = p->p_acflag;
1237 }
1238
1239 STATIC void
1240 fill_user32_proc(proc_t p, struct user32_kinfo_proc *__restrict kp)
1241 {
1242 /* on a 64 bit kernel, 32 bit users get some truncated information */
1243 fill_user32_externproc(p, &kp->kp_proc);
1244 fill_user32_eproc(p, &kp->kp_eproc);
1245 }
1246
1247 STATIC void
1248 fill_user64_proc(proc_t p, struct user64_kinfo_proc *__restrict kp)
1249 {
1250 fill_user64_externproc(p, &kp->kp_proc);
1251 fill_user64_eproc(p, &kp->kp_eproc);
1252 }
1253
1254 #if defined(XNU_TARGET_OS_OSX)
1255 /*
1256 * Return the top *sizep bytes of the user stack, or the entire area of the
1257 * user stack down through the saved exec_path, whichever is smaller.
1258 */
1259 STATIC int
1260 sysctl_doprocargs SYSCTL_HANDLER_ARGS
1261 {
1262 __unused int cmd = oidp->oid_arg2; /* subcommand*/
1263 int *name = arg1; /* oid element argument vector */
1264 int namelen = arg2; /* number of oid element arguments */
1265 user_addr_t oldp = req->oldptr; /* user buffer copy out address */
1266 size_t *oldlenp = &req->oldlen; /* user buffer copy out size */
1267 // user_addr_t newp = req->newptr; /* user buffer copy in address */
1268 // size_t newlen = req->newlen; /* user buffer copy in size */
1269 int error;
1270
1271 error = sysctl_procargsx( name, namelen, oldp, oldlenp, current_proc(), 0);
1272
1273 /* adjust index so we return the right required/consumed amount */
1274 if (!error) {
1275 req->oldidx += req->oldlen;
1276 }
1277
1278 return error;
1279 }
1280 SYSCTL_PROC(_kern, KERN_PROCARGS, procargs, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
1281 0, /* Pointer argument (arg1) */
1282 0, /* Integer argument (arg2) */
1283 sysctl_doprocargs, /* Handler function */
1284 NULL, /* Data pointer */
1285 "");
1286 #endif /* defined(XNU_TARGET_OS_OSX) */
1287
1288 STATIC int
1289 sysctl_doprocargs2 SYSCTL_HANDLER_ARGS
1290 {
1291 __unused int cmd = oidp->oid_arg2; /* subcommand*/
1292 int *name = arg1; /* oid element argument vector */
1293 int namelen = arg2; /* number of oid element arguments */
1294 user_addr_t oldp = req->oldptr; /* user buffer copy out address */
1295 size_t *oldlenp = &req->oldlen; /* user buffer copy out size */
1296 // user_addr_t newp = req->newptr; /* user buffer copy in address */
1297 // size_t newlen = req->newlen; /* user buffer copy in size */
1298 int error;
1299
1300 error = sysctl_procargsx( name, namelen, oldp, oldlenp, current_proc(), 1);
1301
1302 /* adjust index so we return the right required/consumed amount */
1303 if (!error) {
1304 req->oldidx += req->oldlen;
1305 }
1306
1307 return error;
1308 }
1309 SYSCTL_PROC(_kern, KERN_PROCARGS2, procargs2, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
1310 0, /* Pointer argument (arg1) */
1311 0, /* Integer argument (arg2) */
1312 sysctl_doprocargs2, /* Handler function */
1313 NULL, /* Data pointer */
1314 "");
1315
1316 #define SYSCTL_PROCARGS_READ_ENVVARS_ENTITLEMENT "com.apple.private.read-environment-variables"
1317 STATIC int
1318 sysctl_procargsx(int *name, u_int namelen, user_addr_t where,
1319 size_t *sizep, proc_t cur_proc, int argc_yes)
1320 {
1321 assert(sizep != NULL);
1322 proc_t p = NULL;
1323 size_t buflen = where != USER_ADDR_NULL ? *sizep : 0;
1324 int error = 0;
1325 struct _vm_map *proc_map = NULL;
1326 struct task * task;
1327 vm_map_copy_t tmp = NULL;
1328 user_addr_t arg_addr;
1329 size_t arg_size;
1330 caddr_t data;
1331 size_t argslen = 0;
1332 size_t size = 0;
1333 vm_offset_t copy_start = 0, copy_end;
1334 vm_offset_t smallbuffer_start;
1335 kern_return_t ret;
1336 int pid;
1337 kauth_cred_t my_cred;
1338 uid_t uid;
1339 int argc = -1;
1340 size_t argvsize;
1341 size_t remaining;
1342 size_t current_arg_index;
1343 size_t current_arg_len;
1344 const char * current_arg;
1345 bool omit_env_vars = true;
1346 user_addr_t user_stack;
1347 vm_map_offset_t effective_page_mask;
1348
1349 if (namelen < 1) {
1350 error = EINVAL;
1351 goto finish;
1352 }
1353
1354 if (argc_yes) {
1355 buflen -= sizeof(int); /* reserve first word to return argc */
1356 }
1357 /* we only care about buflen when where (oldp from sysctl) is not NULL. */
1358 /* when where (oldp from sysctl) is NULL and sizep (oldlenp from sysctl */
1359 /* is not NULL then the caller wants us to return the length needed to */
1360 /* hold the data we would return */
1361 if (where != USER_ADDR_NULL && (buflen <= 0 || buflen > ARG_MAX)) {
1362 error = EINVAL;
1363 goto finish;
1364 }
1365
1366 /*
1367 * Lookup process by pid
1368 */
1369 pid = name[0];
1370 p = proc_find(pid);
1371 if (p == NULL) {
1372 error = EINVAL;
1373 goto finish;
1374 }
1375
1376 /* Allow reading environment variables if any of the following are true:
1377 * - kernel is DEVELOPMENT || DEBUG
1378 * - target process is same as current_proc()
1379 * - target process is not cs_restricted
1380 * - SIP is off
1381 * - caller has an entitlement
1382 */
1383
1384 #if DEVELOPMENT || DEBUG
1385 omit_env_vars = false;
1386 #endif
1387 if (p == current_proc() ||
1388 !cs_restricted(p) ||
1389 #if CONFIG_CSR
1390 csr_check(CSR_ALLOW_UNRESTRICTED_DTRACE) == 0 ||
1391 #endif
1392 IOCurrentTaskHasEntitlement(SYSCTL_PROCARGS_READ_ENVVARS_ENTITLEMENT)
1393 ) {
1394 omit_env_vars = false;
1395 }
1396
1397 /*
1398 * Copy the top N bytes of the stack.
1399 * On all machines we have so far, the stack grows
1400 * downwards.
1401 *
1402 * If the user expects no more than N bytes of
1403 * argument list, use that as a guess for the
1404 * size.
1405 */
1406
1407 if (!p->user_stack) {
1408 error = EINVAL;
1409 goto finish;
1410 }
1411
1412 /* save off argc, argslen, user_stack before releasing the proc */
1413 argc = p->p_argc;
1414 argslen = p->p_argslen;
1415 user_stack = p->user_stack;
1416
1417 /*
1418 * When these sysctls were introduced, the first string in the strings
1419 * section was just the bare path of the executable. However, for security
1420 * reasons we now prefix this string with executable_path= so it can be
1421 * parsed getenv style. To avoid binary compatability issues with exising
1422 * callers of this sysctl, we strip it off here.
1423 * (rdar://problem/13746466)
1424 */
1425 #define EXECUTABLE_KEY "executable_path="
1426 argslen -= strlen(EXECUTABLE_KEY);
1427
1428 if (where == USER_ADDR_NULL && !omit_env_vars) {
1429 /* caller only wants to know length of proc args data.
1430 * If we don't need to omit environment variables, we can skip
1431 * copying the target process stack */
1432 goto calculate_size;
1433 }
1434
1435 my_cred = kauth_cred_proc_ref(p);
1436 uid = kauth_cred_getuid(my_cred);
1437 kauth_cred_unref(&my_cred);
1438
1439 if ((uid != kauth_cred_getuid(kauth_cred_get()))
1440 && suser(kauth_cred_get(), &cur_proc->p_acflag)) {
1441 error = EINVAL;
1442 goto finish;
1443 }
1444
1445 /*
1446 * Before we can block (any VM code), make another
1447 * reference to the map to keep it alive. We do
1448 * that by getting a reference on the task itself.
1449 */
1450 task = proc_task(p);
1451 if (task == NULL) {
1452 error = EINVAL;
1453 goto finish;
1454 }
1455
1456 /*
1457 * Once we have a task reference we can convert that into a
1458 * map reference, which we will use in the calls below. The
1459 * task/process may change its map after we take this reference
1460 * (see execve), but the worst that will happen then is a return
1461 * of stale info (which is always a possibility).
1462 */
1463 task_reference(task);
1464 proc_rele(p);
1465 p = NULL;
1466 proc_map = get_task_map_reference(task);
1467 task_deallocate(task);
1468
1469 if (proc_map == NULL) {
1470 error = EINVAL;
1471 goto finish;
1472 }
1473
1474 effective_page_mask = vm_map_page_mask(proc_map);
1475
1476 arg_size = vm_map_round_page(argslen, effective_page_mask);
1477
1478 arg_addr = user_stack - arg_size;
1479
1480 ret = kmem_alloc(kernel_map, ©_start, arg_size,
1481 KMA_DATA | KMA_ZERO, VM_KERN_MEMORY_BSD);
1482 if (ret != KERN_SUCCESS) {
1483 error = ENOMEM;
1484 goto finish;
1485 }
1486
1487 copy_end = copy_start + arg_size;
1488
1489 if (vm_map_copyin(proc_map, (vm_map_address_t)arg_addr,
1490 (vm_map_size_t)arg_size, FALSE, &tmp) != KERN_SUCCESS) {
1491 error = EIO;
1492 goto finish;
1493 }
1494
1495 /*
1496 * Now that we've done the copyin from the process'
1497 * map, we can release the reference to it.
1498 */
1499 vm_map_deallocate(proc_map);
1500 proc_map = NULL;
1501
1502 if (vm_map_copy_overwrite(kernel_map,
1503 (vm_map_address_t)copy_start,
1504 tmp, (vm_map_size_t) arg_size, FALSE) != KERN_SUCCESS) {
1505 error = EIO;
1506 goto finish;
1507 }
1508 /* tmp was consumed */
1509 tmp = NULL;
1510
1511 if (omit_env_vars) {
1512 argvsize = 0;
1513
1514 /* Iterate over everything in argv, plus one for the bare executable path */
1515 for (current_arg_index = 0; current_arg_index < argc + 1 && argvsize < argslen; ++current_arg_index) {
1516 current_arg = (const char *)(copy_end - argslen) + argvsize;
1517 remaining = argslen - argvsize;
1518 current_arg_len = strnlen(current_arg, remaining);
1519 if (current_arg_len < remaining) {
1520 /* We have space for the null terminator */
1521 current_arg_len += 1;
1522
1523 if (current_arg_index == 0) {
1524 /* The bare executable path may have multiple null bytes after it for alignment */
1525 while (current_arg_len < remaining && current_arg[current_arg_len] == 0) {
1526 current_arg_len += 1;
1527 }
1528 }
1529 }
1530 argvsize += current_arg_len;
1531 }
1532 assert(argvsize <= argslen);
1533
1534 /* Adjust argslen and copy_end to make the copyout range extend to the end of argv */
1535 copy_end = copy_end - argslen + argvsize;
1536 argslen = argvsize;
1537 }
1538
1539 if (where == USER_ADDR_NULL) {
1540 /* Skip copyout */
1541 goto calculate_size;
1542 }
1543
1544 if (buflen >= argslen) {
1545 data = (caddr_t) (copy_end - argslen);
1546 size = argslen;
1547 } else {
1548 /*
1549 * Before rdar://25397314, this function contained incorrect logic when buflen is less
1550 * than argslen. The problem was that it copied in `buflen` bytes from the end of the target
1551 * process user stack into the beginning of a buffer of size round_page(buflen), and then
1552 * copied out `buflen` bytes from the end of this buffer. The effect of this was that
1553 * the caller of this sysctl would get zeros at the end of their buffer.
1554 *
1555 * To preserve this behavior, bzero everything from copy_end-round_page(buflen)+buflen to the
1556 * end of the buffer. This emulates copying in only `buflen` bytes.
1557 *
1558 *
1559 * In the old code:
1560 *
1561 * copy_start .... size: round_page(buflen) .... copy_end
1562 * [---copied in data (size: buflen)---|--- zeros ----------]
1563 * ^
1564 * data = copy_end - buflen
1565 *
1566 *
1567 * In the new code:
1568 * copy_start .... size: round_page(p->argslen) .... full copy_end
1569 * ^ ....................... p->argslen ...............................^
1570 * ^ ^ truncated copy_end ^
1571 * ^ ^ ^ ^
1572 * ^ ................ argslen ........................ ^
1573 * ^ ^ ^ ^
1574 * [-------copied in data (size: round_page(p->argslen))-------:----env vars---]
1575 * ^ ^
1576 * ^ data = copy_end - buflen
1577 * smallbuffer_start = max(copy_end - round_page(buflen), copy_start)
1578 *
1579 *
1580 * Full copy_end: copy_end calculated from copy_start + round_page(p->argslen)
1581 * Truncated copy_end: copy_end after truncation to remove environment variables.
1582 *
1583 * If environment variables were omitted, then we use the truncated copy_end, otherwise
1584 * we use full copy_end.
1585 *
1586 * smallbuffer_start: represents where copy_start would be in the old code.
1587 * data: The beginning of the region we copyout
1588 */
1589 smallbuffer_start = copy_end - vm_map_round_page(buflen, effective_page_mask);
1590 if (smallbuffer_start < copy_start) {
1591 smallbuffer_start = copy_start;
1592 }
1593 bzero((void *)(smallbuffer_start + buflen), copy_end - (smallbuffer_start + buflen));
1594 data = (caddr_t) (copy_end - buflen);
1595 size = buflen;
1596 }
1597
1598 if (argc_yes) {
1599 /* Put processes argc as the first word in the copyout buffer */
1600 suword(where, argc);
1601 error = copyout(data, (where + sizeof(int)), size);
1602 size += sizeof(int);
1603 } else {
1604 error = copyout(data, where, size);
1605
1606 /*
1607 * Make the old PROCARGS work to return the executable's path
1608 * But, only if there is enough space in the provided buffer
1609 *
1610 * on entry: data [possibily] points to the beginning of the path
1611 *
1612 * Note: we keep all pointers&sizes aligned to word boundries
1613 */
1614 if ((!error) && (buflen > 0 && (u_int)buflen > size)) {
1615 int binPath_sz, alignedBinPath_sz = 0;
1616 int extraSpaceNeeded, addThis;
1617 user_addr_t placeHere;
1618 char * str = (char *) data;
1619 size_t max_len = size;
1620
1621 /* Some apps are really bad about messing up their stacks
1622 * So, we have to be extra careful about getting the length
1623 * of the executing binary. If we encounter an error, we bail.
1624 */
1625
1626 /* Limit ourselves to PATH_MAX paths */
1627 if (max_len > PATH_MAX) {
1628 max_len = PATH_MAX;
1629 }
1630
1631 binPath_sz = 0;
1632
1633 while ((binPath_sz < max_len - 1) && (*str++ != 0)) {
1634 binPath_sz++;
1635 }
1636
1637 /* If we have a NUL terminator, copy it, too */
1638 if (binPath_sz < max_len - 1) {
1639 binPath_sz += 1;
1640 }
1641
1642 /* Pre-Flight the space requiremnts */
1643
1644 /* Account for the padding that fills out binPath to the next word */
1645 alignedBinPath_sz += (binPath_sz & (sizeof(int) - 1)) ? (sizeof(int) - (binPath_sz & (sizeof(int) - 1))) : 0;
1646
1647 placeHere = where + size;
1648
1649 /* Account for the bytes needed to keep placeHere word aligned */
1650 addThis = (placeHere & (sizeof(int) - 1)) ? (sizeof(int) - (placeHere & (sizeof(int) - 1))) : 0;
1651
1652 /* Add up all the space that is needed */
1653 extraSpaceNeeded = alignedBinPath_sz + addThis + binPath_sz + (4 * sizeof(int));
1654
1655 /* is there is room to tack on argv[0]? */
1656 if ((buflen & ~(sizeof(int) - 1)) >= (size + extraSpaceNeeded)) {
1657 placeHere += addThis;
1658 suword(placeHere, 0);
1659 placeHere += sizeof(int);
1660 suword(placeHere, 0xBFFF0000);
1661 placeHere += sizeof(int);
1662 suword(placeHere, 0);
1663 placeHere += sizeof(int);
1664 error = copyout(data, placeHere, binPath_sz);
1665 if (!error) {
1666 placeHere += binPath_sz;
1667 suword(placeHere, 0);
1668 size += extraSpaceNeeded;
1669 }
1670 }
1671 }
1672 }
1673
1674 calculate_size:
1675 /* Size has already been calculated for the where != NULL case */
1676 if (where == USER_ADDR_NULL) {
1677 size = argslen;
1678 if (argc_yes) {
1679 size += sizeof(int);
1680 } else {
1681 /*
1682 * old PROCARGS will return the executable's path and plus some
1683 * extra space for work alignment and data tags
1684 */
1685 size += PATH_MAX + (6 * sizeof(int));
1686 }
1687 size += (size & (sizeof(int) - 1)) ? (sizeof(int) - (size & (sizeof(int) - 1))) : 0;
1688 }
1689
1690 *sizep = size;
1691
1692 finish:
1693 if (p != NULL) {
1694 proc_rele(p);
1695 }
1696 if (tmp != NULL) {
1697 vm_map_copy_discard(tmp);
1698 }
1699 if (proc_map != NULL) {
1700 vm_map_deallocate(proc_map);
1701 }
1702 if (copy_start != (vm_offset_t) 0) {
1703 kmem_free(kernel_map, copy_start, arg_size);
1704 }
1705 return error;
1706 }
1707
1708
1709 /*
1710 * Max number of concurrent aio requests
1711 */
1712 STATIC int
1713 sysctl_aiomax
1714 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1715 {
1716 int new_value, changed;
1717 int error = sysctl_io_number(req, aio_max_requests, sizeof(int), &new_value, &changed);
1718 if (changed) {
1719 /* make sure the system-wide limit is greater than the per process limit */
1720 if (new_value >= aio_max_requests_per_process && new_value <= AIO_MAX_REQUESTS) {
1721 aio_max_requests = new_value;
1722 } else {
1723 error = EINVAL;
1724 }
1725 }
1726 return error;
1727 }
1728
1729
1730 /*
1731 * Max number of concurrent aio requests per process
1732 */
1733 STATIC int
1734 sysctl_aioprocmax
1735 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1736 {
1737 int new_value, changed;
1738 int error = sysctl_io_number(req, aio_max_requests_per_process, sizeof(int), &new_value, &changed);
1739 if (changed) {
1740 /* make sure per process limit is less than the system-wide limit */
1741 if (new_value <= aio_max_requests && new_value >= AIO_LISTIO_MAX) {
1742 aio_max_requests_per_process = new_value;
1743 } else {
1744 error = EINVAL;
1745 }
1746 }
1747 return error;
1748 }
1749
1750
1751 /*
1752 * Max number of async IO worker threads
1753 */
1754 STATIC int
1755 sysctl_aiothreads
1756 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1757 {
1758 int new_value, changed;
1759 int error = sysctl_io_number(req, aio_worker_threads, sizeof(int), &new_value, &changed);
1760 if (changed) {
1761 /* we only allow an increase in the number of worker threads */
1762 if (new_value > aio_worker_threads) {
1763 _aio_create_worker_threads((new_value - aio_worker_threads));
1764 aio_worker_threads = new_value;
1765 } else {
1766 error = EINVAL;
1767 }
1768 }
1769 return error;
1770 }
1771
1772
1773 /*
1774 * System-wide limit on the max number of processes
1775 */
1776 STATIC int
1777 sysctl_maxproc
1778 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1779 {
1780 int new_value, changed;
1781 int error = sysctl_io_number(req, maxproc, sizeof(int), &new_value, &changed);
1782 if (changed) {
1783 AUDIT_ARG(value32, new_value);
1784 /* make sure the system-wide limit is less than the configured hard
1785 * limit set at kernel compilation */
1786 if (new_value <= hard_maxproc && new_value > 0) {
1787 maxproc = new_value;
1788 } else {
1789 error = EINVAL;
1790 }
1791 }
1792 return error;
1793 }
1794
1795 extern int sched_enable_smt;
1796 STATIC int
1797 sysctl_sched_enable_smt
1798 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1799 {
1800 int new_value, changed;
1801 int error = sysctl_io_number(req, sched_enable_smt, sizeof(int), &new_value, &changed);
1802 if (error) {
1803 return error;
1804 }
1805 kern_return_t kret = KERN_SUCCESS;
1806 if (changed) {
1807 AUDIT_ARG(value32, new_value);
1808 if (new_value == 0) {
1809 sched_enable_smt = 0;
1810 kret = enable_smt_processors(false);
1811 } else {
1812 sched_enable_smt = 1;
1813 kret = enable_smt_processors(true);
1814 }
1815 }
1816 switch (kret) {
1817 case KERN_SUCCESS:
1818 error = 0;
1819 break;
1820 case KERN_INVALID_ARGUMENT:
1821 error = EINVAL;
1822 break;
1823 case KERN_FAILURE:
1824 error = EBUSY;
1825 break;
1826 default:
1827 error = ENOENT;
1828 break;
1829 }
1830
1831 return error;
1832 }
1833
1834 SYSCTL_STRING(_kern, KERN_OSTYPE, ostype,
1835 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1836 ostype, 0, "");
1837 SYSCTL_STRING(_kern, KERN_OSRELEASE, osrelease,
1838 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1839 osrelease, 0, "");
1840 SYSCTL_INT(_kern, KERN_OSREV, osrevision,
1841 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1842 (int *)NULL, BSD, "");
1843 SYSCTL_STRING(_kern, KERN_VERSION, version,
1844 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1845 version, 0, "");
1846 SYSCTL_STRING(_kern, OID_AUTO, uuid,
1847 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1848 &kernel_uuid_string[0], 0, "");
1849
1850 SYSCTL_STRING(_kern, OID_AUTO, osbuildconfig,
1851 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLFLAG_MASKED,
1852 &osbuild_config[0], 0, "");
1853
1854 #if DEBUG
1855 #ifndef DKPR
1856 #define DKPR 1
1857 #endif
1858 #endif
1859
#if DKPR
int debug_kprint_syscall = 0;
char debug_kprint_syscall_process[MAXCOMLEN + 1];

/* Thread safe: bits and string value are not used to reclaim state */
SYSCTL_INT(_debug, OID_AUTO, kprint_syscall,
    CTLFLAG_RW | CTLFLAG_LOCKED, &debug_kprint_syscall, 0,
    "kprintf syscall tracing");
SYSCTL_STRING(_debug, OID_AUTO, kprint_syscall_process,
    CTLFLAG_RW | CTLFLAG_LOCKED,
    debug_kprint_syscall_process, sizeof(debug_kprint_syscall_process),
    "name of process for kprintf syscall tracing");

/*
 * Decide whether the current process should be traced.
 *
 * Returns 1 to trace and 0 to skip.  When tracing, *namep (if namep is
 * non-NULL) is set to the process name when all processes are traced, or to
 * NULL when tracing was scoped to this process by name.
 */
int
debug_kprint_current_process(const char **namep)
{
	struct proc *self = current_proc();

	if (self == NULL) {
		return 0;
	}

	if (debug_kprint_syscall_process[0] == '\0') {
		/* trace all processes. Tell user what we traced */
		if (namep) {
			*namep = self->p_comm;
		}
		return 1;
	}

	/* user asked to scope tracing to a particular process name */
	if (strncmp(debug_kprint_syscall_process,
	    self->p_comm, sizeof(debug_kprint_syscall_process)) != 0) {
		return 0;
	}

	/* no value in telling the user that we traced what they asked */
	if (namep) {
		*namep = NULL;
	}
	return 1;
}
#endif
1903
1904 /* PR-5293665: need to use a callback function for kern.osversion to set
1905 * osversion in IORegistry */
1906
1907 STATIC int
1908 sysctl_osversion(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
1909 {
1910 int rval = 0;
1911
1912 rval = sysctl_handle_string(oidp, arg1, arg2, req);
1913
1914 if (req->newptr) {
1915 IORegistrySetOSBuildVersion((char *)arg1);
1916 }
1917
1918 return rval;
1919 }
1920
1921 SYSCTL_PROC(_kern, KERN_OSVERSION, osversion,
1922 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
1923 osversion, 256 /* OSVERSIZE*/,
1924 sysctl_osversion, "A", "");
1925
1926 static bool
1927 _already_set_or_not_launchd(struct sysctl_req *req, char *val)
1928 {
1929 if (req->newptr != 0) {
1930 /*
1931 * Can only ever be set by launchd, and only once at boot.
1932 */
1933 if (proc_getpid(req->p) != 1 || val[0] != '\0') {
1934 return true;
1935 }
1936 }
1937 return false;
1938 }
1939
1940 #define kRootsInstalledReadWriteEntitlement "com.apple.private.roots-installed-read-write"
1941 #define kRootsInstalledReadOnlyEntitlement "com.apple.private.roots-installed-read-only"
1942 uint64_t roots_installed = 0;
1943
1944 static int
1945 sysctl_roots_installed
1946 (__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
1947 {
1948 int error = 0;
1949
1950 if (req->newptr != 0) {
1951 /* a ReadWrite entitlement is required for updating this syscl
1952 * meanwhile, only allow write once
1953 */
1954 if (!IOCurrentTaskHasEntitlement(kRootsInstalledReadWriteEntitlement) || (roots_installed != 0)) {
1955 return EPERM;
1956 }
1957 } else {
1958 /* for reader of this sysctl, need either ReadWrite or ReadOnly entitlement */
1959 if (!IOCurrentTaskHasEntitlement(kRootsInstalledReadWriteEntitlement) &&
1960 !IOCurrentTaskHasEntitlement(kRootsInstalledReadOnlyEntitlement)) {
1961 return EPERM;
1962 }
1963 }
1964
1965 error = sysctl_handle_quad(oidp, arg1, arg2, req);
1966
1967 return error;
1968 }
1969
1970 SYSCTL_PROC(_kern, OID_AUTO, roots_installed,
1971 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
1972 &roots_installed, sizeof(roots_installed),
1973 sysctl_roots_installed, "Q", "");
1974
1975 #if XNU_TARGET_OS_OSX
1976 static int
1977 sysctl_system_version_compat
1978 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1979 {
1980 int oldval = (task_has_system_version_compat_enabled(current_task()));
1981 int new_value = 0, changed = 0;
1982
1983 int error = sysctl_io_number(req, oldval, sizeof(int), &new_value, &changed);
1984 if (changed) {
1985 task_set_system_version_compat_enabled(current_task(), (new_value));
1986 }
1987 return error;
1988 }
1989
1990 SYSCTL_PROC(_kern, OID_AUTO, system_version_compat,
1991 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
1992 0, 0, sysctl_system_version_compat, "A", "");
1993
1994 char osproductversioncompat[48] = { '\0' };
1995
1996 static int
1997 sysctl_osproductversioncompat(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
1998 {
1999 if (_already_set_or_not_launchd(req, osproductversioncompat)) {
2000 return EPERM;
2001 }
2002 return sysctl_handle_string(oidp, arg1, arg2, req);
2003 }
2004
2005
2006 SYSCTL_PROC(_kern, OID_AUTO, osproductversioncompat,
2007 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2008 osproductversioncompat, sizeof(osproductversioncompat),
2009 sysctl_osproductversioncompat, "A", "The ProductVersion from SystemVersionCompat.plist");
2010 #endif
2011
2012 char osproductversion[48] = { '\0' };
2013
2014 static char iossupportversion_string[48] = { '\0' };
2015
2016 static int
2017 sysctl_osproductversion(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2018 {
2019 if (_already_set_or_not_launchd(req, osproductversion)) {
2020 return EPERM;
2021 }
2022
2023 #if XNU_TARGET_OS_OSX
2024 if (task_has_system_version_compat_enabled(current_task()) && (osproductversioncompat[0] != '\0')) {
2025 return sysctl_handle_string(oidp, osproductversioncompat, arg2, req);
2026 } else {
2027 return sysctl_handle_string(oidp, arg1, arg2, req);
2028 }
2029 #else
2030 return sysctl_handle_string(oidp, arg1, arg2, req);
2031 #endif
2032 }
2033
2034 #if XNU_TARGET_OS_OSX
2035 static_assert(sizeof(osproductversioncompat) == sizeof(osproductversion),
2036 "osproductversion size matches osproductversioncompat size");
2037 #endif
2038
2039 SYSCTL_PROC(_kern, OID_AUTO, osproductversion,
2040 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2041 osproductversion, sizeof(osproductversion),
2042 sysctl_osproductversion, "A", "The ProductVersion from SystemVersion.plist");
2043
2044 char osreleasetype[48] = { '\0' };
2045
2046 STATIC int
2047 sysctl_osreleasetype(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2048 {
2049 if (_already_set_or_not_launchd(req, osreleasetype)) {
2050 return EPERM;
2051 }
2052 return sysctl_handle_string(oidp, arg1, arg2, req);
2053 }
2054
2055 void reset_osreleasetype(void);
2056
2057 void
2058 reset_osreleasetype(void)
2059 {
2060 memset(osreleasetype, 0, sizeof(osreleasetype));
2061 }
2062
2063 SYSCTL_PROC(_kern, OID_AUTO, osreleasetype,
2064 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2065 osreleasetype, sizeof(osreleasetype),
2066 sysctl_osreleasetype, "A", "The ReleaseType from SystemVersion.plist");
2067
2068 STATIC int
2069 sysctl_iossupportversion(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2070 {
2071 if (_already_set_or_not_launchd(req, iossupportversion_string)) {
2072 return EPERM;
2073 }
2074
2075 return sysctl_handle_string(oidp, arg1, arg2, req);
2076 }
2077
2078 SYSCTL_PROC(_kern, OID_AUTO, iossupportversion,
2079 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2080 iossupportversion_string, sizeof(iossupportversion_string),
2081 sysctl_iossupportversion, "A", "The iOSSupportVersion from SystemVersion.plist");
2082
2083 static uint64_t osvariant_status = 0;
2084
2085 STATIC int
2086 sysctl_osvariant_status(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2087 {
2088 if (req->newptr != 0) {
2089 /*
2090 * Can only ever be set by launchd, and only once.
2091 * Reset by usrctl() -> reset_osvariant_status() during
2092 * userspace reboot, since userspace could reboot into
2093 * a different variant.
2094 */
2095 if (proc_getpid(req->p) != 1 || osvariant_status != 0) {
2096 return EPERM;
2097 }
2098 }
2099
2100 int err = sysctl_handle_quad(oidp, arg1, arg2, req);
2101
2102 reset_debug_syscall_rejection_mode();
2103
2104 return err;
2105 }
2106
2107 SYSCTL_PROC(_kern, OID_AUTO, osvariant_status,
2108 CTLFLAG_RW | CTLTYPE_QUAD | CTLFLAG_LOCKED | CTLFLAG_MASKED,
2109 &osvariant_status, sizeof(osvariant_status),
2110 sysctl_osvariant_status, "Q", "Opaque flags used to cache OS variant information");
2111
2112 static bool
2113 _os_variant_check_disabled(enum os_variant_property property)
2114 {
2115 return (osvariant_status >> (32 + property)) & 0x1;
2116 }
2117
2118 static bool
2119 _os_variant_has(enum os_variant_status_flags_positions p)
2120 {
2121 return ((osvariant_status >> (p * OS_VARIANT_STATUS_BIT_WIDTH)) & OS_VARIANT_STATUS_MASK) == OS_VARIANT_S_YES;
2122 }
2123
2124 bool
2125 os_variant_has_internal_diagnostics(__unused const char *subsystem)
2126 {
2127 if (_os_variant_check_disabled(OS_VARIANT_PROPERTY_DIAGNOSTICS)) {
2128 return false;
2129 }
2130 #if XNU_TARGET_OS_OSX
2131 return _os_variant_has(OS_VARIANT_SFP_INTERNAL_CONTENT) || _os_variant_has(OS_VARIANT_SFP_INTERNAL_DIAGS_PROFILE);
2132 #else
2133 return _os_variant_has(OS_VARIANT_SFP_INTERNAL_RELEASE_TYPE);
2134 #endif /* XNU_TARGET_OS_OSX */
2135 }
2136
2137 void reset_osvariant_status(void);
2138
2139 void
2140 reset_osvariant_status(void)
2141 {
2142 osvariant_status = 0;
2143 reset_debug_syscall_rejection_mode();
2144 }
2145
2146 extern void commpage_update_dyld_flags(uint64_t);
2147 TUNABLE_WRITEABLE(uint64_t, dyld_flags, "dyld_flags", 0);
2148
2149 STATIC int
2150 sysctl_dyld_flags(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2151 {
2152 /*
2153 * Can only ever be set by launchd, possibly several times
2154 * as dyld may change its mind after a userspace reboot.
2155 */
2156 if (req->newptr != 0 && proc_getpid(req->p) != 1) {
2157 return EPERM;
2158 }
2159
2160 int res = sysctl_handle_quad(oidp, arg1, arg2, req);
2161 if (req->newptr && res == 0) {
2162 commpage_update_dyld_flags(dyld_flags);
2163 }
2164 return res;
2165 }
2166
2167 SYSCTL_PROC(_kern, OID_AUTO, dyld_flags,
2168 CTLFLAG_RW | CTLTYPE_QUAD | CTLFLAG_LOCKED | CTLFLAG_MASKED,
2169 &dyld_flags, sizeof(dyld_flags),
2170 sysctl_dyld_flags, "Q", "Opaque flags used to cache dyld system-wide configuration");
2171
2172 #if defined(XNU_TARGET_OS_BRIDGE)
2173 char macosproductversion[MACOS_VERS_LEN] = { '\0' };
2174
2175 SYSCTL_STRING(_kern, OID_AUTO, macosproductversion,
2176 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2177 &macosproductversion[0], MACOS_VERS_LEN, "The currently running macOS ProductVersion (from SystemVersion.plist on macOS)");
2178
2179 char macosversion[MACOS_VERS_LEN] = { '\0' };
2180
2181 SYSCTL_STRING(_kern, OID_AUTO, macosversion,
2182 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2183 &macosversion[0], MACOS_VERS_LEN, "The currently running macOS build version");
2184 #endif
2185
2186 STATIC int
2187 sysctl_sysctl_bootargs
2188 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2189 {
2190 int error;
2191 char buf[BOOT_LINE_LENGTH];
2192
2193 strlcpy(buf, PE_boot_args(), BOOT_LINE_LENGTH);
2194 error = sysctl_io_string(req, buf, BOOT_LINE_LENGTH, 0, NULL);
2195 return error;
2196 }
2197
2198 SYSCTL_PROC(_kern, OID_AUTO, bootargs,
2199 CTLFLAG_LOCKED | CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING,
2200 NULL, 0,
2201 sysctl_sysctl_bootargs, "A", "bootargs");
2202
2203 STATIC int
2204 sysctl_kernelcacheuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2205 {
2206 int rval = ENOENT;
2207 if (kernelcache_uuid_valid) {
2208 rval = sysctl_handle_string(oidp, arg1, arg2, req);
2209 }
2210 return rval;
2211 }
2212
2213 SYSCTL_PROC(_kern, OID_AUTO, kernelcacheuuid,
2214 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2215 kernelcache_uuid_string, sizeof(kernelcache_uuid_string),
2216 sysctl_kernelcacheuuid, "A", "");
2217
2218 STATIC int
2219 sysctl_systemfilesetuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2220 {
2221 int rval = ENOENT;
2222 if (pageablekc_uuid_valid) {
2223 rval = sysctl_handle_string(oidp, arg1, arg2, req);
2224 }
2225 return rval;
2226 }
2227
2228 SYSCTL_PROC(_kern, OID_AUTO, systemfilesetuuid,
2229 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2230 pageablekc_uuid_string, sizeof(pageablekc_uuid_string),
2231 sysctl_systemfilesetuuid, "A", "");
2232
2233 STATIC int
2234 sysctl_auxiliaryfilesetuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2235 {
2236 int rval = ENOENT;
2237 if (auxkc_uuid_valid) {
2238 rval = sysctl_handle_string(oidp, arg1, arg2, req);
2239 }
2240 return rval;
2241 }
2242
2243 SYSCTL_PROC(_kern, OID_AUTO, auxiliaryfilesetuuid,
2244 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2245 auxkc_uuid_string, sizeof(auxkc_uuid_string),
2246 sysctl_auxiliaryfilesetuuid, "A", "");
2247
2248 STATIC int
2249 sysctl_filesetuuid(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2250 {
2251 int rval = ENOENT;
2252 kc_format_t kcformat;
2253 kernel_mach_header_t *mh;
2254 void *uuid = NULL;
2255 unsigned long uuidlen = 0;
2256 uuid_string_t uuid_str;
2257
2258 if (!PE_get_primary_kc_format(&kcformat) || kcformat != KCFormatFileset) {
2259 return rval;
2260 }
2261
2262 mh = (kernel_mach_header_t *)PE_get_kc_header(KCKindPrimary);
2263 uuid = getuuidfromheader(mh, &uuidlen);
2264
2265 if ((uuid != NULL) && (uuidlen == sizeof(uuid_t))) {
2266 uuid_unparse_upper(*(uuid_t *)uuid, uuid_str);
2267 rval = sysctl_io_string(req, (char *)uuid_str, sizeof(uuid_str), 0, NULL);
2268 }
2269
2270 return rval;
2271 }
2272
2273 SYSCTL_PROC(_kern, OID_AUTO, filesetuuid,
2274 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2275 NULL, 0,
2276 sysctl_filesetuuid, "A", "");
2277
2278
2279 SYSCTL_INT(_kern, KERN_MAXFILES, maxfiles,
2280 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2281 &maxfiles, 0, "");
2282 SYSCTL_INT(_kern, KERN_ARGMAX, argmax,
2283 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2284 (int *)NULL, ARG_MAX, "");
2285 SYSCTL_INT(_kern, KERN_POSIX1, posix1version,
2286 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2287 (int *)NULL, _POSIX_VERSION, "");
2288 SYSCTL_INT(_kern, KERN_NGROUPS, ngroups,
2289 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2290 (int *)NULL, NGROUPS_MAX, "");
2291 SYSCTL_INT(_kern, KERN_JOB_CONTROL, job_control,
2292 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2293 (int *)NULL, 1, "");
2294 #if 1 /* _POSIX_SAVED_IDS from <unistd.h> */
2295 SYSCTL_INT(_kern, KERN_SAVED_IDS, saved_ids,
2296 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2297 (int *)NULL, 1, "");
2298 #else
2299 SYSCTL_INT(_kern, KERN_SAVED_IDS, saved_ids,
2300 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2301 NULL, 0, "");
2302 #endif
2303 SYSCTL_INT(_kern, OID_AUTO, num_files,
2304 CTLFLAG_RD | CTLFLAG_LOCKED,
2305 &nfiles, 0, "");
2306 SYSCTL_COMPAT_INT(_kern, OID_AUTO, num_vnodes,
2307 CTLFLAG_RD | CTLFLAG_LOCKED,
2308 &numvnodes, 0, "");
2309 SYSCTL_INT(_kern, OID_AUTO, num_tasks,
2310 CTLFLAG_RD | CTLFLAG_LOCKED,
2311 &task_max, 0, "");
2312 SYSCTL_INT(_kern, OID_AUTO, num_threads,
2313 CTLFLAG_RD | CTLFLAG_LOCKED,
2314 &thread_max, 0, "");
2315 SYSCTL_INT(_kern, OID_AUTO, num_taskthreads,
2316 CTLFLAG_RD | CTLFLAG_LOCKED,
2317 &task_threadmax, 0, "");
2318 SYSCTL_LONG(_kern, OID_AUTO, num_recycledvnodes,
2319 CTLFLAG_RD | CTLFLAG_LOCKED,
2320 &num_recycledvnodes, "");
2321 SYSCTL_COMPAT_INT(_kern, OID_AUTO, free_vnodes,
2322 CTLFLAG_RD | CTLFLAG_LOCKED,
2323 &freevnodes, 0, "");
2324
2325 STATIC int
2326 sysctl_maxvnodes(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2327 {
2328 int oldval = desiredvnodes;
2329 int error = sysctl_io_number(req, desiredvnodes, sizeof(int), &desiredvnodes, NULL);
2330
2331 if (oldval != desiredvnodes) {
2332 resize_namecache(desiredvnodes);
2333 }
2334
2335 return error;
2336 }
2337
2338 SYSCTL_INT(_kern, OID_AUTO, namecache_disabled,
2339 CTLFLAG_RW | CTLFLAG_LOCKED,
2340 &nc_disabled, 0, "");
2341
2342 SYSCTL_PROC(_kern, KERN_MAXVNODES, maxvnodes,
2343 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2344 0, 0, sysctl_maxvnodes, "I", "");
2345
2346 SYSCTL_PROC(_kern, KERN_MAXPROC, maxproc,
2347 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2348 0, 0, sysctl_maxproc, "I", "");
2349
2350 SYSCTL_PROC(_kern, KERN_AIOMAX, aiomax,
2351 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2352 0, 0, sysctl_aiomax, "I", "");
2353
2354 SYSCTL_PROC(_kern, KERN_AIOPROCMAX, aioprocmax,
2355 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2356 0, 0, sysctl_aioprocmax, "I", "");
2357
2358 SYSCTL_PROC(_kern, KERN_AIOTHREADS, aiothreads,
2359 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2360 0, 0, sysctl_aiothreads, "I", "");
2361
2362 SYSCTL_PROC(_kern, OID_AUTO, sched_enable_smt,
2363 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_KERN,
2364 0, 0, sysctl_sched_enable_smt, "I", "");
2365
2366 extern int sched_allow_NO_SMT_threads;
2367 SYSCTL_INT(_kern, OID_AUTO, sched_allow_NO_SMT_threads,
2368 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2369 &sched_allow_NO_SMT_threads, 0, "");
2370
2371 extern int sched_avoid_cpu0;
2372 SYSCTL_INT(_kern, OID_AUTO, sched_rt_avoid_cpu0,
2373 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2374 &sched_avoid_cpu0, 0, "If 1, choose cpu0 after all other primaries; if 2, choose cpu0 and cpu1 last, after all other cpus including secondaries");
2375
2376 #if (DEVELOPMENT || DEBUG)
2377
2378 static int
2379 sysctl_kern_max_unsafe_rt_quanta(__unused struct sysctl_oid *oidp,
2380 __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2381 {
2382 extern void sched_set_max_unsafe_rt_quanta(int);
2383 extern int max_unsafe_rt_quanta;
2384
2385 int new_value, changed;
2386 int old_value = max_unsafe_rt_quanta;
2387 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value,
2388 &changed);
2389 if (changed) {
2390 sched_set_max_unsafe_rt_quanta(new_value);
2391 }
2392
2393 return error;
2394 }
2395
2396 SYSCTL_PROC(_kern, OID_AUTO, max_unsafe_rt_quanta,
2397 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2398 0, 0, sysctl_kern_max_unsafe_rt_quanta, "I",
2399 "Number of quanta to allow a realtime "
2400 "thread to run before being penalized");
2401
2402 static int
2403 sysctl_kern_max_unsafe_fixed_quanta(__unused struct sysctl_oid *oidp,
2404 __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2405 {
2406 extern void sched_set_max_unsafe_fixed_quanta(int);
2407 extern int max_unsafe_fixed_quanta;
2408
2409 int new_value, changed;
2410 int old_value = max_unsafe_fixed_quanta;
2411 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value,
2412 &changed);
2413 if (changed) {
2414 sched_set_max_unsafe_fixed_quanta(new_value);
2415 }
2416
2417 return error;
2418 }
2419
2420 SYSCTL_PROC(_kern, OID_AUTO, max_unsafe_fixed_quanta,
2421 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2422 0, 0, sysctl_kern_max_unsafe_fixed_quanta, "I",
2423 "Number of quanta to allow a fixed sched mode "
2424 "thread to run before being penalized");
2425
2426 static int
2427 sysctl_kern_quantum_us(__unused struct sysctl_oid *oidp, __unused void *arg1,
2428 __unused int arg2, struct sysctl_req *req)
2429 {
2430 extern uint64_t sysctl_get_quantum_us(void);
2431 const uint64_t quantum_us = sysctl_get_quantum_us();
2432
2433 return sysctl_io_number(req, quantum_us, sizeof(quantum_us), NULL, NULL);
2434 }
2435
2436 SYSCTL_PROC(_kern, OID_AUTO, quantum_us,
2437 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
2438 0, 0, sysctl_kern_quantum_us, "Q",
2439 "Length of scheduling quantum in microseconds");
2440
2441 extern int smt_sched_bonus_16ths;
2442 SYSCTL_INT(_kern, OID_AUTO, smt_sched_bonus_16ths,
2443 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2444 &smt_sched_bonus_16ths, 0, "");
2445
2446 extern int smt_timeshare_enabled;
2447 SYSCTL_INT(_kern, OID_AUTO, sched_smt_timeshare_enable,
2448 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2449 &smt_timeshare_enabled, 0, "");
2450
2451 extern int sched_smt_balance;
2452 SYSCTL_INT(_kern, OID_AUTO, sched_smt_balance,
2453 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2454 &sched_smt_balance, 0, "");
2455 extern int sched_allow_rt_smt;
2456 SYSCTL_INT(_kern, OID_AUTO, sched_allow_rt_smt,
2457 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2458 &sched_allow_rt_smt, 0, "");
2459 extern int sched_allow_rt_steal;
2460 SYSCTL_INT(_kern, OID_AUTO, sched_allow_rt_steal,
2461 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2462 &sched_allow_rt_steal, 0, "");
2463 extern int sched_backup_cpu_timeout_count;
2464 SYSCTL_INT(_kern, OID_AUTO, sched_backup_cpu_timeout_count,
2465 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2466 &sched_backup_cpu_timeout_count, 0, "The maximum number of 10us delays before allowing a backup cpu to select a thread");
2467 #if __arm64__
2468 /* Scheduler perfcontrol callouts sysctls */
2469 SYSCTL_DECL(_kern_perfcontrol_callout);
2470 SYSCTL_NODE(_kern, OID_AUTO, perfcontrol_callout, CTLFLAG_RW | CTLFLAG_LOCKED, 0,
2471 "scheduler perfcontrol callouts");
2472
2473 extern int perfcontrol_callout_stats_enabled;
2474 SYSCTL_INT(_kern_perfcontrol_callout, OID_AUTO, stats_enabled,
2475 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2476 &perfcontrol_callout_stats_enabled, 0, "");
2477
2478 extern uint64_t perfcontrol_callout_stat_avg(perfcontrol_callout_type_t type,
2479 perfcontrol_callout_stat_t stat);
2480
2481 /* On-Core Callout */
2482 STATIC int
2483 sysctl_perfcontrol_callout_stat
2484 (__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2485 {
2486 perfcontrol_callout_stat_t stat = (perfcontrol_callout_stat_t)arg1;
2487 perfcontrol_callout_type_t type = (perfcontrol_callout_type_t)arg2;
2488 return sysctl_io_number(req, (int)perfcontrol_callout_stat_avg(type, stat),
2489 sizeof(int), NULL, NULL);
2490 }
2491
2492 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, oncore_instr,
2493 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2494 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_ON_CORE,
2495 sysctl_perfcontrol_callout_stat, "I", "");
2496 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, oncore_cycles,
2497 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2498 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_ON_CORE,
2499 sysctl_perfcontrol_callout_stat, "I", "");
2500 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, offcore_instr,
2501 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2502 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_OFF_CORE,
2503 sysctl_perfcontrol_callout_stat, "I", "");
2504 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, offcore_cycles,
2505 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2506 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_OFF_CORE,
2507 sysctl_perfcontrol_callout_stat, "I", "");
2508 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, context_instr,
2509 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2510 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_CONTEXT,
2511 sysctl_perfcontrol_callout_stat, "I", "");
2512 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, context_cycles,
2513 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2514 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_CONTEXT,
2515 sysctl_perfcontrol_callout_stat, "I", "");
2516 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, update_instr,
2517 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2518 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_STATE_UPDATE,
2519 sysctl_perfcontrol_callout_stat, "I", "");
2520 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, update_cycles,
2521 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2522 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_STATE_UPDATE,
2523 sysctl_perfcontrol_callout_stat, "I", "");
2524
2525 #if __AMP__
2526 extern int sched_amp_idle_steal;
2527 SYSCTL_INT(_kern, OID_AUTO, sched_amp_idle_steal,
2528 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2529 &sched_amp_idle_steal, 0, "");
2530 extern int sched_amp_spill_steal;
2531 SYSCTL_INT(_kern, OID_AUTO, sched_amp_spill_steal,
2532 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2533 &sched_amp_spill_steal, 0, "");
2534 extern int sched_amp_spill_count;
2535 SYSCTL_INT(_kern, OID_AUTO, sched_amp_spill_count,
2536 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2537 &sched_amp_spill_count, 0, "");
2538 extern int sched_amp_spill_deferred_ipi;
2539 SYSCTL_INT(_kern, OID_AUTO, sched_amp_spill_deferred_ipi,
2540 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2541 &sched_amp_spill_deferred_ipi, 0, "");
2542 extern int sched_amp_pcores_preempt_immediate_ipi;
2543 SYSCTL_INT(_kern, OID_AUTO, sched_amp_pcores_preempt_immediate_ipi,
2544 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2545 &sched_amp_pcores_preempt_immediate_ipi, 0, "");
2546 #endif /* __AMP__ */
2547 #endif /* __arm64__ */
2548
2549 #if __arm64__
2550 extern int legacy_footprint_entitlement_mode;
2551 SYSCTL_INT(_kern, OID_AUTO, legacy_footprint_entitlement_mode,
2552 CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2553 &legacy_footprint_entitlement_mode, 0, "");
2554 #endif /* __arm64__ */
2555
2556 /*
2557 * Realtime threads are ordered by highest priority first then,
2558 * for threads of the same priority, by earliest deadline first.
2559 * But if sched_rt_runq_strict_priority is false (the default),
2560 * a lower priority thread with an earlier deadline will be preferred
2561 * over a higher priority thread with a later deadline, as long as
2562 * both threads' computations will fit before the later deadline.
2563 */
2564 extern int sched_rt_runq_strict_priority;
2565 SYSCTL_INT(_kern, OID_AUTO, sched_rt_runq_strict_priority,
2566 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2567 &sched_rt_runq_strict_priority, 0, "");
2568
2569 static int
2570 sysctl_kern_sched_rt_n_backup_processors(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2571 {
2572 int new_value, changed;
2573 int old_value = sched_get_rt_n_backup_processors();
2574 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2575 if (changed) {
2576 sched_set_rt_n_backup_processors(new_value);
2577 }
2578
2579 return error;
2580 }
2581
2582 SYSCTL_PROC(_kern, OID_AUTO, sched_rt_n_backup_processors,
2583 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2584 0, 0, sysctl_kern_sched_rt_n_backup_processors, "I", "");
2585
2586 static int
2587 sysctl_kern_sched_rt_deadline_epsilon_us(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2588 {
2589 int new_value, changed;
2590 int old_value = sched_get_rt_deadline_epsilon();
2591 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2592 if (changed) {
2593 sched_set_rt_deadline_epsilon(new_value);
2594 }
2595
2596 return error;
2597 }
2598
2599 SYSCTL_PROC(_kern, OID_AUTO, sched_rt_deadline_epsilon_us,
2600 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2601 0, 0, sysctl_kern_sched_rt_deadline_epsilon_us, "I", "");
2602
2603 extern int sched_idle_delay_cpuid;
2604 SYSCTL_INT(_kern, OID_AUTO, sched_idle_delay_cpuid,
2605 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2606 &sched_idle_delay_cpuid, 0, "This cpuid will be delayed by 500us on exiting idle, to simulate interrupt or preemption delays when testing the scheduler");
2607
2608 static int
2609 sysctl_kern_sched_powered_cores(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2610 {
2611 int new_value, changed;
2612 int old_value = sched_get_powered_cores();
2613 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2614 if (changed) {
2615 sched_set_powered_cores(new_value);
2616 }
2617
2618 return error;
2619 }
2620
2621 SYSCTL_PROC(_kern, OID_AUTO, sched_powered_cores,
2622 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2623 0, 0, sysctl_kern_sched_powered_cores, "I", "");
2624
2625 #endif /* (DEVELOPMENT || DEBUG) */
2626
2627 extern uint64_t perfcontrol_requested_recommended_cores;
2628 SYSCTL_QUAD(_kern, OID_AUTO, sched_recommended_cores,
2629 CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2630 &perfcontrol_requested_recommended_cores, "");
2631
2632 static int
2633 sysctl_kern_suspend_cluster_powerdown(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2634 {
2635 int new_value, changed;
2636 int old_value = get_cluster_powerdown_user_suspended();
2637 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2638 if (!error && changed) {
2639 if (new_value > 0) {
2640 error = suspend_cluster_powerdown_from_user();
2641 } else {
2642 error = resume_cluster_powerdown_from_user();
2643 }
2644 if (error) {
2645 error = EALREADY;
2646 }
2647 }
2648
2649 return error;
2650 }
2651
2652 SYSCTL_PROC(_kern, OID_AUTO, suspend_cluster_powerdown,
2653 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2654 0, 0, sysctl_kern_suspend_cluster_powerdown, "I", "");
2655
2656
2657 STATIC int
2658 sysctl_securelvl
2659 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2660 {
2661 int new_value, changed;
2662 int error = sysctl_io_number(req, securelevel, sizeof(int), &new_value, &changed);
2663 if (changed) {
2664 if (!(new_value < securelevel && proc_getpid(req->p) != 1)) {
2665 proc_list_lock();
2666 securelevel = new_value;
2667 proc_list_unlock();
2668 } else {
2669 error = EPERM;
2670 }
2671 }
2672 return error;
2673 }
2674
2675 SYSCTL_PROC(_kern, KERN_SECURELVL, securelevel,
2676 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2677 0, 0, sysctl_securelvl, "I", "");
2678
2679
2680 STATIC int
2681 sysctl_domainname
2682 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2683 {
2684 int error, changed;
2685 char tmpname[MAXHOSTNAMELEN] = {};
2686
2687 lck_mtx_lock(&domainname_lock);
2688 strlcpy(tmpname, domainname, sizeof(tmpname));
2689 lck_mtx_unlock(&domainname_lock);
2690
2691 error = sysctl_io_string(req, tmpname, sizeof(tmpname), 0, &changed);
2692 if (!error && changed) {
2693 lck_mtx_lock(&domainname_lock);
2694 strlcpy(domainname, tmpname, sizeof(domainname));
2695 lck_mtx_unlock(&domainname_lock);
2696 }
2697 return error;
2698 }
2699
2700 SYSCTL_PROC(_kern, KERN_DOMAINNAME, nisdomainname,
2701 CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_LOCKED,
2702 0, 0, sysctl_domainname, "A", "");
2703
2704 SYSCTL_COMPAT_INT(_kern, KERN_HOSTID, hostid,
2705 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2706 &hostid, 0, "");
2707
2708 STATIC int
2709 sysctl_hostname
2710 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2711 {
2712 int error, changed;
2713 char tmpname[MAXHOSTNAMELEN] = {};
2714 const char * name;
2715
2716 #if XNU_TARGET_OS_OSX
2717 name = hostname;
2718 #else /* XNU_TARGET_OS_OSX */
2719 #define ENTITLEMENT_USER_ASSIGNED_DEVICE_NAME \
2720 "com.apple.developer.device-information.user-assigned-device-name"
2721 if (csproc_get_platform_binary(current_proc()) ||
2722 IOCurrentTaskHasEntitlement(ENTITLEMENT_USER_ASSIGNED_DEVICE_NAME)) {
2723 name = hostname;
2724 } else {
2725 name = "localhost";
2726 }
2727 #endif /* ! XNU_TARGET_OS_OSX */
2728
2729 lck_mtx_lock(&hostname_lock);
2730 strlcpy(tmpname, name, sizeof(tmpname));
2731 lck_mtx_unlock(&hostname_lock);
2732
2733 error = sysctl_io_string(req, tmpname, sizeof(tmpname), 1, &changed);
2734 if (!error && changed) {
2735 lck_mtx_lock(&hostname_lock);
2736 strlcpy(hostname, tmpname, sizeof(hostname));
2737 lck_mtx_unlock(&hostname_lock);
2738 }
2739 return error;
2740 }
2741
2742 SYSCTL_PROC(_kern, KERN_HOSTNAME, hostname,
2743 CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_LOCKED,
2744 0, 0, sysctl_hostname, "A", "");
2745
2746 STATIC int
2747 sysctl_procname
2748 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2749 {
2750 /* Original code allowed writing, I'm copying this, although this all makes
2751 * no sense to me. Besides, this sysctl is never used. */
2752 return sysctl_io_string(req, &req->p->p_name[0], (2 * MAXCOMLEN + 1), 1, NULL);
2753 }
2754
2755 SYSCTL_PROC(_kern, KERN_PROCNAME, procname,
2756 CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
2757 0, 0, sysctl_procname, "A", "");
2758
2759 SYSCTL_INT(_kern, KERN_SPECULATIVE_READS, speculative_reads_disabled,
2760 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2761 &speculative_reads_disabled, 0, "");
2762
2763 SYSCTL_UINT(_kern, OID_AUTO, preheat_max_bytes,
2764 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2765 &preheat_max_bytes, 0, "");
2766
2767 SYSCTL_UINT(_kern, OID_AUTO, preheat_min_bytes,
2768 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2769 &preheat_min_bytes, 0, "");
2770
2771 SYSCTL_UINT(_kern, OID_AUTO, speculative_prefetch_max,
2772 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2773 &speculative_prefetch_max, 0, "");
2774
2775 SYSCTL_UINT(_kern, OID_AUTO, speculative_prefetch_max_iosize,
2776 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2777 &speculative_prefetch_max_iosize, 0, "");
2778
2779 SYSCTL_UINT(_kern, OID_AUTO, vm_page_free_target,
2780 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2781 &vm_page_free_target, 0, "");
2782
2783 SYSCTL_UINT(_kern, OID_AUTO, vm_page_free_min,
2784 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2785 &vm_page_free_min, 0, "");
2786
2787 SYSCTL_UINT(_kern, OID_AUTO, vm_page_free_reserved,
2788 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2789 &vm_page_free_reserved, 0, "");
2790
2791 SYSCTL_UINT(_kern, OID_AUTO, vm_page_speculative_percentage,
2792 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2793 &vm_pageout_state.vm_page_speculative_percentage, 0, "");
2794
2795 SYSCTL_UINT(_kern, OID_AUTO, vm_page_speculative_q_age_ms,
2796 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2797 &vm_pageout_state.vm_page_speculative_q_age_ms, 0, "");
2798
2799 SYSCTL_UINT(_kern, OID_AUTO, vm_max_delayed_work_limit,
2800 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2801 &vm_max_delayed_work_limit, 0, "");
2802
2803 SYSCTL_UINT(_kern, OID_AUTO, vm_max_batch,
2804 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2805 &vm_max_batch, 0, "");
2806
2807 SYSCTL_STRING(_kern, OID_AUTO, bootsessionuuid,
2808 CTLFLAG_RD | CTLFLAG_LOCKED,
2809 &bootsessionuuid_string, sizeof(bootsessionuuid_string), "");
2810
2811
2812 STATIC int
2813 sysctl_boottime
2814 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2815 {
2816 struct timeval tv;
2817 boottime_timeval(&tv);
2818 struct proc *p = req->p;
2819
2820 if (proc_is64bit(p)) {
2821 struct user64_timeval t = {};
2822 t.tv_sec = tv.tv_sec;
2823 t.tv_usec = tv.tv_usec;
2824 return sysctl_io_opaque(req, &t, sizeof(t), NULL);
2825 } else {
2826 struct user32_timeval t = {};
2827 t.tv_sec = (user32_time_t)tv.tv_sec;
2828 t.tv_usec = tv.tv_usec;
2829 return sysctl_io_opaque(req, &t, sizeof(t), NULL);
2830 }
2831 }
2832
2833 SYSCTL_PROC(_kern, KERN_BOOTTIME, boottime,
2834 CTLTYPE_STRUCT | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2835 0, 0, sysctl_boottime, "S,timeval", "");
2836
2837 extern bool IOGetBootUUID(char *);
2838
2839 /* non-static: written by imageboot.c */
2840 uuid_string_t fake_bootuuid;
2841
2842 STATIC int
2843 sysctl_bootuuid
2844 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2845 {
2846 int error = ENOENT;
2847
2848 /* check the first byte to see if the string has been
2849 * populated. this is a uuid_STRING_t, this check would
2850 * not work with a uuid_t.
2851 */
2852 if (fake_bootuuid[0] != '\0') {
2853 error = sysctl_io_string(req, fake_bootuuid, 0, 0, NULL);
2854 goto out;
2855 }
2856
2857 uuid_string_t uuid_string;
2858 if (IOGetBootUUID(uuid_string)) {
2859 uuid_t boot_uuid;
2860 error = uuid_parse(uuid_string, boot_uuid);
2861 if (!error) {
2862 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2863 }
2864 }
2865
2866 out:
2867 return error;
2868 }
2869
2870 SYSCTL_PROC(_kern, OID_AUTO, bootuuid,
2871 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2872 0, 0, sysctl_bootuuid, "A", "");
2873
2874
2875 extern bool IOGetApfsPrebootUUID(char *);
2876 extern bool IOGetAssociatedApfsVolgroupUUID(char *);
2877
2878 STATIC int
2879 sysctl_apfsprebootuuid
2880 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2881 {
2882 int error = ENOENT;
2883
2884 uuid_string_t uuid_string;
2885 if (IOGetApfsPrebootUUID(uuid_string)) {
2886 uuid_t apfs_preboot_uuid;
2887 error = uuid_parse(uuid_string, apfs_preboot_uuid);
2888 if (!error) {
2889 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2890 }
2891 }
2892
2893 return error;
2894 }
2895
2896 SYSCTL_PROC(_kern, OID_AUTO, apfsprebootuuid,
2897 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2898 0, 0, sysctl_apfsprebootuuid, "A", "");
2899
2900 STATIC int
2901 sysctl_targetsystemvolgroupuuid
2902 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2903 {
2904 int error = ENOENT;
2905
2906 uuid_string_t uuid_string;
2907 if (IOGetApfsPrebootUUID(uuid_string)) {
2908 uuid_t apfs_preboot_uuid;
2909 error = uuid_parse(uuid_string, apfs_preboot_uuid);
2910 if (!error) {
2911 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2912 }
2913 } else {
2914 /*
2915 * In special boot modes, such as kcgen-mode, the
2916 * apfs-preboot-uuid property will not be set. Instead, a
2917 * different property, associated-volume-group, will be set
2918 * which indicates the UUID of the VolumeGroup containing the
2919 * system volume into which you will boot.
2920 */
2921 if (IOGetAssociatedApfsVolgroupUUID(uuid_string)) {
2922 uuid_t apfs_preboot_uuid;
2923 error = uuid_parse(uuid_string, apfs_preboot_uuid);
2924 if (!error) {
2925 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2926 }
2927 }
2928 }
2929
2930 return error;
2931 }
2932
2933 SYSCTL_PROC(_kern, OID_AUTO, targetsystemvolgroupuuid,
2934 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_MASKED | CTLFLAG_LOCKED,
2935 0, 0, sysctl_targetsystemvolgroupuuid, "A", "");
2936
2937
2938 extern bool IOGetBootManifestHash(char *, size_t *);
2939 extern bool IOGetBootObjectsPath(char *);
2940
2941 STATIC int
2942 sysctl_bootobjectspath
2943 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2944 {
2945 int error = ENOENT;
2946
2947 #if defined(__x86_64__)
2948 /* auth-root-dmg is used for the Intel BaseSystem in some flows,
2949 * e.g. createinstallmedia and as part of upgrading from 10.15 or earlier
2950 * under these scenarios, set_fake_bootuuid will be called when pivoting to
2951 * the new root filesystem. need honor the fake bootuuid.
2952 */
2953 if (fake_bootuuid[0] != '\0') {
2954 error = sysctl_io_string(req, fake_bootuuid, 0, 0, NULL);
2955 } else {
2956 /* for intel mac, boot objects reside in [preboot volume]/[bootuuid]
2957 * bootuuid and apfsprebootuuid are populated by efiboot and they are alias.
2958 */
2959 uuid_string_t uuid_string;
2960 if (IOGetBootUUID(uuid_string)) {
2961 uuid_t boot_uuid;
2962 error = uuid_parse(uuid_string, boot_uuid);
2963 if (!error) {
2964 error = sysctl_io_string(req, (char *)uuid_string, 0, 0, NULL);
2965 }
2966 }
2967 }
2968 #else
2969 char boot_obj_path[MAXPATHLEN] = { "\0" };
2970 static const char kAsciiHexChars[] = "0123456789ABCDEF";
2971 unsigned int i, j;
2972
2973 /* Hashed with SHA2-384 or SHA1, boot manifest hash is 48 bytes or 20 bytes
2974 * hence, need a 97 bytes char array for the string.
2975 */
2976 size_t hash_data_size = CCSHA384_OUTPUT_SIZE;
2977 char hash_data[CCSHA384_OUTPUT_SIZE] = { "\0" };
2978 char boot_manifest_hash[CCSHA384_OUTPUT_SIZE * 2 + 1] = { "\0" };;
2979
2980 /* for Apple Silicon Macs, there is a boot-objects-path under IODeviceTree:/chosen
2981 * and boot objects reside in [preboot volume]/[boot-objects-path]
2982 * for embedded platforms, there would be a boot-manifest-hash under IODeviceTree:/chosen
2983 * and boot objects reside in [preboot volume]/[boot-manifest-hash]
2984 */
2985 if (IOGetBootObjectsPath(boot_obj_path)) {
2986 error = sysctl_io_string(req, (char *)boot_obj_path, 0, 0, NULL);
2987 } else if (IOGetBootManifestHash(hash_data, &hash_data_size)) {
2988 j = 0;
2989 for (i = 0; i < hash_data_size; ++i) {
2990 char octet = hash_data[i];
2991 boot_manifest_hash[j++] = kAsciiHexChars[((octet & 0xF0) >> 4)];
2992 boot_manifest_hash[j++] = kAsciiHexChars[(octet & 0x0F)];
2993 }
2994 /* make sure string has null termination */
2995 boot_manifest_hash[j] = '\0';
2996 error = sysctl_io_string(req, (char *)boot_manifest_hash, 0, 0, NULL);
2997 }
2998 #endif
2999 return error;
3000 }
3001
3002 SYSCTL_PROC(_kern, OID_AUTO, bootobjectspath,
3003 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
3004 0, 0, sysctl_bootobjectspath, "A", "");
3005
3006
3007 STATIC int
3008 sysctl_symfile
3009 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3010 {
3011 char *str;
3012 int error = get_kernel_symfile(req->p, &str);
3013 if (error) {
3014 return error;
3015 }
3016 return sysctl_io_string(req, str, 0, 0, NULL);
3017 }
3018
3019
3020 SYSCTL_PROC(_kern, KERN_SYMFILE, symfile,
3021 CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_LOCKED,
3022 0, 0, sysctl_symfile, "A", "");
3023
#if CONFIG_NETBOOT
/*
 * kern.netboot handler: reports the value of netboot_root() as a read-only
 * int (no new-value pointer is supplied to sysctl_io_number()).
 */
STATIC int
sysctl_netboot(__unused struct sysctl_oid *oidp, __unused void *arg1,
    __unused int arg2, struct sysctl_req *req)
{
	return sysctl_io_number(req, netboot_root(), sizeof(int),
	           NULL, NULL);
}

SYSCTL_PROC(_kern, KERN_NETBOOT, netboot,
    CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
    0, 0, sysctl_netboot, "I", "");
#endif
3036
3037 #ifdef CONFIG_IMGSRC_ACCESS
3038 /*
3039 * Legacy--act as if only one layer of nesting is possible.
3040 */
3041 STATIC int
3042 sysctl_imgsrcdev
3043 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3044 {
3045 vfs_context_t ctx = vfs_context_current();
3046 vnode_t devvp;
3047 int result;
3048
3049 if (!vfs_context_issuser(ctx)) {
3050 return EPERM;
3051 }
3052
3053 if (imgsrc_rootvnodes[0] == NULL) {
3054 return ENOENT;
3055 }
3056
3057 result = vnode_getwithref(imgsrc_rootvnodes[0]);
3058 if (result != 0) {
3059 return result;
3060 }
3061
3062 devvp = vnode_mount(imgsrc_rootvnodes[0])->mnt_devvp;
3063 result = vnode_getwithref(devvp);
3064 if (result != 0) {
3065 goto out;
3066 }
3067
3068 result = sysctl_io_number(req, vnode_specrdev(devvp), sizeof(dev_t), NULL, NULL);
3069
3070 vnode_put(devvp);
3071 out:
3072 vnode_put(imgsrc_rootvnodes[0]);
3073 return result;
3074 }
3075
3076 SYSCTL_PROC(_kern, OID_AUTO, imgsrcdev,
3077 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
3078 0, 0, sysctl_imgsrcdev, "I", "");
3079
3080 STATIC int
3081 sysctl_imgsrcinfo
3082 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3083 {
3084 int error;
3085 struct imgsrc_info info[MAX_IMAGEBOOT_NESTING] = {}; /* 2 for now, no problem */
3086 uint32_t i;
3087 vnode_t rvp, devvp;
3088
3089 if (imgsrc_rootvnodes[0] == NULLVP) {
3090 return ENXIO;
3091 }
3092
3093 for (i = 0; i < MAX_IMAGEBOOT_NESTING; i++) {
3094 /*
3095 * Go get the root vnode.
3096 */
3097 rvp = imgsrc_rootvnodes[i];
3098 if (rvp == NULLVP) {
3099 break;
3100 }
3101
3102 error = vnode_get(rvp);
3103 if (error != 0) {
3104 return error;
3105 }
3106
3107 /*
3108 * For now, no getting at a non-local volume.
3109 */
3110 devvp = vnode_mount(rvp)->mnt_devvp;
3111 if (devvp == NULL) {
3112 vnode_put(rvp);
3113 return EINVAL;
3114 }
3115
3116 error = vnode_getwithref(devvp);
3117 if (error != 0) {
3118 vnode_put(rvp);
3119 return error;
3120 }
3121
3122 /*
3123 * Fill in info.
3124 */
3125 info[i].ii_dev = vnode_specrdev(devvp);
3126 info[i].ii_flags = 0;
3127 info[i].ii_height = i;
3128 bzero(info[i].ii_reserved, sizeof(info[i].ii_reserved));
3129
3130 vnode_put(devvp);
3131 vnode_put(rvp);
3132 }
3133
3134 return sysctl_io_opaque(req, info, i * sizeof(info[0]), NULL);
3135 }
3136
3137 SYSCTL_PROC(_kern, OID_AUTO, imgsrcinfo,
3138 CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_LOCKED,
3139 0, 0, sysctl_imgsrcinfo, "I", "");
3140
3141 #endif /* CONFIG_IMGSRC_ACCESS */
3142
3143
/* kern.timer: parent node for the timer OIDs registered below. */
SYSCTL_DECL(_kern_timer);
SYSCTL_NODE(_kern, OID_AUTO, timer, CTLFLAG_RW | CTLFLAG_LOCKED, 0, "timer");


/* kern.timer.coalescing_enabled: backed by mach_timer_coalescing_enabled. */
SYSCTL_INT(_kern_timer, OID_AUTO, coalescing_enabled,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &mach_timer_coalescing_enabled, 0, "");

/* 64-bit OIDs backed by timer_deadline_tracking_bin_1 / _bin_2. */
SYSCTL_QUAD(_kern_timer, OID_AUTO, deadline_tracking_bin_1,
    CTLFLAG_RW | CTLFLAG_LOCKED,
    &timer_deadline_tracking_bin_1, "");
SYSCTL_QUAD(_kern_timer, OID_AUTO, deadline_tracking_bin_2,
    CTLFLAG_RW | CTLFLAG_LOCKED,
    &timer_deadline_tracking_bin_2, "");

/* kern.timer.longterm: sub-node for the long-term timer OIDs. */
SYSCTL_DECL(_kern_timer_longterm);
SYSCTL_NODE(_kern_timer, OID_AUTO, longterm, CTLFLAG_RW | CTLFLAG_LOCKED, 0, "longterm");
3161
3162
3163 /* Must match definition in osfmk/kern/timer_call.c */
3164 enum {
3165 THRESHOLD, QCOUNT,
3166 ENQUEUES, DEQUEUES, ESCALATES, SCANS, PREEMPTS,
3167 LATENCY, LATENCY_MIN, LATENCY_MAX, LONG_TERM_SCAN_LIMIT,
3168 LONG_TERM_SCAN_INTERVAL, LONG_TERM_SCAN_PAUSES,
3169 SCAN_LIMIT, SCAN_INTERVAL, SCAN_PAUSES, SCAN_POSTPONES,
3170 };
3171 extern uint64_t timer_sysctl_get(int);
3172 extern int timer_sysctl_set(int, uint64_t);
3173
3174 STATIC int
3175 sysctl_timer
3176 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3177 {
3178 int oid = (int)arg1;
3179 uint64_t value = timer_sysctl_get(oid);
3180 uint64_t new_value;
3181 int error;
3182 int changed;
3183
3184 error = sysctl_io_number(req, value, sizeof(value), &new_value, &changed);
3185 if (changed) {
3186 error = timer_sysctl_set(oid, new_value);
3187 }
3188
3189 return error;
3190 }
3191
/*
 * kern.timer.longterm.* OIDs.  All are 64-bit values served by
 * sysctl_timer(); the selector constant is passed through arg1.
 */

/* Read/write long-term timer OIDs. */
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, threshold,
    CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
    (void *) THRESHOLD, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scan_limit,
    CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
    (void *) LONG_TERM_SCAN_LIMIT, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scan_interval,
    CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
    (void *) LONG_TERM_SCAN_INTERVAL, 0, sysctl_timer, "Q", "");

/* Read-only long-term timer OIDs. */
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, qlen,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) QCOUNT, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scan_pauses,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) LONG_TERM_SCAN_PAUSES, 0, sysctl_timer, "Q", "");

#if DEBUG
/* Additional read-only long-term timer OIDs, registered on DEBUG builds only. */
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, enqueues,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) ENQUEUES, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, dequeues,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) DEQUEUES, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, escalates,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) ESCALATES, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scans,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) SCANS, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, preempts,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) PREEMPTS, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, latency,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) LATENCY, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, latency_min,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) LATENCY_MIN, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, latency_max,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) LATENCY_MAX, 0, sysctl_timer, "Q", "");
#endif /* DEBUG */

/* kern.timer.* scan OIDs: the first two are read/write, the last two read-only. */
SYSCTL_PROC(_kern_timer, OID_AUTO, scan_limit,
    CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
    (void *) SCAN_LIMIT, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer, OID_AUTO, scan_interval,
    CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
    (void *) SCAN_INTERVAL, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer, OID_AUTO, scan_pauses,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) SCAN_PAUSES, 0, sysctl_timer, "Q", "");
SYSCTL_PROC(_kern_timer, OID_AUTO, scan_postpones,
    CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
    (void *) SCAN_POSTPONES, 0, sysctl_timer, "Q", "");
3248
3249 STATIC int
3250 sysctl_usrstack
3251 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3252 {
3253 return sysctl_io_number(req, (int)req->p->user_stack, sizeof(int), NULL, NULL);
3254 }
3255
3256 SYSCTL_PROC(_kern, KERN_USRSTACK32, usrstack,
3257 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
3258 0, 0, sysctl_usrstack, "I", "");
3259
3260 STATIC int
3261 sysctl_usrstack64
3262 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3263 {
3264 return sysctl_io_number(req, req->p->user_stack, sizeof(req->p->user_stack), NULL, NULL);
3265 }
3266
3267 SYSCTL_PROC(_kern, KERN_USRSTACK64, usrstack64,
3268 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3269 0, 0, sysctl_usrstack64, "Q", "");
3270
3271 #if CONFIG_COREDUMP
3272
/* kern.corefile: read/write string backed by the corefilename buffer. */
SYSCTL_STRING(_kern, KERN_COREFILE, corefile,
    CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
    corefilename, sizeof(corefilename), "");

/* kern.drivercorefile: read/write string backed by the drivercorefilename buffer. */
SYSCTL_STRING(_kern, OID_AUTO, drivercorefile,
    CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
    drivercorefilename, sizeof(drivercorefilename), "");
3280
3281 STATIC int
3282 sysctl_coredump
3283 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3284 {
3285 #ifdef SECURE_KERNEL
3286 (void)req;
3287 return ENOTSUP;
3288 #else
3289 int new_value, changed;
3290 int error = sysctl_io_number(req, do_coredump, sizeof(int), &new_value, &changed);
3291 if (changed) {
3292 if ((new_value == 0) || (new_value == 1)) {
3293 do_coredump = new_value;
3294 } else {
3295 error = EINVAL;
3296 }
3297 }
3298 return error;
3299 #endif
3300 }
3301
3302 SYSCTL_PROC(_kern, KERN_COREDUMP, coredump,
3303 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
3304 0, 0, sysctl_coredump, "I", "");
3305
3306 STATIC int
3307 sysctl_suid_coredump
3308 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3309 {
3310 #ifdef SECURE_KERNEL
3311 (void)req;
3312 return ENOTSUP;
3313 #else
3314 int new_value, changed;
3315 int error = sysctl_io_number(req, sugid_coredump, sizeof(int), &new_value, &changed);
3316 if (changed) {
3317 if ((new_value == 0) || (new_value == 1)) {
3318 sugid_coredump = new_value;
3319 } else {
3320 error = EINVAL;
3321 }
3322 }
3323 return error;
3324 #endif
3325 }
3326
3327 SYSCTL_PROC(_kern, KERN_SUGID_COREDUMP, sugid_coredump,
3328 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
3329 0, 0, sysctl_suid_coredump, "I", "");
3330
3331 #endif /* CONFIG_COREDUMP */
3332
3333 STATIC int
3334 sysctl_delayterm
3335 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3336 {
3337 struct proc *p = req->p;
3338 int new_value, changed;
3339 int error = sysctl_io_number(req, (req->p->p_lflag & P_LDELAYTERM)? 1: 0, sizeof(int), &new_value, &changed);
3340 if (changed) {
3341 proc_lock(p);
3342 if (new_value) {
3343 req->p->p_lflag |= P_LDELAYTERM;
3344 } else {
3345 req->p->p_lflag &= ~P_LDELAYTERM;
3346 }
3347 proc_unlock(p);
3348 }
3349 return error;
3350 }
3351
3352 SYSCTL_PROC(_kern, KERN_PROCDELAYTERM, delayterm,
3353 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
3354 0, 0, sysctl_delayterm, "I", "");
3355
3356
3357 STATIC int
3358 sysctl_rage_vnode
3359 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3360 {
3361 struct proc *p = req->p;
3362 struct uthread *ut;
3363 int new_value, old_value, changed;
3364 int error;
3365
3366 ut = current_uthread();
3367
3368 if (ut->uu_flag & UT_RAGE_VNODES) {
3369 old_value = KERN_RAGE_THREAD;
3370 } else if (p->p_lflag & P_LRAGE_VNODES) {
3371 old_value = KERN_RAGE_PROC;
3372 } else {
3373 old_value = 0;
3374 }
3375
3376 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
3377
3378 if ((error == 0) && (changed != 0)) {
3379 switch (new_value) {
3380 case KERN_RAGE_PROC:
3381 proc_lock(p);
3382 p->p_lflag |= P_LRAGE_VNODES;
3383 proc_unlock(p);
3384 break;
3385 case KERN_UNRAGE_PROC:
3386 proc_lock(p);
3387 p->p_lflag &= ~P_LRAGE_VNODES;
3388 proc_unlock(p);
3389 break;
3390
3391 case KERN_RAGE_THREAD:
3392 ut->uu_flag |= UT_RAGE_VNODES;
3393 break;
3394 case KERN_UNRAGE_THREAD:
3395 ut = current_uthread();
3396 ut->uu_flag &= ~UT_RAGE_VNODES;
3397 break;
3398 }
3399 }
3400 return error;
3401 }
3402
3403 SYSCTL_PROC(_kern, KERN_RAGEVNODE, rage_vnode,
3404 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
3405 0, 0, sysctl_rage_vnode, "I", "");
3406
3407 /* XXX until filecoordinationd fixes a bit of inverted logic. */
3408 STATIC int
3409 sysctl_vfsnspace
3410 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3411 {
3412 int old_value = 0, new_value, changed;
3413
3414 return sysctl_io_number(req, old_value, sizeof(int), &new_value,
3415 &changed);
3416 }
3417
3418 SYSCTL_PROC(_kern, OID_AUTO, vfsnspace,
3419 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
3420 0, 0, sysctl_vfsnspace, "I", "");
3421
3422 /* XXX move this interface into libproc and remove this sysctl */
3423 STATIC int
3424 sysctl_setthread_cpupercent
3425 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3426 {
3427 int new_value, old_value;
3428 int error = 0;
3429 kern_return_t kret = KERN_SUCCESS;
3430 uint8_t percent = 0;
3431 int ms_refill = 0;
3432
3433 if (!req->newptr) {
3434 return 0;
3435 }
3436
3437 old_value = 0;
3438
3439 if ((error = sysctl_io_number(req, old_value, sizeof(old_value), &new_value, NULL)) != 0) {
3440 return error;
3441 }
3442
3443 percent = new_value & 0xff; /* low 8 bytes for perent */
3444 ms_refill = (new_value >> 8) & 0xffffff; /* upper 24bytes represent ms refill value */
3445 if (percent > 100) {
3446 return EINVAL;
3447 }
3448
3449 /*
3450 * If the caller is specifying a percentage of 0, this will unset the CPU limit, if present.
3451 */
3452 kret = percent == 0 ?
3453 thread_set_cpulimit(THREAD_CPULIMIT_DISABLE, 0, 0) :
3454 thread_set_cpulimit(THREAD_CPULIMIT_BLOCK, percent, ms_refill * (int)NSEC_PER_MSEC);
3455
3456 if (kret != 0) {
3457 return EIO;
3458 }
3459
3460 return 0;
3461 }
3462
3463 SYSCTL_PROC(_kern, OID_AUTO, setthread_cpupercent,
3464 CTLTYPE_INT | CTLFLAG_WR | CTLFLAG_ANYBODY,
3465 0, 0, sysctl_setthread_cpupercent, "I", "set thread cpu percentage limit");
3466
3467
3468 STATIC int
3469 sysctl_kern_check_openevt
3470 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3471 {
3472 struct proc *p = req->p;
3473 int new_value, old_value, changed;
3474 int error;
3475
3476 if (p->p_flag & P_CHECKOPENEVT) {
3477 old_value = KERN_OPENEVT_PROC;
3478 } else {
3479 old_value = 0;
3480 }
3481
3482 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
3483
3484 if ((error == 0) && (changed != 0)) {
3485 switch (new_value) {
3486 case KERN_OPENEVT_PROC:
3487 OSBitOrAtomic(P_CHECKOPENEVT, &p->p_flag);
3488 break;
3489
3490 case KERN_UNOPENEVT_PROC:
3491 OSBitAndAtomic(~((uint32_t)P_CHECKOPENEVT), &p->p_flag);
3492 break;
3493
3494 default:
3495 error = EINVAL;
3496 }
3497 }
3498 return error;
3499 }
3500
3501 SYSCTL_PROC(_kern, KERN_CHECKOPENEVT, check_openevt, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
3502 0, 0, sysctl_kern_check_openevt, "I", "set the per-process check-open-evt flag");
3503
3504
#if DEVELOPMENT || DEBUG
/*
 * kern.nx handler (DEVELOPMENT/DEBUG builds only).
 *
 * On SECURE_KERNEL builds the OID is unsupported (ENOTSUP).  Otherwise it
 * reports nx_enabled and stores a supplied new value into it.  On x86_64 a
 * write is refused with ENOTSUP when cpuid_extfeatures() does not report
 * CPUID_EXTFEATURE_XD.
 */
STATIC int
sysctl_nx(__unused struct sysctl_oid *oidp, __unused void *arg1,
    __unused int arg2, struct sysctl_req *req)
{
#ifdef SECURE_KERNEL
	(void)req;
	return ENOTSUP;
#else
	int requested, changed;
	int error = sysctl_io_number(req, nx_enabled, sizeof(nx_enabled), &requested, &changed);

	if (error || !changed) {
		return error;
	}

#if defined(__x86_64__)
	/*
	 * Only allow setting if NX is supported on the chip
	 */
	if (!(cpuid_extfeatures() & CPUID_EXTFEATURE_XD)) {
		return ENOTSUP;
	}
#endif
	nx_enabled = requested;
	return error;
#endif /* SECURE_KERNEL */
}

SYSCTL_PROC(_kern, KERN_NX_PROTECTION, nx,
    CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
    0, 0, sysctl_nx, "I", "");
#endif
3543
3544 STATIC int
3545 sysctl_loadavg
3546 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3547 {
3548 if (proc_is64bit(req->p)) {
3549 struct user64_loadavg loadinfo64 = {};
3550 fill_loadavg64(&averunnable, &loadinfo64);
3551 return sysctl_io_opaque(req, &loadinfo64, sizeof(loadinfo64), NULL);
3552 } else {
3553 struct user32_loadavg loadinfo32 = {};
3554 fill_loadavg32(&averunnable, &loadinfo32);
3555 return sysctl_io_opaque(req, &loadinfo32, sizeof(loadinfo32), NULL);
3556 }
3557 }
3558
3559 SYSCTL_PROC(_vm, VM_LOADAVG, loadavg,
3560 CTLTYPE_STRUCT | CTLFLAG_RD | CTLFLAG_LOCKED,
3561 0, 0, sysctl_loadavg, "S,loadavg", "");
3562
3563 /*
3564 * Note: Thread safe; vm_map_lock protects in vm_toggle_entry_reuse()
3565 */
3566 STATIC int
3567 sysctl_vm_toggle_address_reuse(__unused struct sysctl_oid *oidp, __unused void *arg1,
3568 __unused int arg2, struct sysctl_req *req)
3569 {
3570 int old_value = 0, new_value = 0, error = 0;
3571
3572 if (vm_toggle_entry_reuse( VM_TOGGLE_GETVALUE, &old_value )) {
3573 return error;
3574 }
3575 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, NULL);
3576 if (!error) {
3577 return vm_toggle_entry_reuse(new_value, NULL);
3578 }
3579 return error;
3580 }
3581
3582 SYSCTL_PROC(_debug, OID_AUTO, toggle_address_reuse, CTLFLAG_ANYBODY | CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, sysctl_vm_toggle_address_reuse, "I", "");
3583
3584 #ifdef CONFIG_XNUPOST
3585
3586 extern uint32_t xnupost_get_estimated_testdata_size(void);
3587 extern int xnupost_reset_all_tests(void);
3588
3589 STATIC int
3590 sysctl_handle_xnupost_get_tests SYSCTL_HANDLER_ARGS
3591 {
3592 /* fixup unused arguments warnings */
3593 __unused int _oa2 = arg2;
3594 __unused void * _oa1 = arg1;
3595 __unused struct sysctl_oid * _oidp = oidp;
3596
3597 int error = 0;
3598 user_addr_t oldp = 0;
3599 user_addr_t newp = 0;
3600 uint32_t usedbytes = 0;
3601
3602 oldp = req->oldptr;
3603 newp = req->newptr;
3604
3605 if (newp) {
3606 return ENOTSUP;
3607 }
3608
3609 if ((void *)oldp == NULL) {
3610 /* return estimated size for second call where info can be placed */
3611 req->oldidx = xnupost_get_estimated_testdata_size();
3612 } else {
3613 error = xnupost_export_testdata((void *)oldp, req->oldlen, &usedbytes);
3614 req->oldidx = usedbytes;
3615 }
3616
3617 return error;
3618 }
3619
3620 SYSCTL_PROC(_debug,
3621 OID_AUTO,
3622 xnupost_get_tests,
3623 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_LOCKED,
3624 0,
3625 0,
3626 sysctl_handle_xnupost_get_tests,
3627 "-",
3628 "read xnupost test data in kernel");
3629
#if CONFIG_EXT_PANICLOG
/*
 * Extensible panic log test hooks
 *
 * debug.ext_paniclog_test_hook handler: reads an integer test option via
 * sysctl_handle_int() and, when the request carried a new value, passes it
 * to ext_paniclog_test_hook().
 *
 * Returns the sysctl_handle_int() result, or the ext_paniclog_test_hook()
 * result when the hook was invoked.
 */
static int
sysctl_debug_ext_paniclog_test_hook SYSCTL_HANDLER_ARGS
{
#pragma unused(arg1, arg2)
	int rval = 0;
	uint32_t test_option = 0;

	rval = sysctl_handle_int(oidp, &test_option, 0, req);

	if (rval == 0 && req->newptr) {
		rval = ext_paniclog_test_hook(test_option);
	}

	return rval;
}

/*
 * The OID is CTLTYPE_INT and is serviced by sysctl_handle_int(), so the
 * format string is "I" (int) rather than "A" (string).
 */
SYSCTL_PROC(_debug, OID_AUTO, ext_paniclog_test_hook,
    CTLTYPE_INT | CTLFLAG_RW,
    0, 0,
    sysctl_debug_ext_paniclog_test_hook, "I", "ext paniclog test hook");

#endif
3656
3657 STATIC int
3658 sysctl_debug_xnupost_ctl SYSCTL_HANDLER_ARGS
3659 {
3660 /* fixup unused arguments warnings */
3661 __unused int _oa2 = arg2;
3662 __unused void * _oa1 = arg1;
3663 __unused struct sysctl_oid * _oidp = oidp;
3664
3665 #define ARRCOUNT 4
3666 /*
3667 * INPUT: ACTION, PARAM1, PARAM2, PARAM3
3668 * OUTPUT: RESULTCODE, ADDITIONAL DATA
3669 */
3670 int32_t outval[ARRCOUNT] = {0};
3671 int32_t input[ARRCOUNT] = {0};
3672 int32_t out_size = sizeof(outval);
3673 int32_t in_size = sizeof(input);
3674 int error = 0;
3675
3676 /* if this is NULL call to find out size, send out size info */
3677 if (!req->newptr) {
3678 goto out;
3679 }
3680
3681 /* pull in provided value from userspace */
3682 error = SYSCTL_IN(req, &input[0], in_size);
3683 if (error) {
3684 return error;
3685 }
3686
3687 if (input[0] == XTCTL_RESET_TESTDATA) {
3688 outval[0] = xnupost_reset_all_tests();
3689 goto out;
3690 }
3691
3692 out:
3693 error = SYSCTL_OUT(req, &outval[0], out_size);
3694 return error;
3695 }
3696
3697 SYSCTL_PROC(_debug,
3698 OID_AUTO,
3699 xnupost_testctl,
3700 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_OPAQUE | CTLFLAG_RW | CTLFLAG_LOCKED,
3701 0,
3702 0,
3703 sysctl_debug_xnupost_ctl,
3704 "I",
3705 "xnupost control for kernel testing");
3706
3707 extern void test_oslog_handleOSLogCtl(int32_t * in, int32_t * out, int32_t arraycount);
3708
3709 STATIC int
3710 sysctl_debug_test_oslog_ctl(__unused struct sysctl_oid * oidp, __unused void * arg1, __unused int arg2, struct sysctl_req * req)
3711 {
3712 #define ARRCOUNT 4
3713 int32_t outval[ARRCOUNT] = {0};
3714 int32_t input[ARRCOUNT] = {0};
3715 int32_t size_outval = sizeof(outval);
3716 int32_t size_inval = sizeof(input);
3717 int32_t error;
3718
3719 /* if this is NULL call to find out size, send out size info */
3720 if (!req->newptr) {
3721 error = SYSCTL_OUT(req, &outval[0], size_outval);
3722 return error;
3723 }
3724
3725 /* pull in provided value from userspace */
3726 error = SYSCTL_IN(req, &input[0], size_inval);
3727 if (error) {
3728 return error;
3729 }
3730
3731 test_oslog_handleOSLogCtl(input, outval, ARRCOUNT);
3732
3733 error = SYSCTL_OUT(req, &outval[0], size_outval);
3734
3735 return error;
3736 }
3737
3738 SYSCTL_PROC(_debug,
3739 OID_AUTO,
3740 test_OSLogCtl,
3741 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_OPAQUE | CTLFLAG_RW | CTLFLAG_LOCKED,
3742 0,
3743 0,
3744 sysctl_debug_test_oslog_ctl,
3745 "I",
3746 "testing oslog in kernel");
3747
#include <mach/task.h>
#include <mach/semaphore.h>

/*
 * Lock group for the stackshot owner test locks, and the mutex that
 * serializes their lazy initialization and teardown.
 */
static LCK_GRP_DECLARE(sysctl_debug_test_stackshot_owner_grp, "test-stackshot-owner-grp");
static LCK_MTX_DECLARE(sysctl_debug_test_stackshot_owner_init_mtx,
    &sysctl_debug_test_stackshot_owner_grp);

/* This is a sysctl for testing collection of owner info on a lock in kernel space. A multi-threaded
 * test from userland sets this sysctl in such a way that a thread blocks in kernel mode, and a
 * stackshot is taken to see if the owner of the lock can be identified.
 *
 * We can't return to userland with a kernel lock held, so be sure to unlock before we leave.
 * the semaphores allow us to artificially create cases where the lock is being held and the
 * thread is hanging / taking a long time to do something. */

/* Non-zero once the test mutex and semaphore below have been created. */
volatile char sysctl_debug_test_stackshot_mtx_inited = 0;
/* Semaphore a holder of the test mutex waits on until signalled. */
semaphore_t sysctl_debug_test_stackshot_mutex_sem;
/* The mutex whose owner the stackshot test tries to identify. */
lck_mtx_t sysctl_debug_test_stackshot_owner_lck;

/* Option values accepted by sysctl_debug_test_stackshot_mutex_owner(). */
#define SYSCTL_DEBUG_MTX_ACQUIRE_WAIT   1
#define SYSCTL_DEBUG_MTX_ACQUIRE_NOWAIT 2
#define SYSCTL_DEBUG_MTX_SIGNAL         3
#define SYSCTL_DEBUG_MTX_TEARDOWN       4
3771
/*
 * debug.test_MutexOwnerCtl handler.
 *
 * Read:  reports the unslid address of the test mutex.
 * Write: the written value selects an action:
 *   SYSCTL_DEBUG_MTX_ACQUIRE_NOWAIT  lock and immediately unlock the mutex
 *   SYSCTL_DEBUG_MTX_ACQUIRE_WAIT    lock, wait on the semaphore, unlock
 *   SYSCTL_DEBUG_MTX_SIGNAL          signal the semaphore
 *   SYSCTL_DEBUG_MTX_TEARDOWN        destroy the mutex and semaphore
 *   anything else                    EINVAL
 *
 * Returns the sysctl_io_number() error if it fails, EINVAL for an unknown
 * option, otherwise 0.
 */
STATIC int
sysctl_debug_test_stackshot_mutex_owner(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
{
	/* stays -1 when the request carries no new value (plain read) */
	long long option = -1;
	/* if the user tries to read the sysctl, we tell them what the address of the lock is (to test against stackshot's output) */
	long long mtx_unslid_addr = (long long)VM_KERNEL_UNSLIDE_OR_PERM(&sysctl_debug_test_stackshot_owner_lck);
	int error = sysctl_io_number(req, mtx_unslid_addr, sizeof(long long), (void*)&option, NULL);

	/*
	 * Lazily create the test mutex and semaphore under the init mutex.
	 * This runs on every call, even when sysctl_io_number() failed.
	 */
	lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);
	if (!sysctl_debug_test_stackshot_mtx_inited) {
		lck_mtx_init(&sysctl_debug_test_stackshot_owner_lck,
		    &sysctl_debug_test_stackshot_owner_grp,
		    LCK_ATTR_NULL);
		semaphore_create(kernel_task,
		    &sysctl_debug_test_stackshot_mutex_sem,
		    SYNC_POLICY_FIFO, 0);
		sysctl_debug_test_stackshot_mtx_inited = 1;
	}
	lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);

	if (!error) {
		switch (option) {
		case SYSCTL_DEBUG_MTX_ACQUIRE_NOWAIT:
			lck_mtx_lock(&sysctl_debug_test_stackshot_owner_lck);
			lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_lck);
			break;
		case SYSCTL_DEBUG_MTX_ACQUIRE_WAIT:
			/* hold the mutex until another request issues SYSCTL_DEBUG_MTX_SIGNAL */
			lck_mtx_lock(&sysctl_debug_test_stackshot_owner_lck);
			semaphore_wait(sysctl_debug_test_stackshot_mutex_sem);
			lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_lck);
			break;
		case SYSCTL_DEBUG_MTX_SIGNAL:
			semaphore_signal(sysctl_debug_test_stackshot_mutex_sem);
			break;
		case SYSCTL_DEBUG_MTX_TEARDOWN:
			/*
			 * NOTE(review): nothing here checks whether another
			 * thread still holds or waits on the test mutex --
			 * presumably the userland test guarantees that; confirm.
			 */
			lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);

			lck_mtx_destroy(&sysctl_debug_test_stackshot_owner_lck,
			    &sysctl_debug_test_stackshot_owner_grp);
			semaphore_destroy(kernel_task,
			    sysctl_debug_test_stackshot_mutex_sem);
			/* the next call re-creates both objects */
			sysctl_debug_test_stackshot_mtx_inited = 0;

			lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);
			break;
		case -1:         /* user just wanted to read the value, so do nothing */
			break;
		default:
			error = EINVAL;
			break;
		}
	}
	return error;
}

/* we can't return to userland with a kernel rwlock held, so be sure to unlock before we leave.
 * the semaphores allow us to artificially create cases where the lock is being held and the
 * thread is hanging / taking a long time to do something. */

SYSCTL_PROC(_debug,
    OID_AUTO,
    test_MutexOwnerCtl,
    CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
    0,
    0,
    sysctl_debug_test_stackshot_mutex_owner,
    "-",
    "Testing mutex owner in kernel");
3840
3841 volatile char sysctl_debug_test_stackshot_rwlck_inited = 0;
3842 lck_rw_t sysctl_debug_test_stackshot_owner_rwlck;
3843 semaphore_t sysctl_debug_test_stackshot_rwlck_sem;
3844
3845 #define SYSCTL_DEBUG_KRWLCK_RACQUIRE_NOWAIT 1
3846 #define SYSCTL_DEBUG_KRWLCK_RACQUIRE_WAIT 2
3847 #define SYSCTL_DEBUG_KRWLCK_WACQUIRE_NOWAIT 3
3848 #define SYSCTL_DEBUG_KRWLCK_WACQUIRE_WAIT 4
3849 #define SYSCTL_DEBUG_KRWLCK_SIGNAL 5
3850 #define SYSCTL_DEBUG_KRWLCK_TEARDOWN 6
3851
3852 STATIC int
3853 sysctl_debug_test_stackshot_rwlck_owner(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3854 {
3855 long long option = -1;
3856 /* if the user tries to read the sysctl, we tell them what the address of the lock is
3857 * (to test against stackshot's output) */
3858 long long rwlck_unslid_addr = (long long)VM_KERNEL_UNSLIDE_OR_PERM(&sysctl_debug_test_stackshot_owner_rwlck);
3859 int error = sysctl_io_number(req, rwlck_unslid_addr, sizeof(long long), (void*)&option, NULL);
3860
3861 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);
3862 if (!sysctl_debug_test_stackshot_rwlck_inited) {
3863 lck_rw_init(&sysctl_debug_test_stackshot_owner_rwlck,
3864 &sysctl_debug_test_stackshot_owner_grp,
3865 LCK_ATTR_NULL);
3866 semaphore_create(kernel_task,
3867 &sysctl_debug_test_stackshot_rwlck_sem,
3868 SYNC_POLICY_FIFO,
3869 0);
3870 sysctl_debug_test_stackshot_rwlck_inited = 1;
3871 }
3872 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);
3873
3874 if (!error) {
3875 switch (option) {
3876 case SYSCTL_DEBUG_KRWLCK_RACQUIRE_NOWAIT:
3877 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3878 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3879 break;
3880 case SYSCTL_DEBUG_KRWLCK_RACQUIRE_WAIT:
3881 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3882 semaphore_wait(sysctl_debug_test_stackshot_rwlck_sem);
3883 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3884 break;
3885 case SYSCTL_DEBUG_KRWLCK_WACQUIRE_NOWAIT:
3886 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3887 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3888 break;
3889 case SYSCTL_DEBUG_KRWLCK_WACQUIRE_WAIT:
3890 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3891 semaphore_wait(sysctl_debug_test_stackshot_rwlck_sem);
3892 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3893 break;
3894 case SYSCTL_DEBUG_KRWLCK_SIGNAL:
3895 semaphore_signal(sysctl_debug_test_stackshot_rwlck_sem);
3896 break;
3897 case SYSCTL_DEBUG_KRWLCK_TEARDOWN:
3898 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);
3899
3900 lck_rw_destroy(&sysctl_debug_test_stackshot_owner_rwlck,
3901 &sysctl_debug_test_stackshot_owner_grp);
3902 semaphore_destroy(kernel_task,
3903 sysctl_debug_test_stackshot_rwlck_sem);
3904 sysctl_debug_test_stackshot_rwlck_inited = 0;
3905
3906 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);
3907 break;
3908 case -1: /* user just wanted to read the value, so do nothing */
3909 break;
3910 default:
3911 error = EINVAL;
3912 break;
3913 }
3914 }
3915 return error;
3916 }
3917
3918
3919 SYSCTL_PROC(_debug,
3920 OID_AUTO,
3921 test_RWLockOwnerCtl,
3922 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3923 0,
3924 0,
3925 sysctl_debug_test_stackshot_rwlck_owner,
3926 "-",
3927 "Testing rwlock owner in kernel");
3928 #endif /* !CONFIG_XNUPOST */
3929
3930 STATIC int
3931 sysctl_swapusage
3932 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3933 {
3934 int error;
3935 uint64_t swap_total;
3936 uint64_t swap_avail;
3937 vm_size_t swap_pagesize;
3938 boolean_t swap_encrypted;
3939 struct xsw_usage xsu = {};
3940
3941 error = macx_swapinfo(&swap_total,
3942 &swap_avail,
3943 &swap_pagesize,
3944 &swap_encrypted);
3945 if (error) {
3946 return error;
3947 }
3948
3949 xsu.xsu_total = swap_total;
3950 xsu.xsu_avail = swap_avail;
3951 xsu.xsu_used = swap_total - swap_avail;
3952 xsu.xsu_pagesize = (u_int32_t)MIN(swap_pagesize, UINT32_MAX);
3953 xsu.xsu_encrypted = swap_encrypted;
3954 return sysctl_io_opaque(req, &xsu, sizeof(xsu), NULL);
3955 }
3956
3957
3958
3959 SYSCTL_PROC(_vm, VM_SWAPUSAGE, swapusage,
3960 CTLTYPE_STRUCT | CTLFLAG_RD | CTLFLAG_LOCKED,
3961 0, 0, sysctl_swapusage, "S,xsw_usage", "");
3962
3963 extern int vm_swap_enabled;
3964 SYSCTL_INT(_vm, OID_AUTO, swap_enabled, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_swap_enabled, 0, "");
3965
3966 #if DEVELOPMENT || DEBUG
3967 extern int vm_num_swap_files_config;
3968 extern int vm_num_swap_files;
3969 extern lck_mtx_t vm_swap_data_lock;
3970 #define VM_MAX_SWAP_FILE_NUM 100
3971
3972 static int
3973 sysctl_vm_config_num_swap_files SYSCTL_HANDLER_ARGS
3974 {
3975 #pragma unused(arg1, arg2)
3976 int error = 0, val = vm_num_swap_files_config;
3977
3978 error = sysctl_handle_int(oidp, &val, 0, req);
3979 if (error || !req->newptr) {
3980 goto out;
3981 }
3982
3983 if (!VM_CONFIG_SWAP_IS_ACTIVE && !VM_CONFIG_FREEZER_SWAP_IS_ACTIVE) {
3984 printf("Swap is disabled\n");
3985 error = EINVAL;
3986 goto out;
3987 }
3988
3989 lck_mtx_lock(&vm_swap_data_lock);
3990
3991 if (val < vm_num_swap_files) {
3992 printf("Cannot configure fewer swap files than already exist.\n");
3993 error = EINVAL;
3994 lck_mtx_unlock(&vm_swap_data_lock);
3995 goto out;
3996 }
3997
3998 if (val > VM_MAX_SWAP_FILE_NUM) {
3999 printf("Capping number of swap files to upper bound.\n");
4000 val = VM_MAX_SWAP_FILE_NUM;
4001 }
4002
4003 vm_num_swap_files_config = val;
4004 lck_mtx_unlock(&vm_swap_data_lock);
4005 out:
4006
4007 return 0;
4008 }
4009
4010 SYSCTL_PROC(_debug, OID_AUTO, num_swap_files_configured, CTLFLAG_ANYBODY | CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, sysctl_vm_config_num_swap_files, "I", "");
4011 #endif /* DEVELOPMENT || DEBUG */
4012
4013 /* this kernel does NOT implement shared_region_make_private_np() */
4014 SYSCTL_INT(_kern, KERN_SHREG_PRIVATIZABLE, shreg_private,
4015 CTLFLAG_RD | CTLFLAG_LOCKED,
4016 (int *)NULL, 0, "");
4017
4018 STATIC int
4019 fetch_process_cputype(
4020 proc_t cur_proc,
4021 int *name,
4022 u_int namelen,
4023 cpu_type_t *cputype)
4024 {
4025 proc_t p = PROC_NULL;
4026 int refheld = 0;
4027 cpu_type_t ret = 0;
4028 int error = 0;
4029
4030 if (namelen == 0) {
4031 p = cur_proc;
4032 } else if (namelen == 1) {
4033 p = proc_find(name[0]);
4034 if (p == NULL) {
4035 return EINVAL;
4036 }
4037 refheld = 1;
4038 } else {
4039 error = EINVAL;
4040 goto out;
4041 }
4042
4043 ret = cpu_type() & ~CPU_ARCH_MASK;
4044 if (IS_64BIT_PROCESS(p)) {
4045 ret |= CPU_ARCH_ABI64;
4046 }
4047
4048 *cputype = ret;
4049
4050 if (refheld != 0) {
4051 proc_rele(p);
4052 }
4053 out:
4054 return error;
4055 }
4056
4057
4058 STATIC int
4059 sysctl_sysctl_native(__unused struct sysctl_oid *oidp, void *arg1, int arg2,
4060 struct sysctl_req *req)
4061 {
4062 int error;
4063 cpu_type_t proc_cputype = 0;
4064 if ((error = fetch_process_cputype(req->p, (int *)arg1, arg2, &proc_cputype)) != 0) {
4065 return error;
4066 }
4067 int res = 1;
4068 if ((proc_cputype & ~CPU_ARCH_MASK) != (cpu_type() & ~CPU_ARCH_MASK)) {
4069 res = 0;
4070 }
4071 return SYSCTL_OUT(req, &res, sizeof(res));
4072 }
4073 SYSCTL_PROC(_sysctl, OID_AUTO, proc_native, CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, sysctl_sysctl_native, "I", "proc_native");
4074
4075 STATIC int
4076 sysctl_sysctl_cputype(__unused struct sysctl_oid *oidp, void *arg1, int arg2,
4077 struct sysctl_req *req)
4078 {
4079 int error;
4080 cpu_type_t proc_cputype = 0;
4081 if ((error = fetch_process_cputype(req->p, (int *)arg1, arg2, &proc_cputype)) != 0) {
4082 return error;
4083 }
4084 return SYSCTL_OUT(req, &proc_cputype, sizeof(proc_cputype));
4085 }
4086 SYSCTL_PROC(_sysctl, OID_AUTO, proc_cputype, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, sysctl_sysctl_cputype, "I", "proc_cputype");
4087
4088 STATIC int
4089 sysctl_safeboot
4090 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4091 {
4092 return sysctl_io_number(req, boothowto & RB_SAFEBOOT ? 1 : 0, sizeof(int), NULL, NULL);
4093 }
4094
4095 SYSCTL_PROC(_kern, KERN_SAFEBOOT, safeboot,
4096 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4097 0, 0, sysctl_safeboot, "I", "");
4098
4099 STATIC int
4100 sysctl_singleuser
4101 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4102 {
4103 return sysctl_io_number(req, boothowto & RB_SINGLE ? 1 : 0, sizeof(int), NULL, NULL);
4104 }
4105
4106 SYSCTL_PROC(_kern, OID_AUTO, singleuser,
4107 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4108 0, 0, sysctl_singleuser, "I", "");
4109
4110 STATIC int
4111 sysctl_minimalboot
4112 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4113 {
4114 return sysctl_io_number(req, minimalboot, sizeof(int), NULL, NULL);
4115 }
4116
4117 SYSCTL_PROC(_kern, OID_AUTO, minimalboot,
4118 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4119 0, 0, sysctl_minimalboot, "I", "");
4120
4121 /*
4122 * Controls for debugging affinity sets - see osfmk/kern/affinity.c
4123 */
4124 extern boolean_t affinity_sets_enabled;
4125 extern int affinity_sets_mapping;
4126
4127 SYSCTL_INT(_kern, OID_AUTO, affinity_sets_enabled,
4128 CTLFLAG_RW | CTLFLAG_LOCKED, (int *) &affinity_sets_enabled, 0, "hinting enabled");
4129 SYSCTL_INT(_kern, OID_AUTO, affinity_sets_mapping,
4130 CTLFLAG_RW | CTLFLAG_LOCKED, &affinity_sets_mapping, 0, "mapping policy");
4131
4132 /*
4133 * Boolean indicating if KASLR is active.
4134 */
4135 STATIC int
4136 sysctl_slide
4137 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4138 {
4139 uint32_t slide;
4140
4141 slide = vm_kernel_slide ? 1 : 0;
4142
4143 return sysctl_io_number( req, slide, sizeof(int), NULL, NULL);
4144 }
4145
4146 SYSCTL_PROC(_kern, OID_AUTO, slide,
4147 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4148 0, 0, sysctl_slide, "I", "");
4149
4150 #if DEBUG || DEVELOPMENT
4151 #if defined(__arm64__)
4152 extern vm_offset_t segTEXTEXECB;
4153
4154 static int
4155 sysctl_kernel_text_exec_base_slide SYSCTL_HANDLER_ARGS
4156 {
4157 #pragma unused(arg1, arg2, oidp)
4158 unsigned long slide = 0;
4159 kc_format_t kc_format;
4160
4161 PE_get_primary_kc_format(&kc_format);
4162
4163 if (kc_format == KCFormatFileset) {
4164 void *kch = PE_get_kc_header(KCKindPrimary);
4165 slide = (unsigned long)segTEXTEXECB - (unsigned long)kch + vm_kernel_slide;
4166 }
4167 return SYSCTL_OUT(req, &slide, sizeof(slide));
4168 }
4169
4170 SYSCTL_QUAD(_kern, OID_AUTO, kernel_slide, CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED, &vm_kernel_slide, "");
4171 SYSCTL_QUAD(_kern, OID_AUTO, kernel_text_exec_base, CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED, &segTEXTEXECB, "");
4172 SYSCTL_PROC(_kern, OID_AUTO, kernel_text_exec_base_slide, CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, sysctl_kernel_text_exec_base_slide, "Q", "");
4173 #endif /* defined(__arm64__) */
4174
4175 /* User address of the PFZ */
4176 extern user32_addr_t commpage_text32_location;
4177 extern user64_addr_t commpage_text64_location;
4178
4179 STATIC int
4180 sysctl_pfz_start SYSCTL_HANDLER_ARGS
4181 {
4182 #pragma unused(oidp, arg1, arg2)
4183
4184 #ifdef __LP64__
4185 return sysctl_io_number(req, commpage_text64_location, sizeof(user64_addr_t), NULL, NULL);
4186 #else
4187 return sysctl_io_number(req, commpage_text32_location, sizeof(user32_addr_t), NULL, NULL);
4188 #endif
4189 }
4190
4191 SYSCTL_PROC(_kern, OID_AUTO, pfz,
4192 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_MASKED,
4193 0, 0, sysctl_pfz_start, "I", "");
4194 #endif
4195
4196
4197 /*
4198 * Limit on total memory users can wire.
4199 *
4200 * vm_global_user_wire_limit - system wide limit on wired memory from all processes combined.
4201 *
4202 * vm_per_task_user_wire_limit - per address space limit on wired memory. This puts a cap on the process's rlimit value.
4203 *
4204 * These values are initialized to reasonable defaults at boot time based on the available physical memory in
4205 * kmem_init().
4206 *
4207 * All values are in bytes.
4208 */
4209
4210 vm_map_size_t vm_global_user_wire_limit;
4211 vm_map_size_t vm_per_task_user_wire_limit;
4212 extern uint64_t max_mem_actual, max_mem;
4213
4214 uint64_t vm_add_wire_count_over_global_limit;
4215 uint64_t vm_add_wire_count_over_user_limit;
4216 /*
4217 * We used to have a global in the kernel called vm_global_no_user_wire_limit which was the inverse
4218 * of vm_global_user_wire_limit. But maintaining both of those is silly, and vm_global_user_wire_limit is the
4219 * real limit.
4220 * This function is for backwards compatibility with userspace
4221 * since we exposed the old global via a sysctl.
4222 */
4223 STATIC int
4224 sysctl_global_no_user_wire_amount(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4225 {
4226 vm_map_size_t old_value;
4227 vm_map_size_t new_value;
4228 int changed;
4229 int error;
4230 uint64_t config_memsize = max_mem;
4231 #if defined(XNU_TARGET_OS_OSX)
4232 config_memsize = max_mem_actual;
4233 #endif /* defined(XNU_TARGET_OS_OSX) */
4234
4235 old_value = (vm_map_size_t)(config_memsize - vm_global_user_wire_limit);
4236 error = sysctl_io_number(req, old_value, sizeof(vm_map_size_t), &new_value, &changed);
4237 if (changed) {
4238 if ((uint64_t)new_value > config_memsize) {
4239 error = EINVAL;
4240 } else {
4241 vm_global_user_wire_limit = (vm_map_size_t)(config_memsize - new_value);
4242 }
4243 }
4244 return error;
4245 }
4246 /*
4247 * There needs to be a more automatic/elegant way to do this
4248 */
4249 SYSCTL_QUAD(_vm, OID_AUTO, global_user_wire_limit, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_global_user_wire_limit, "");
4250 SYSCTL_QUAD(_vm, OID_AUTO, user_wire_limit, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_per_task_user_wire_limit, "");
4251 SYSCTL_PROC(_vm, OID_AUTO, global_no_user_wire_amount, CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, &sysctl_global_no_user_wire_amount, "Q", "");
4252
4253 /*
4254 * Relaxed atomic RW of a 64bit value via sysctl.
4255 */
4256 STATIC int
4257 sysctl_r_64bit_atomic(uint64_t *ptr, struct sysctl_req *req)
4258 {
4259 uint64_t old_value;
4260 uint64_t new_value;
4261 int error;
4262
4263 old_value = os_atomic_load_wide(ptr, relaxed);
4264 error = sysctl_io_number(req, old_value, sizeof(vm_map_size_t), &new_value, NULL);
4265 return error;
4266 }
4267 STATIC int
4268 sysctl_add_wire_count_over_global_limit(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4269 {
4270 return sysctl_r_64bit_atomic(&vm_add_wire_count_over_global_limit, req);
4271 }
4272 STATIC int
4273 sysctl_add_wire_count_over_user_limit(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4274 {
4275 return sysctl_r_64bit_atomic(&vm_add_wire_count_over_user_limit, req);
4276 }
4277
4278 SYSCTL_PROC(_vm, OID_AUTO, add_wire_count_over_global_limit, CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, &sysctl_add_wire_count_over_global_limit, "Q", "");
4279 SYSCTL_PROC(_vm, OID_AUTO, add_wire_count_over_user_limit, CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, &sysctl_add_wire_count_over_user_limit, "Q", "");
4280
4281 #if DEVELOPMENT || DEBUG
4282 /* These sysctls are used to test the wired limit. */
4283 extern unsigned int vm_page_wire_count;
4284 extern uint32_t vm_lopage_free_count;
4285 SYSCTL_INT(_vm, OID_AUTO, page_wire_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_wire_count, 0, "");
4286 SYSCTL_INT(_vm, OID_AUTO, lopage_free_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_lopage_free_count, 0, "");
4287
4288 /*
4289 * Setting the per task variable exclude_physfootprint_ledger to 1 will allow the calling task to exclude memory entries that are
4290 * tagged by VM_LEDGER_TAG_DEFAULT and flagged by VM_LEDGER_FLAG_EXCLUDE_FOOTPRINT_DEBUG from its phys_footprint ledger.
4291 */
4292
4293 STATIC int
4294 sysctl_rw_task_no_footprint_for_debug(struct sysctl_oid *oidp __unused, void *arg1 __unused, int arg2 __unused, struct sysctl_req *req)
4295 {
4296 int error;
4297 int value;
4298 proc_t p = current_proc();
4299
4300 if (req->newptr) {
4301 // Write request
4302 error = SYSCTL_IN(req, &value, sizeof(value));
4303 if (!error) {
4304 if (value == 1) {
4305 task_set_no_footprint_for_debug(proc_task(p), TRUE);
4306 } else if (value == 0) {
4307 task_set_no_footprint_for_debug(proc_task(p), FALSE);
4308 } else {
4309 error = EINVAL;
4310 }
4311 }
4312 } else {
4313 // Read request
4314 value = task_get_no_footprint_for_debug(proc_task(p));
4315 error = SYSCTL_OUT(req, &value, sizeof(value));
4316 }
4317 return error;
4318 }
4319
4320 SYSCTL_PROC(_vm, OID_AUTO, task_no_footprint_for_debug,
4321 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY,
4322 0, 0, &sysctl_rw_task_no_footprint_for_debug, "I", "Allow debug memory to be excluded from this task's memory footprint (debug only)");
4323
4324 #endif /* DEVELOPMENT || DEBUG */
4325
4326
4327 extern int vm_map_copy_overwrite_aligned_src_not_internal;
4328 extern int vm_map_copy_overwrite_aligned_src_not_symmetric;
4329 extern int vm_map_copy_overwrite_aligned_src_large;
4330 SYSCTL_INT(_vm, OID_AUTO, vm_copy_src_not_internal, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_map_copy_overwrite_aligned_src_not_internal, 0, "");
4331 SYSCTL_INT(_vm, OID_AUTO, vm_copy_src_not_symmetric, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_map_copy_overwrite_aligned_src_not_symmetric, 0, "");
4332 SYSCTL_INT(_vm, OID_AUTO, vm_copy_src_large, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_map_copy_overwrite_aligned_src_large, 0, "");
4333
4334
4335 extern uint32_t vm_page_external_count;
4336
4337 SYSCTL_INT(_vm, OID_AUTO, vm_page_external_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_external_count, 0, "");
4338
4339 SYSCTL_INT(_vm, OID_AUTO, vm_page_filecache_min, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_filecache_min, 0, "");
4340 SYSCTL_INT(_vm, OID_AUTO, vm_page_xpmapped_min, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_xpmapped_min, 0, "");
4341
4342 #if DEVELOPMENT || DEBUG
4343 SYSCTL_INT(_vm, OID_AUTO, vm_page_filecache_min_divisor, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_filecache_min_divisor, 0, "");
4344 SYSCTL_INT(_vm, OID_AUTO, vm_page_xpmapped_min_divisor, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_xpmapped_min_divisor, 0, "");
4345 extern boolean_t vps_yield_for_pgqlockwaiters;
4346 SYSCTL_INT(_vm, OID_AUTO, vm_pageoutscan_yields_for_pageQlockwaiters, CTLFLAG_RW | CTLFLAG_LOCKED, &vps_yield_for_pgqlockwaiters, 0, "");
4347 #endif
4348
4349 extern int vm_compressor_mode;
4350 extern int vm_compressor_is_active;
4351 extern int vm_compressor_available;
4352 extern uint32_t c_seg_bufsize;
4353 extern uint64_t compressor_pool_size;
4354 extern uint32_t vm_ripe_target_age;
4355 extern uint32_t swapout_target_age;
4356 extern int64_t compressor_bytes_used;
4357 extern int64_t c_segment_input_bytes;
4358 extern int64_t c_segment_compressed_bytes;
4359 extern uint32_t compressor_eval_period_in_msecs;
4360 extern uint32_t compressor_sample_min_in_msecs;
4361 extern uint32_t compressor_sample_max_in_msecs;
4362 extern uint32_t compressor_thrashing_threshold_per_10msecs;
4363 extern uint32_t compressor_thrashing_min_per_10msecs;
4364 extern uint32_t vm_compressor_time_thread;
4365
4366 #if DEVELOPMENT || DEBUG
4367 extern uint32_t vm_compressor_minorcompact_threshold_divisor;
4368 extern uint32_t vm_compressor_majorcompact_threshold_divisor;
4369 extern uint32_t vm_compressor_unthrottle_threshold_divisor;
4370 extern uint32_t vm_compressor_catchup_threshold_divisor;
4371
4372 extern uint32_t vm_compressor_minorcompact_threshold_divisor_overridden;
4373 extern uint32_t vm_compressor_majorcompact_threshold_divisor_overridden;
4374 extern uint32_t vm_compressor_unthrottle_threshold_divisor_overridden;
4375 extern uint32_t vm_compressor_catchup_threshold_divisor_overridden;
4376
4377 extern vmct_stats_t vmct_stats;
4378
4379
4380 STATIC int
4381 sysctl_minorcompact_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4382 {
4383 int new_value, changed;
4384 int error = sysctl_io_number(req, vm_compressor_minorcompact_threshold_divisor, sizeof(int), &new_value, &changed);
4385
4386 if (changed) {
4387 vm_compressor_minorcompact_threshold_divisor = new_value;
4388 vm_compressor_minorcompact_threshold_divisor_overridden = 1;
4389 }
4390 return error;
4391 }
4392
4393 SYSCTL_PROC(_vm, OID_AUTO, compressor_minorcompact_threshold_divisor,
4394 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4395 0, 0, sysctl_minorcompact_threshold_divisor, "I", "");
4396
4397
4398 STATIC int
4399 sysctl_majorcompact_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4400 {
4401 int new_value, changed;
4402 int error = sysctl_io_number(req, vm_compressor_majorcompact_threshold_divisor, sizeof(int), &new_value, &changed);
4403
4404 if (changed) {
4405 vm_compressor_majorcompact_threshold_divisor = new_value;
4406 vm_compressor_majorcompact_threshold_divisor_overridden = 1;
4407 }
4408 return error;
4409 }
4410
4411 SYSCTL_PROC(_vm, OID_AUTO, compressor_majorcompact_threshold_divisor,
4412 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4413 0, 0, sysctl_majorcompact_threshold_divisor, "I", "");
4414
4415
4416 STATIC int
4417 sysctl_unthrottle_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4418 {
4419 int new_value, changed;
4420 int error = sysctl_io_number(req, vm_compressor_unthrottle_threshold_divisor, sizeof(int), &new_value, &changed);
4421
4422 if (changed) {
4423 vm_compressor_unthrottle_threshold_divisor = new_value;
4424 vm_compressor_unthrottle_threshold_divisor_overridden = 1;
4425 }
4426 return error;
4427 }
4428
4429 SYSCTL_PROC(_vm, OID_AUTO, compressor_unthrottle_threshold_divisor,
4430 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4431 0, 0, sysctl_unthrottle_threshold_divisor, "I", "");
4432
4433
4434 STATIC int
4435 sysctl_catchup_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4436 {
4437 int new_value, changed;
4438 int error = sysctl_io_number(req, vm_compressor_catchup_threshold_divisor, sizeof(int), &new_value, &changed);
4439
4440 if (changed) {
4441 vm_compressor_catchup_threshold_divisor = new_value;
4442 vm_compressor_catchup_threshold_divisor_overridden = 1;
4443 }
4444 return error;
4445 }
4446
4447 SYSCTL_PROC(_vm, OID_AUTO, compressor_catchup_threshold_divisor,
4448 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4449 0, 0, sysctl_catchup_threshold_divisor, "I", "");
4450 #endif
4451
4452
4453 SYSCTL_QUAD(_vm, OID_AUTO, compressor_input_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &c_segment_input_bytes, "");
4454 SYSCTL_QUAD(_vm, OID_AUTO, compressor_compressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &c_segment_compressed_bytes, "");
4455 SYSCTL_QUAD(_vm, OID_AUTO, compressor_bytes_used, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_bytes_used, "");
4456
4457 SYSCTL_INT(_vm, OID_AUTO, compressor_mode, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_mode, 0, "");
4458 SYSCTL_INT(_vm, OID_AUTO, compressor_is_active, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_is_active, 0, "");
4459 SYSCTL_INT(_vm, OID_AUTO, compressor_swapout_target_age, CTLFLAG_RD | CTLFLAG_LOCKED, &swapout_target_age, 0, "");
4460 SYSCTL_INT(_vm, OID_AUTO, compressor_available, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_available, 0, "");
4461 SYSCTL_INT(_vm, OID_AUTO, compressor_segment_buffer_size, CTLFLAG_RD | CTLFLAG_LOCKED, &c_seg_bufsize, 0, "");
4462 SYSCTL_QUAD(_vm, OID_AUTO, compressor_pool_size, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_pool_size, "");
4463
#if CONFIG_TRACK_UNMODIFIED_ANON_PAGES
extern uint64_t compressor_ro_uncompressed;
extern uint64_t compressor_ro_uncompressed_total_returned;
extern uint64_t compressor_ro_uncompressed_skip_returned;
extern uint64_t compressor_ro_uncompressed_get;
extern uint64_t compressor_ro_uncompressed_put;         /* declared here but not exported below */
extern uint64_t compressor_ro_uncompressed_swap_usage;

/* Note that several OID names differ from the variables that back them. */
SYSCTL_QUAD(_vm, OID_AUTO, compressor_ro_uncompressed_total_returned,
    CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_ro_uncompressed_total_returned, "");
SYSCTL_QUAD(_vm, OID_AUTO, compressor_ro_uncompressed_writes_saved,
    CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_ro_uncompressed_skip_returned, "");
SYSCTL_QUAD(_vm, OID_AUTO, compressor_ro_uncompressed_candidates,
    CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_ro_uncompressed, "");
SYSCTL_QUAD(_vm, OID_AUTO, compressor_ro_uncompressed_rereads,
    CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_ro_uncompressed_get, "");
SYSCTL_QUAD(_vm, OID_AUTO, compressor_ro_uncompressed_swap_pages_on_disk,
    CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_ro_uncompressed_swap_usage, "");
#endif /* CONFIG_TRACK_UNMODIFIED_ANON_PAGES */
4478
4479 extern int min_csegs_per_major_compaction;
4480 SYSCTL_INT(_vm, OID_AUTO, compressor_min_csegs_per_major_compaction, CTLFLAG_RW | CTLFLAG_LOCKED, &min_csegs_per_major_compaction, 0, "");
4481
4482 SYSCTL_INT(_vm, OID_AUTO, vm_ripe_target_age_in_secs, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_ripe_target_age, 0, "");
4483
4484 SYSCTL_INT(_vm, OID_AUTO, compressor_eval_period_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_eval_period_in_msecs, 0, "");
4485 SYSCTL_INT(_vm, OID_AUTO, compressor_sample_min_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_sample_min_in_msecs, 0, "");
4486 SYSCTL_INT(_vm, OID_AUTO, compressor_sample_max_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_sample_max_in_msecs, 0, "");
4487 SYSCTL_INT(_vm, OID_AUTO, compressor_thrashing_threshold_per_10msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_thrashing_threshold_per_10msecs, 0, "");
4488 SYSCTL_INT(_vm, OID_AUTO, compressor_thrashing_min_per_10msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_thrashing_min_per_10msecs, 0, "");
4489
4490 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapouts_under_30s, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.unripe_under_30s, "");
4491 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapouts_under_60s, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.unripe_under_60s, "");
4492 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapouts_under_300s, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.unripe_under_300s, "");
4493 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_reclaim_swapins, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.reclaim_swapins, "");
4494 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_defrag_swapins, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.defrag_swapins, "");
4495 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_threshold_exceeded, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.compressor_swap_threshold_exceeded, "");
4496 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_fileq_throttled, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.external_q_throttled, "");
4497 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_free_count_low, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.free_count_below_reserve, "");
4498 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_thrashing_detected, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.thrashing_detected, "");
4499 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_fragmentation_detected, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.fragmentation_detected, "");
4500
4501 SYSCTL_STRING(_vm, OID_AUTO, swapfileprefix, CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED, swapfilename, sizeof(swapfilename) - SWAPFILENAME_INDEX_LEN, "");
4502
4503 SYSCTL_INT(_vm, OID_AUTO, compressor_timing_enabled, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_time_thread, 0, "");
4504
4505 #if DEVELOPMENT || DEBUG
4506 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_runtime0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_runtimes[0], "");
4507 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_runtime1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_runtimes[1], "");
4508
4509 SYSCTL_QUAD(_vm, OID_AUTO, compressor_threads_total_execution_time, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_cthreads_total, "");
4510
4511 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_pages0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_pages[0], "");
4512 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_pages1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_pages[1], "");
4513
4514 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_iterations0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_iterations[0], "");
4515 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_iterations1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_iterations[1], "");
4516
4517 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_minpages0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_minpages[0], 0, "");
4518 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_minpages1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_minpages[1], 0, "");
4519
4520 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_maxpages0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_maxpages[0], 0, "");
4521 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_maxpages1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_maxpages[1], 0, "");
4522
4523 int vm_compressor_injected_error_count;
4524
4525 SYSCTL_INT(_vm, OID_AUTO, compressor_injected_error_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_injected_error_count, 0, "");
4526
4527 static int
4528 sysctl_compressor_inject_error(__unused struct sysctl_oid *oidp,
4529 __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4530 {
4531 int result;
4532 vm_address_t va = 0;
4533 int changed;
4534
4535 result = sysctl_io_number(req, va, sizeof(va), &va, &changed);
4536 if (result == 0 && changed) {
4537 result = vm_map_inject_error(current_map(), va);
4538 if (result == 0) {
4539 /*
4540 * Count the number of errors injected successfully to detect
4541 * situations where corruption was caused by improper use of this
4542 * sysctl.
4543 */
4544 os_atomic_inc(&vm_compressor_injected_error_count, relaxed);
4545 }
4546 }
4547 return result;
4548 }
4549
4550 SYSCTL_PROC(_vm, OID_AUTO, compressor_inject_error, CTLTYPE_QUAD | CTLFLAG_LOCKED | CTLFLAG_RW,
4551 0, 0, sysctl_compressor_inject_error, "Q", "flips a bit in a compressed page for the current task");
4552
4553 /*
4554 * Opt a process in/out of self donation mode.
4555 */
4556 static int
4557 sysctl_vm_pid_toggle_selfdonate_pages SYSCTL_HANDLER_ARGS
4558 {
4559 #pragma unused(arg1, arg2)
4560 int error, pid = 0;
4561 proc_t p;
4562
4563 error = sysctl_handle_int(oidp, &pid, 0, req);
4564 if (error || !req->newptr) {
4565 return error;
4566 }
4567
4568 p = proc_find(pid);
4569 if (p != NULL) {
4570 (void) vm_toggle_task_selfdonate_pages(proc_task(p));
4571 proc_rele(p);
4572 return error;
4573 } else {
4574 printf("sysctl_vm_pid_selfdonate_pages: Invalid process\n");
4575 }
4576
4577 return EINVAL;
4578 }
4579 SYSCTL_PROC(_vm, OID_AUTO, pid_toggle_selfdonate_pages, CTLTYPE_INT | CTLFLAG_WR | CTLFLAG_LOCKED | CTLFLAG_MASKED,
4580 0, 0, &sysctl_vm_pid_toggle_selfdonate_pages, "I", "");
4581 #endif
4582 extern uint32_t vm_page_donate_mode;
4583 extern uint32_t vm_page_donate_target_high, vm_page_donate_target_low;
4584 SYSCTL_INT(_vm, OID_AUTO, vm_page_donate_mode, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_donate_mode, 0, "");
4585 SYSCTL_INT(_vm, OID_AUTO, vm_page_donate_target_high, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_donate_target_high, 0, "");
4586 SYSCTL_INT(_vm, OID_AUTO, vm_page_donate_target_low, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_donate_target_low, 0, "");
4587
/*
 * Read-only 64-bit views of individual compressor_stats fields, exported
 * under "vm".  Note that the *_catime / *_datime node names map onto the
 * *_cabstime / *_dabstime fields of compressor_stats.
 */

/* LZ4 compression counters. */
SYSCTL_QUAD(_vm, OID_AUTO, lz4_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_compressions, "");
SYSCTL_QUAD(_vm, OID_AUTO, lz4_compression_failures, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_compression_failures, "");
SYSCTL_QUAD(_vm, OID_AUTO, lz4_compressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_compressed_bytes, "");
SYSCTL_QUAD(_vm, OID_AUTO, lz4_wk_compression_delta, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_wk_compression_delta, "");
SYSCTL_QUAD(_vm, OID_AUTO, lz4_wk_compression_negative_delta, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_wk_compression_negative_delta, "");

/* LZ4 decompression counters. */
SYSCTL_QUAD(_vm, OID_AUTO, lz4_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_decompressions, "");
SYSCTL_QUAD(_vm, OID_AUTO, lz4_decompressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_decompressed_bytes, "");

SYSCTL_QUAD(_vm, OID_AUTO, uc_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.uc_decompressions, "");

/* wk / wkh / wks compression counters and their *_cabstime fields. */
SYSCTL_QUAD(_vm, OID_AUTO, wk_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressions, "");

SYSCTL_QUAD(_vm, OID_AUTO, wk_catime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_cabstime, "");

SYSCTL_QUAD(_vm, OID_AUTO, wkh_catime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_cabstime, "");
SYSCTL_QUAD(_vm, OID_AUTO, wkh_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_compressions, "");

SYSCTL_QUAD(_vm, OID_AUTO, wks_catime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_cabstime, "");
SYSCTL_QUAD(_vm, OID_AUTO, wks_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_compressions, "");

SYSCTL_QUAD(_vm, OID_AUTO, wk_compressions_exclusive, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressions_exclusive, "");
SYSCTL_QUAD(_vm, OID_AUTO, wk_sv_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_sv_compressions, "");
SYSCTL_QUAD(_vm, OID_AUTO, wk_mzv_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_mzv_compressions, "");
SYSCTL_QUAD(_vm, OID_AUTO, wk_compression_failures, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compression_failures, "");
SYSCTL_QUAD(_vm, OID_AUTO, wk_compressed_bytes_exclusive, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressed_bytes_exclusive, "");
SYSCTL_QUAD(_vm, OID_AUTO, wk_compressed_bytes_total, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressed_bytes_total, "");

SYSCTL_QUAD(_vm, OID_AUTO, wks_compressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_compressed_bytes, "");
SYSCTL_QUAD(_vm, OID_AUTO, wks_compression_failures, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_compression_failures, "");
SYSCTL_QUAD(_vm, OID_AUTO, wks_sv_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_sv_compressions, "");


/* wk / wkh / wks decompression counters and their *_dabstime fields. */
SYSCTL_QUAD(_vm, OID_AUTO, wk_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_decompressions, "");

SYSCTL_QUAD(_vm, OID_AUTO, wk_datime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_dabstime, "");

SYSCTL_QUAD(_vm, OID_AUTO, wkh_datime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_dabstime, "");
SYSCTL_QUAD(_vm, OID_AUTO, wkh_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_decompressions, "");

SYSCTL_QUAD(_vm, OID_AUTO, wks_datime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_dabstime, "");
SYSCTL_QUAD(_vm, OID_AUTO, wks_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_decompressions, "");

SYSCTL_QUAD(_vm, OID_AUTO, wk_decompressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_decompressed_bytes, "");
SYSCTL_QUAD(_vm, OID_AUTO, wk_sv_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_sv_decompressions, "");
4633
/*
 * Read/write integer views of individual vmctune fields, exported under "vm".
 * Each node name matches the vmctune member it exposes.
 */
SYSCTL_INT(_vm, OID_AUTO, lz4_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_threshold, 0, "");
SYSCTL_INT(_vm, OID_AUTO, wkdm_reeval_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.wkdm_reeval_threshold, 0, "");
SYSCTL_INT(_vm, OID_AUTO, lz4_max_failure_skips, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_max_failure_skips, 0, "");
SYSCTL_INT(_vm, OID_AUTO, lz4_max_failure_run_length, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_max_failure_run_length, 0, "");
SYSCTL_INT(_vm, OID_AUTO, lz4_max_preselects, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_max_preselects, 0, "");
SYSCTL_INT(_vm, OID_AUTO, lz4_run_preselection_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_run_preselection_threshold, 0, "");
SYSCTL_INT(_vm, OID_AUTO, lz4_run_continue_bytes, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_run_continue_bytes, 0, "");
SYSCTL_INT(_vm, OID_AUTO, lz4_profitable_bytes, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_profitable_bytes, 0, "");
#if DEVELOPMENT || DEBUG
/*
 * Compressor and VM debugging knobs, only built on DEVELOPMENT/DEBUG kernels.
 * All are read/write; the node names differ from the variable names in
 * several cases (e.g. vm.compressor_codec -> vm_compressor_current_codec).
 */
extern int vm_compressor_current_codec;
extern int vm_compressor_test_seg_wp;
extern boolean_t vm_compressor_force_sw_wkdm;
SYSCTL_INT(_vm, OID_AUTO, compressor_codec, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_current_codec, 0, "");
SYSCTL_INT(_vm, OID_AUTO, compressor_test_wp, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_test_seg_wp, 0, "");

/* vm.wksw_force exposes the boolean_t vm_compressor_force_sw_wkdm as an int. */
SYSCTL_INT(_vm, OID_AUTO, wksw_force, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_force_sw_wkdm, 0, "");
extern int precompy, wkswhw;

SYSCTL_INT(_vm, OID_AUTO, precompy, CTLFLAG_RW | CTLFLAG_LOCKED, &precompy, 0, "");
SYSCTL_INT(_vm, OID_AUTO, wkswhw, CTLFLAG_RW | CTLFLAG_LOCKED, &wkswhw, 0, "");
extern unsigned int vm_ktrace_enabled;
SYSCTL_INT(_vm, OID_AUTO, vm_ktrace, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_ktrace_enabled, 0, "");
#endif
4657
#if CONFIG_PHANTOM_CACHE
/*
 * Phantom cache tunables, exported read/write under "vm" when
 * CONFIG_PHANTOM_CACHE is set.  The variables are defined elsewhere.
 */
extern uint32_t phantom_cache_thrashing_threshold;
extern uint32_t phantom_cache_eval_period_in_msecs;
extern uint32_t phantom_cache_thrashing_threshold_ssd;


SYSCTL_INT(_vm, OID_AUTO, phantom_cache_eval_period_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &phantom_cache_eval_period_in_msecs, 0, "");
SYSCTL_INT(_vm, OID_AUTO, phantom_cache_thrashing_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &phantom_cache_thrashing_threshold, 0, "");
SYSCTL_INT(_vm, OID_AUTO, phantom_cache_thrashing_threshold_ssd, CTLFLAG_RW | CTLFLAG_LOCKED, &phantom_cache_thrashing_threshold_ssd, 0, "");
#endif
4668
#if defined(__LP64__)
/*
 * Background page queue state, only exported on LP64 builds.
 * mode / exclude_external / target are writable; the counts are read-only.
 */
extern uint32_t vm_page_background_count;
extern uint32_t vm_page_background_target;
extern uint32_t vm_page_background_internal_count;
extern uint32_t vm_page_background_external_count;
extern uint32_t vm_page_background_mode;
extern uint32_t vm_page_background_exclude_external;
extern uint64_t vm_page_background_promoted_count;
extern uint64_t vm_pageout_rejected_bq_internal;
extern uint64_t vm_pageout_rejected_bq_external;

SYSCTL_INT(_vm, OID_AUTO, vm_page_background_mode, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_background_mode, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_page_background_exclude_external, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_background_exclude_external, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_page_background_target, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_background_target, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_page_background_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_count, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_page_background_internal_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_internal_count, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_page_background_external_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_external_count, 0, "");

/*
 * 64-bit read-only counters.  The "considered" counters live in
 * vm_pageout_vminfo; the "rejected" counters are standalone globals.
 */
SYSCTL_QUAD(_vm, OID_AUTO, vm_page_background_promoted_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_promoted_count, "");
SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_considered_bq_internal, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_vminfo.vm_pageout_considered_bq_internal, "");
SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_considered_bq_external, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_vminfo.vm_pageout_considered_bq_external, "");
SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_rejected_bq_internal, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_rejected_bq_internal, "");
SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_rejected_bq_external, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_rejected_bq_external, "");

#endif /* __LP64__ */
4694
4695 extern void vm_update_darkwake_mode(boolean_t);
4696 extern boolean_t vm_darkwake_mode;
4697
4698 STATIC int
4699 sysctl_toggle_darkwake_mode(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4700 {
4701 int new_value, changed;
4702 int error = sysctl_io_number(req, vm_darkwake_mode, sizeof(int), &new_value, &changed);
4703
4704 if (!error && changed) {
4705 if (new_value != 0 && new_value != 1) {
4706 printf("Error: Invalid value passed to darkwake sysctl. Acceptable: 0 or 1.\n");
4707 error = EINVAL;
4708 } else {
4709 vm_update_darkwake_mode((boolean_t) new_value);
4710 }
4711 }
4712
4713 return error;
4714 }
4715
4716 SYSCTL_PROC(_vm, OID_AUTO, darkwake_mode,
4717 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4718 0, 0, sysctl_toggle_darkwake_mode, "I", "");
4719
4720 #if (DEVELOPMENT || DEBUG)
4721
/* Read-only page creation throttling values. */
SYSCTL_UINT(_vm, OID_AUTO, vm_page_creation_throttled_hard,
    CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
    &vm_page_creation_throttled_hard, 0, "");

SYSCTL_UINT(_vm, OID_AUTO, vm_page_creation_throttled_soft,
    CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
    &vm_page_creation_throttled_soft, 0, "");

/* Read/write vm_pageout_memorystatus_fb_factor_{nr,dr} values. */
extern uint32_t vm_pageout_memorystatus_fb_factor_nr;
extern uint32_t vm_pageout_memorystatus_fb_factor_dr;
SYSCTL_INT(_vm, OID_AUTO, vm_pageout_memorystatus_fb_factor_nr, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_memorystatus_fb_factor_nr, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_pageout_memorystatus_fb_factor_dr, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_memorystatus_fb_factor_dr, 0, "");

/*
 * NOTE(review): this extern is not referenced by the registrations below,
 * which use the vm_pageout_debug member of the same name instead.
 */
extern uint32_t vm_grab_anon_nops;

/* Views of vm_pageout_debug members. */
SYSCTL_INT(_vm, OID_AUTO, vm_grab_anon_overrides, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_debug.vm_grab_anon_overrides, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_grab_anon_nops, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_debug.vm_grab_anon_nops, 0, "");
SYSCTL_INT(_vm, OID_AUTO, vm_pageout_yield_for_free_pages, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_debug.vm_pageout_yield_for_free_pages, 0, "");


/* vm.vm_page_needed_delayed_work_ctx is backed by vm_page_delayed_work_ctx_needed. */
extern int vm_page_delayed_work_ctx_needed;
SYSCTL_INT(_vm, OID_AUTO, vm_page_needed_delayed_work_ctx, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_delayed_work_ctx_needed, 0, "");
4744
/*
 * Declarations of the logging counters exported further down under "debug".
 * The counters themselves are defined elsewhere.
 */

/* log message counters for persistence mode */
SCALABLE_COUNTER_DECLARE(oslog_p_total_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_metadata_saved_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_metadata_dropped_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_error_count);
SCALABLE_COUNTER_DECLARE(oslog_p_saved_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_dropped_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_boot_dropped_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_coprocessor_total_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_coprocessor_dropped_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_unresolved_kc_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_fmt_invalid_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_fmt_max_args_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_p_truncated_msgcount);

/*
 * log queue counters
 * NOTE(review): log_queue_cnt_mem_active is declared here but has no
 * SYSCTL_SCALABLE_COUNTER registration in this part of the file.
 */
SCALABLE_COUNTER_DECLARE(log_queue_cnt_received);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_rejected_fh);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_sent);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_dropped_nomem);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_queued);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_dropped_off);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_active);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_allocated);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_released);
SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_failed);

/* log message counters for streaming mode */
SCALABLE_COUNTER_DECLARE(oslog_s_total_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_s_metadata_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_s_error_count);
SCALABLE_COUNTER_DECLARE(oslog_s_streamed_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_s_dropped_msgcount);

/* log message counters for msgbuf logging */
SCALABLE_COUNTER_DECLARE(oslog_msgbuf_msgcount);
SCALABLE_COUNTER_DECLARE(oslog_msgbuf_dropped_msgcount);
/* Unlike the counters above, the dropped character count is a plain uint32_t. */
extern uint32_t oslog_msgbuf_dropped_charcount;
4782
/*
 * Export the logging counters under "debug".  Every node carries the same
 * name as the counter backing it.
 */

/* Persistence mode counters. */
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_total_msgcount, oslog_p_total_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_metadata_saved_msgcount, oslog_p_metadata_saved_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_metadata_dropped_msgcount, oslog_p_metadata_dropped_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_error_count, oslog_p_error_count, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_saved_msgcount, oslog_p_saved_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_dropped_msgcount, oslog_p_dropped_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_boot_dropped_msgcount, oslog_p_boot_dropped_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_coprocessor_total_msgcount, oslog_p_coprocessor_total_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_coprocessor_dropped_msgcount, oslog_p_coprocessor_dropped_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_unresolved_kc_msgcount, oslog_p_unresolved_kc_msgcount, "");

SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_fmt_invalid_msgcount, oslog_p_fmt_invalid_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_fmt_max_args_msgcount, oslog_p_fmt_max_args_msgcount, "");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_truncated_msgcount, oslog_p_truncated_msgcount, "");

/* Streaming mode counters. */
SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_total_msgcount, oslog_s_total_msgcount, "Number of logs sent to streaming");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_metadata_msgcount, oslog_s_metadata_msgcount, "Number of metadata sent to streaming");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_error_count, oslog_s_error_count, "Number of invalid stream logs");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_streamed_msgcount, oslog_s_streamed_msgcount, "Number of streamed logs");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_dropped_msgcount, oslog_s_dropped_msgcount, "Number of logs dropped from stream");

/* msgbuf (dmesg) counters; the character count is readable by anybody. */
SYSCTL_SCALABLE_COUNTER(_debug, oslog_msgbuf_msgcount, oslog_msgbuf_msgcount, "Number of dmesg log messages");
SYSCTL_SCALABLE_COUNTER(_debug, oslog_msgbuf_dropped_msgcount, oslog_msgbuf_dropped_msgcount, "Number of dropped dmesg log messages");
SYSCTL_UINT(_debug, OID_AUTO, oslog_msgbuf_dropped_charcount, CTLFLAG_ANYBODY | CTLFLAG_RD | CTLFLAG_LOCKED, &oslog_msgbuf_dropped_charcount, 0, "Number of dropped dmesg log chars");

/* Log queue counters. */
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_received, log_queue_cnt_received, "Number of received logs");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_rejected_fh, log_queue_cnt_rejected_fh, "Number of logs initially rejected by FH");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_sent, log_queue_cnt_sent, "Number of logs successfully saved in FH");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_dropped_nomem, log_queue_cnt_dropped_nomem, "Number of logs dropped due to lack of queue memory");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_queued, log_queue_cnt_queued, "Current number of logs stored in log queues");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_dropped_off, log_queue_cnt_dropped_off, "Number of logs dropped due to disabled log queues");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_mem_allocated, log_queue_cnt_mem_allocated, "Number of memory allocations");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_mem_released, log_queue_cnt_mem_released, "Number of memory releases");
SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_mem_failed, log_queue_cnt_mem_failed, "Number of failed memory allocations");
4817
4818 #endif /* DEVELOPMENT || DEBUG */
4819
/*
 * Enable tracing of voucher contents
 *
 * kern.ipc_voucher_trace_contents is a read/write view of the
 * ipc_voucher_trace_contents variable, which is defined elsewhere.
 */
extern uint32_t ipc_voucher_trace_contents;

SYSCTL_INT(_kern, OID_AUTO, ipc_voucher_trace_contents,
    CTLFLAG_RW | CTLFLAG_LOCKED, &ipc_voucher_trace_contents, 0, "Enable tracing voucher contents");
4827
/*
 * Kernel stack size and depth
 *
 * Both nodes are read-only.  The backing variables are cast to (int *) for
 * SYSCTL_INT; their declared types are not visible in this part of the file.
 */
SYSCTL_INT(_kern, OID_AUTO, stack_size,
    CTLFLAG_RD | CTLFLAG_LOCKED, (int *) &kernel_stack_size, 0, "Kernel stack size");
SYSCTL_INT(_kern, OID_AUTO, stack_depth_max,
    CTLFLAG_RD | CTLFLAG_LOCKED, (int *) &kernel_stack_depth_max, 0, "Max kernel stack depth at interrupt or context switch");

/* Read-only view of the kernel feature override mask. */
extern unsigned int kern_feature_overrides;
SYSCTL_INT(_kern, OID_AUTO, kern_feature_overrides,
    CTLFLAG_RD | CTLFLAG_LOCKED, &kern_feature_overrides, 0, "Kernel feature override mask");
4839
/*
 * enable back trace for port allocations
 *
 * kern.ipc_portbt is a read/write view of the ipc_portbt variable, which is
 * defined elsewhere.
 */
extern int ipc_portbt;

SYSCTL_INT(_kern, OID_AUTO, ipc_portbt,
    CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
    &ipc_portbt, 0, "");
4848
4849 /*
4850 * Mach message signature validation control and outputs
4851 */
4852 extern unsigned int ikm_signature_failures;
4853 SYSCTL_INT(_kern, OID_AUTO, ikm_signature_failures,
4854 CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_failures, 0, "Message signature failure count");
4855 extern unsigned int ikm_signature_failure_id;
4856 SYSCTL_INT(_kern, OID_AUTO, ikm_signature_failure_id,
4857 CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_failure_id, 0, "Message signature failure count");
4858
#if (DEVELOPMENT || DEBUG)
/*
 * Additional message signature nodes, only built on DEVELOPMENT/DEBUG
 * kernels: one writable knob (ikm_signature_panic_disable) and two read-only
 * failure counts for headers and trailers.
 */
extern unsigned int ikm_signature_panic_disable;
SYSCTL_INT(_kern, OID_AUTO, ikm_signature_panic_disable,
    CTLFLAG_RW | CTLFLAG_LOCKED, &ikm_signature_panic_disable, 0, "Message signature failure mode");
extern unsigned int ikm_signature_header_failures;
SYSCTL_INT(_kern, OID_AUTO, ikm_signature_header_failures,
    CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_header_failures, 0, "Message header signature failure count");
extern unsigned int ikm_signature_trailer_failures;
SYSCTL_INT(_kern, OID_AUTO, ikm_signature_trailer_failures,
    CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_trailer_failures, 0, "Message trailer signature failure count");
#endif
4870
/*
 * Scheduler sysctls
 */

/* kern.sched: read-only string backed by the sched_string buffer. */
SYSCTL_STRING(_kern, OID_AUTO, sched,
    CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
    sched_string, sizeof(sched_string),
    "Timeshare scheduler implementation");
4879
4880 static int
4881 sysctl_cpu_quiescent_counter_interval SYSCTL_HANDLER_ARGS
4882 {
4883 #pragma unused(arg1, arg2)
4884
4885 uint32_t local_min_interval_us = smr_cpu_checkin_get_min_interval_us();
4886
4887 int error = sysctl_handle_int(oidp, &local_min_interval_us, 0, req);
4888 if (error || !req->newptr) {
4889 return error;
4890 }
4891
4892 smr_cpu_checkin_set_min_interval_us(local_min_interval_us);
4893
4894 return 0;
4895 }
4896
4897 SYSCTL_PROC(_kern, OID_AUTO, cpu_checkin_interval,
4898 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
4899 0, 0,
4900 sysctl_cpu_quiescent_counter_interval, "I",
4901 "Quiescent CPU checkin interval (microseconds)");
4902
4903 /*
4904 * Allow the precise user/kernel time sysctl to be set, but don't allow it to
4905 * affect anything. Some tools expect to be able to set this, even though
4906 * runtime configuration is no longer supported.
4907 */
4908
4909 static int
4910 sysctl_precise_user_kernel_time SYSCTL_HANDLER_ARGS
4911 {
4912 #if PRECISE_USER_KERNEL_TIME
4913 int dummy_set = 1;
4914 #else /* PRECISE_USER_KERNEL_TIME */
4915 int dummy_set = 0;
4916 #endif /* !PRECISE_USER_KERNEL_TIME */
4917 return sysctl_handle_int(oidp, &dummy_set, 0, req);
4918 }
4919
4920 SYSCTL_PROC(_kern, OID_AUTO, precise_user_kernel_time,
4921 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
4922 0, 0, sysctl_precise_user_kernel_time, "I",
4923 "Precise accounting of kernel vs. user time (deprecated)");
4924
/*
 * kern.pervasive_energy: read-only flag fixed at build time.  It is 1 only
 * when both CONFIG_PERVASIVE_ENERGY and HAS_CPU_DPE_COUNTER are set.
 */
#if CONFIG_PERVASIVE_ENERGY && HAS_CPU_DPE_COUNTER
__security_const_late static int pervasive_energy = 1;
#else /* CONFIG_PERVASIVE_ENERGY && HAS_CPU_DPE_COUNTER */
__security_const_late static int pervasive_energy = 0;
#endif /* !CONFIG_PERVASIVE_ENERGY || !HAS_CPU_DPE_COUNTER */

SYSCTL_INT(_kern, OID_AUTO, pervasive_energy,
    CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED, &pervasive_energy, 0, "");
4933
4934 /* Parameters related to timer coalescing tuning, to be replaced
4935 * with a dedicated systemcall in the future.
4936 */
4937 /* Enable processing pending timers in the context of any other interrupt
4938 * Coalescing tuning parameters for various thread/task attributes */
4939 STATIC int
4940 sysctl_timer_user_us_kernel_abstime SYSCTL_HANDLER_ARGS
4941 {
4942 #pragma unused(oidp)
4943 int size = arg2; /* subcommand*/
4944 int error;
4945 int changed = 0;
4946 uint64_t old_value_ns;
4947 uint64_t new_value_ns;
4948 uint64_t value_abstime;
4949 if (size == sizeof(uint32_t)) {
4950 value_abstime = *((uint32_t *)arg1);
4951 } else if (size == sizeof(uint64_t)) {
4952 value_abstime = *((uint64_t *)arg1);
4953 } else {
4954 return ENOTSUP;
4955 }
4956
4957 absolutetime_to_nanoseconds(value_abstime, &old_value_ns);
4958 error = sysctl_io_number(req, old_value_ns, sizeof(old_value_ns), &new_value_ns, &changed);
4959 if ((error) || (!changed)) {
4960 return error;
4961 }
4962
4963 nanoseconds_to_absolutetime(new_value_ns, &value_abstime);
4964 if (size == sizeof(uint32_t)) {
4965 *((uint32_t *)arg1) = (uint32_t)value_abstime;
4966 } else {
4967 *((uint64_t *)arg1) = value_abstime;
4968 }
4969 return error;
4970 }
4971
/*
 * Timer coalescing tunables backed by tcoal_prio_params.
 *
 * "*_scale" nodes are plain integer views of the matching "*_shift" member.
 * "*_ns" / "*_ns_max" nodes go through sysctl_timer_user_us_kernel_abstime,
 * with arg1 pointing at the "*_abstime" / "*_abstime_max" member and arg2
 * carrying its size.
 */
SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_bg_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_bg_shift, 0, "");
SYSCTL_PROC(_kern, OID_AUTO, timer_resort_threshold_ns,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_resort_threshold_abstime,
    sizeof(tcoal_prio_params.timer_resort_threshold_abstime),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");
SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_bg_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_bg_abstime_max,
    sizeof(tcoal_prio_params.timer_coalesce_bg_abstime_max),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");
4987
/*
 * Scale / ns_max pairs for the "kt", "fp" and "ts" members of
 * tcoal_prio_params.  Each scale node exposes the *_shift member directly;
 * each ns_max node is served by sysctl_timer_user_us_kernel_abstime.
 */
SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_kt_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_kt_shift, 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_kt_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_kt_abstime_max,
    sizeof(tcoal_prio_params.timer_coalesce_kt_abstime_max),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");

SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_fp_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_fp_shift, 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_fp_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_fp_abstime_max,
    sizeof(tcoal_prio_params.timer_coalesce_fp_abstime_max),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");

SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_ts_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_ts_shift, 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_ts_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.timer_coalesce_ts_abstime_max,
    sizeof(tcoal_prio_params.timer_coalesce_ts_abstime_max),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");
5020
/*
 * Per-tier scale / ns_max pairs for tiers 0 through 5.  Tier N maps onto
 * index N of tcoal_prio_params.latency_qos_scale[] and
 * tcoal_prio_params.latency_qos_abstime_max[].
 */
SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier0_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_scale[0], 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier0_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_abstime_max[0],
    sizeof(tcoal_prio_params.latency_qos_abstime_max[0]),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");

SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier1_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_scale[1], 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier1_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_abstime_max[1],
    sizeof(tcoal_prio_params.latency_qos_abstime_max[1]),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");

SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier2_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_scale[2], 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier2_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_abstime_max[2],
    sizeof(tcoal_prio_params.latency_qos_abstime_max[2]),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");

SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier3_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_scale[3], 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier3_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_abstime_max[3],
    sizeof(tcoal_prio_params.latency_qos_abstime_max[3]),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");

SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier4_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_scale[4], 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier4_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_abstime_max[4],
    sizeof(tcoal_prio_params.latency_qos_abstime_max[4]),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");

SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier5_scale,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_scale[5], 0, "");

SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier5_ns_max,
    CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &tcoal_prio_params.latency_qos_abstime_max[5],
    sizeof(tcoal_prio_params.latency_qos_abstime_max[5]),
    sysctl_timer_user_us_kernel_abstime,
    "Q", "");
5086
5087 /* Communicate the "user idle level" heuristic to the timer layer, and
5088 * potentially other layers in the future.
5089 */
5090
5091 static int
5092 timer_user_idle_level(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
5093 {
5094 int new_value = 0, old_value = 0, changed = 0, error;
5095
5096 old_value = timer_get_user_idle_level();
5097
5098 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
5099
5100 if (error == 0 && changed) {
5101 if (timer_set_user_idle_level(new_value) != KERN_SUCCESS) {
5102 error = ERANGE;
5103 }
5104 }
5105
5106 return error;
5107 }
5108
5109 SYSCTL_PROC(_machdep, OID_AUTO, user_idle_level,
5110 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
5111 0, 0,
5112 timer_user_idle_level, "I", "User idle level heuristic, 0-128");
5113
#if DEVELOPMENT || DEBUG
/*
 * Basic console mode for games; used for development purposes only.
 * Final implementation for this feature (with possible removal of
 * sysctl) tracked via rdar://101215873.
 *
 * The flag is a file-local int starting at 0.  In the code visible here it
 * is only reachable through this masked, read/write sysctl node.
 */
static int console_mode = 0;
SYSCTL_INT(_kern, OID_AUTO, console_mode,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_MASKED,
    &console_mode, 0, "Game Console Mode");
#endif /* DEVELOPMENT || DEBUG */
5125
5126
#if HYPERVISOR
/*
 * Hypervisor nodes, only built when HYPERVISOR is set:
 * kern.hv_support is a read-only view of hv_support_available and
 * kern.hv_disable is a read/write view of hv_disable.
 */
SYSCTL_INT(_kern, OID_AUTO, hv_support,
    CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
    &hv_support_available, 0, "");

SYSCTL_INT(_kern, OID_AUTO, hv_disable,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &hv_disable, 0, "");

#endif /* HYPERVISOR */
5137
#if DEVELOPMENT || DEBUG
/*
 * kern.driverkit_checkin_timed_out: read/write 64-bit view of the
 * driverkit_checkin_timed_out variable (defined elsewhere), only built on
 * DEVELOPMENT/DEBUG kernels.
 */
extern uint64_t driverkit_checkin_timed_out;
SYSCTL_QUAD(_kern, OID_AUTO, driverkit_checkin_timed_out,
    CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
    &driverkit_checkin_timed_out, "timestamp of dext checkin timeout");
#endif
5144
#if CONFIG_DARKBOOT
/*
 * kern.darkboot handler.
 *
 * Reads report the current 'darkboot' value.  Writes require the
 * PRIV_DARKBOOT privilege (EPERM otherwise) and carry one of the
 * MEMORY_MAINTENANCE_DARK_BOOT_* request identifiers:
 *
 *   UNSET          - if darkboot is set, remove the NVRAM property and clear
 *                    darkboot; EINVAL if the removal fails.
 *   SET            - set darkboot to 1 without touching NVRAM.
 *   SET_PERSISTENT - write the NVRAM property and set darkboot to 1;
 *                    EINVAL (darkboot untouched) if the write fails.
 *
 * Any other identifier yields EINVAL.  Errors from sysctl_io_number() are
 * returned unchanged.
 */
STATIC int
sysctl_darkboot SYSCTL_HANDLER_ARGS
{
	int status = 0, request = 0;
#pragma unused(oidp, arg1, arg2, status, request, req)

	/*
	 * Copy the current darkboot value out and, for a write, fetch the
	 * request identifier into "request".
	 */
	status = sysctl_io_number(req, darkboot, sizeof(int), &request, NULL);
	if (status != 0) {
		return status;
	}

	/* Pure read: nothing else to do. */
	if (!req->newptr) {
		return status;
	}

	/* writing is protected by an entitlement */
	if (priv_check_cred(kauth_cred_get(), PRIV_DARKBOOT, 0) != 0) {
		return EPERM;
	}

	switch (request) {
	case MEMORY_MAINTENANCE_DARK_BOOT_UNSET:
		/*
		 * If the darkboot sysctl is unset, the NVRAM variable
		 * must be unset too. If that's not the case, it means
		 * someone is doing something crazy and not supported.
		 */
		if (darkboot == 0) {
			break;
		}
		if (PERemoveNVRAMProperty(MEMORY_MAINTENANCE_DARK_BOOT_NVRAM_NAME)) {
			darkboot = 0;
		} else {
			status = EINVAL;
		}
		break;

	case MEMORY_MAINTENANCE_DARK_BOOT_SET:
		darkboot = 1;
		break;

	case MEMORY_MAINTENANCE_DARK_BOOT_SET_PERSISTENT:
		/*
		 * Only update 'darkboot' once the NVRAM write has
		 * succeeded; otherwise report the failure.
		 */
		if (!PEWriteNVRAMBooleanProperty(MEMORY_MAINTENANCE_DARK_BOOT_NVRAM_NAME, TRUE)) {
			status = EINVAL;
		} else {
			darkboot = 1;
		}
		break;

	default:
		status = EINVAL;
	}

	return status;
}

SYSCTL_PROC(_kern, OID_AUTO, darkboot,
    CTLFLAG_KERN | CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY,
    0, 0, sysctl_darkboot, "I", "");
#endif /* CONFIG_DARKBOOT */
5216
#if DEVELOPMENT || DEBUG
#include <sys/sysent.h>
/*
 * kern.sysent_const_check: deliberately attempts a store to sysent[0].
 *
 * This should result in a fatal exception, verifying that "sysent" is
 * write-protected.  The store is only attempted when a write to the node
 * changes the value (reads always report 0); if execution continues past the
 * store, a message saying so is printed.
 *
 * Returns the status of sysctl_io_number().
 */
static int
kern_sysent_write(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
{
	uint64_t new_value = 0, old_value = 0;
	int changed = 0, error;

	error = sysctl_io_number(req, old_value, sizeof(uint64_t), &new_value, &changed);
	if ((error == 0) && changed) {
		/* Strip const so the compiler lets us attempt the write. */
		volatile uint32_t *wraddr = __DECONST(uint32_t *, &sysent[0]);
		*wraddr = 0;
		printf("sysent[0] write succeeded\n");
	}
	return error;
}

/*
 * The handler transfers a 64-bit value and the node is CTLTYPE_QUAD, so the
 * format string is "Q", matching the other quad nodes in this file.
 */
SYSCTL_PROC(_kern, OID_AUTO, sysent_const_check,
    CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
    0, 0,
    kern_sysent_write, "Q", "Attempt sysent[0] write");

#endif
5243
/*
 * kern.development: masked, read-only constant with no backing variable
 * (NULL pointer).  The value is 1 on DEVELOPMENT/DEBUG builds and 0
 * otherwise; the DEVELOPMENT/DEBUG variant additionally sets CTLFLAG_KERN.
 */
#if DEVELOPMENT || DEBUG
SYSCTL_COMPAT_INT(_kern, OID_AUTO, development, CTLFLAG_RD | CTLFLAG_MASKED | CTLFLAG_KERN, NULL, 1, "");
#else
SYSCTL_COMPAT_INT(_kern, OID_AUTO, development, CTLFLAG_RD | CTLFLAG_MASKED, NULL, 0, "");
#endif
5249
5250
5251 #if DEVELOPMENT || DEBUG
5252
5253 decl_lck_spin_data(, spinlock_panic_test_lock);
5254
5255 __attribute__((noreturn))
5256 static void
5257 spinlock_panic_test_acquire_spinlock(void * arg __unused, wait_result_t wres __unused)
5258 {
5259 lck_spin_lock(&spinlock_panic_test_lock);
5260 while (1) {
5261 ;
5262 }
5263 }
5264
5265 static int
5266 sysctl_spinlock_panic_test SYSCTL_HANDLER_ARGS
5267 {
5268 #pragma unused(oidp, arg1, arg2)
5269 if (req->newlen == 0) {
5270 return EINVAL;
5271 }
5272
5273 thread_t panic_spinlock_thread;
5274 /* Initialize panic spinlock */
5275 lck_grp_t * panic_spinlock_grp;
5276 lck_grp_attr_t * panic_spinlock_grp_attr;
5277 lck_attr_t * panic_spinlock_attr;
5278
5279 panic_spinlock_grp_attr = lck_grp_attr_alloc_init();
5280 panic_spinlock_grp = lck_grp_alloc_init("panic_spinlock", panic_spinlock_grp_attr);
5281 panic_spinlock_attr = lck_attr_alloc_init();
5282
5283 lck_spin_init(&spinlock_panic_test_lock, panic_spinlock_grp, panic_spinlock_attr);
5284
5285
5286 /* Create thread to acquire spinlock */
5287 if (kernel_thread_start(spinlock_panic_test_acquire_spinlock, NULL, &panic_spinlock_thread) != KERN_SUCCESS) {
5288 return EBUSY;
5289 }
5290
5291 /* Try to acquire spinlock -- should panic eventually */
5292 lck_spin_lock(&spinlock_panic_test_lock);
5293 while (1) {
5294 ;
5295 }
5296 }
5297
5298 __attribute__((noreturn))
5299 static void
5300 simultaneous_panic_worker
5301 (void * arg, wait_result_t wres __unused)
5302 {
5303 atomic_int *start_panic = (atomic_int *)arg;
5304
5305 while (!atomic_load(start_panic)) {
5306 ;
5307 }
5308 panic("SIMULTANEOUS PANIC TEST: INITIATING PANIC FROM CPU %d", cpu_number());
5309 __builtin_unreachable();
5310 }
5311
5312 static int
5313 sysctl_simultaneous_panic_test SYSCTL_HANDLER_ARGS
5314 {
5315 #pragma unused(oidp, arg1, arg2)
5316 if (req->newlen == 0) {
5317 return EINVAL;
5318 }
5319
5320 int i = 0, threads_to_create = 2 * processor_count;
5321 atomic_int start_panic = 0;
5322 unsigned int threads_created = 0;
5323 thread_t new_panic_thread;
5324
5325 for (i = threads_to_create; i > 0; i--) {
5326 if (kernel_thread_start(simultaneous_panic_worker, (void *) &start_panic, &new_panic_thread) == KERN_SUCCESS) {
5327 threads_created++;
5328 }
5329 }
5330
5331 /* FAIL if we couldn't create at least processor_count threads */
5332 if (threads_created < processor_count) {
5333 panic("SIMULTANEOUS PANIC TEST: FAILED TO CREATE ENOUGH THREADS, ONLY CREATED %d (of %d)",
5334 threads_created, threads_to_create);
5335 }
5336
5337 atomic_exchange(&start_panic, 1);
5338 while (1) {
5339 ;
5340 }
5341 }
5342
/*
 * Knobs for the panic/debugger tests. The three integers are defined outside
 * this part of the file and are exposed read-write under the debug node.
 */
extern unsigned int panic_test_failure_mode;
SYSCTL_INT(_debug, OID_AUTO, xnu_panic_failure_mode, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_KERN, &panic_test_failure_mode, 0, "panic/debugger test failure mode");

extern unsigned int panic_test_action_count;
SYSCTL_INT(_debug, OID_AUTO, xnu_panic_action_count, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_KERN, &panic_test_action_count, 0, "panic/debugger test action count");

extern unsigned int panic_test_case;
SYSCTL_INT(_debug, OID_AUTO, xnu_panic_test_case, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_KERN, &panic_test_case, 0, "panic/debugger testcase");

/*
 * Triggers for the spinlock and simultaneous panic tests. Both handlers act
 * only when a new value is written.
 */
SYSCTL_PROC(_debug, OID_AUTO, xnu_spinlock_panic_test, CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_MASKED, 0, 0, sysctl_spinlock_panic_test, "A", "spinlock panic test");
SYSCTL_PROC(_debug, OID_AUTO, xnu_simultaneous_panic_test, CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_MASKED, 0, 0, sysctl_simultaneous_panic_test, "A", "simultaneous panic test");
5354
/* kern.exc_resource_threads_enabled: read-write view of the externally defined flag. */
extern int exc_resource_threads_enabled;
SYSCTL_INT(_kern, OID_AUTO, exc_resource_threads_enabled, CTLFLAG_RW | CTLFLAG_LOCKED, &exc_resource_threads_enabled, 0, "exc_resource thread limit enabled");
5357
5358
5359 #endif /* DEVELOPMENT || DEBUG */
5360
/*
 * kern.link_time_optimized: read-only flag, 1 when BUILT_LTO is set at
 * compile time and 0 otherwise.
 */
#if BUILT_LTO
static int _built_lto = 1;
#else // BUILT_LTO
static int _built_lto = 0;
#endif // !BUILT_LTO

SYSCTL_INT(_kern, OID_AUTO, link_time_optimized, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN, &_built_lto, 0, "Whether the kernel was built with Link Time Optimization enabled");
5368
5369 #if CONFIG_THREAD_GROUPS
5370 #if DEVELOPMENT || DEBUG
5371
5372 static int
5373 sysctl_get_thread_group_id SYSCTL_HANDLER_ARGS
5374 {
5375 #pragma unused(arg1, arg2, oidp)
5376 uint64_t thread_group_id = thread_group_get_id(thread_group_get(current_thread()));
5377 return SYSCTL_OUT(req, &thread_group_id, sizeof(thread_group_id));
5378 }
5379
5380 SYSCTL_PROC(_kern, OID_AUTO, thread_group_id, CTLFLAG_RD | CTLFLAG_LOCKED | CTLTYPE_QUAD,
5381 0, 0, &sysctl_get_thread_group_id, "I", "thread group id of the thread");
5382
5383 STATIC int
5384 sysctl_thread_group_count(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
5385 {
5386 int value = thread_group_count();
5387 return sysctl_io_number(req, value, sizeof(value), NULL, NULL);
5388 }
5389
5390 SYSCTL_PROC(_kern, OID_AUTO, thread_group_count, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
5391 0, 0, &sysctl_thread_group_count, "I", "count of thread groups");
5392
5393 #endif /* DEVELOPMENT || DEBUG */
/* CONFIG_THREAD_GROUPS is set: report thread groups as supported. */
const uint32_t thread_groups_supported = 1;
5395 #else /* CONFIG_THREAD_GROUPS */
/* CONFIG_THREAD_GROUPS is not set: report thread groups as unsupported. */
const uint32_t thread_groups_supported = 0;
5397 #endif /* CONFIG_THREAD_GROUPS */
5398
5399 STATIC int
5400 sysctl_thread_groups_supported(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
5401 {
5402 int value = thread_groups_supported;
5403 return sysctl_io_number(req, value, sizeof(value), NULL, NULL);
5404 }
5405
5406 SYSCTL_PROC(_kern, OID_AUTO, thread_groups_supported, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
5407 0, 0, &sysctl_thread_groups_supported, "I", "thread groups supported");
5408
5409 static int
5410 sysctl_grade_cputype SYSCTL_HANDLER_ARGS
5411 {
5412 #pragma unused(arg1, arg2, oidp)
5413 int error = 0;
5414 int type_tuple[2] = {};
5415 int return_value = 0;
5416
5417 error = SYSCTL_IN(req, &type_tuple, sizeof(type_tuple));
5418
5419 if (error) {
5420 return error;
5421 }
5422
5423 return_value = grade_binary(type_tuple[0], type_tuple[1] & ~CPU_SUBTYPE_MASK, type_tuple[1] & CPU_SUBTYPE_MASK, FALSE);
5424
5425 error = SYSCTL_OUT(req, &return_value, sizeof(return_value));
5426
5427 if (error) {
5428 return error;
5429 }
5430
5431 return error;
5432 }
5433
5434 SYSCTL_PROC(_kern, OID_AUTO, grade_cputype,
5435 CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_MASKED | CTLFLAG_LOCKED | CTLTYPE_OPAQUE,
5436 0, 0, &sysctl_grade_cputype, "S",
5437 "grade value of cpu_type_t+cpu_sub_type_t");
5438
/* kern.direct_handoff: read-write view of the externally defined allow_direct_handoff. */
extern boolean_t allow_direct_handoff;
SYSCTL_INT(_kern, OID_AUTO, direct_handoff,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &allow_direct_handoff, 0, "Enable direct handoff for realtime threads");
5443
5444 #if DEVELOPMENT || DEBUG
5445
/*
 * Read-only 64-bit sysctls describing the phys_carveout_mb boot-arg region:
 * its base physical address and its size in bytes.
 */
SYSCTL_QUAD(_kern, OID_AUTO, phys_carveout_pa, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
    &phys_carveout_pa,
    "base physical address of the phys_carveout_mb boot-arg region");
SYSCTL_QUAD(_kern, OID_AUTO, phys_carveout_size, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
    &phys_carveout_size,
    "size in bytes of the phys_carveout_mb boot-arg region");
5452
5453
5454 extern void do_cseg_wedge_thread(void);
5455 extern void do_cseg_unwedge_thread(void);
5456
5457 static int
5458 cseg_wedge_thread SYSCTL_HANDLER_ARGS
5459 {
5460 #pragma unused(arg1, arg2)
5461
5462 int error, val = 0;
5463 error = sysctl_handle_int(oidp, &val, 0, req);
5464 if (error || val == 0) {
5465 return error;
5466 }
5467
5468 do_cseg_wedge_thread();
5469 return 0;
5470 }
5471 SYSCTL_PROC(_kern, OID_AUTO, cseg_wedge_thread, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_MASKED, 0, 0, cseg_wedge_thread, "I", "wedge c_seg thread");
5472
5473 static int
5474 cseg_unwedge_thread SYSCTL_HANDLER_ARGS
5475 {
5476 #pragma unused(arg1, arg2)
5477
5478 int error, val = 0;
5479 error = sysctl_handle_int(oidp, &val, 0, req);
5480 if (error || val == 0) {
5481 return error;
5482 }
5483
5484 do_cseg_unwedge_thread();
5485 return 0;
5486 }
5487 SYSCTL_PROC(_kern, OID_AUTO, cseg_unwedge_thread, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_MASKED, 0, 0, cseg_unwedge_thread, "I", "unstuck c_seg thread");
5488
5489 static atomic_int wedge_thread_should_wake = 0;
5490
5491 static int
5492 unwedge_thread SYSCTL_HANDLER_ARGS
5493 {
5494 #pragma unused(arg1, arg2)
5495 int error, val = 0;
5496 error = sysctl_handle_int(oidp, &val, 0, req);
5497 if (error || val == 0) {
5498 return error;
5499 }
5500
5501 atomic_store(&wedge_thread_should_wake, 1);
5502 return 0;
5503 }
5504
5505 SYSCTL_PROC(_kern, OID_AUTO, unwedge_thread, CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED, 0, 0, unwedge_thread, "I", "unwedge the thread wedged by kern.wedge_thread");
5506
5507 static int
5508 wedge_thread SYSCTL_HANDLER_ARGS
5509 {
5510 #pragma unused(arg1, arg2)
5511
5512 int error, val = 0;
5513 error = sysctl_handle_int(oidp, &val, 0, req);
5514 if (error || val == 0) {
5515 return error;
5516 }
5517
5518 uint64_t interval = 1;
5519 nanoseconds_to_absolutetime(1000 * 1000 * 50, &interval);
5520
5521 atomic_store(&wedge_thread_should_wake, 0);
5522 while (!atomic_load(&wedge_thread_should_wake)) {
5523 tsleep1(NULL, 0, "wedge_thread", mach_absolute_time() + interval, NULL);
5524 }
5525
5526 return 0;
5527 }
5528
5529 SYSCTL_PROC(_kern, OID_AUTO, wedge_thread,
5530 CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED, 0, 0, wedge_thread, "I",
5531 "wedge this thread so it cannot be cleaned up");
5532
5533 static int
5534 sysctl_total_corpses_count SYSCTL_HANDLER_ARGS
5535 {
5536 #pragma unused(oidp, arg1, arg2)
5537 extern unsigned long total_corpses_count(void);
5538
5539 unsigned long corpse_count_long = total_corpses_count();
5540 unsigned int corpse_count = (unsigned int)MIN(corpse_count_long, UINT_MAX);
5541 return sysctl_io_opaque(req, &corpse_count, sizeof(corpse_count), NULL);
5542 }
5543
5544 SYSCTL_PROC(_kern, OID_AUTO, total_corpses_count,
5545 CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_LOCKED, 0, 0,
5546 sysctl_total_corpses_count, "I", "total corpses on the system");
5547
/*
 * Forward declarations for the turnstile primitive test handlers and for the
 * tstile_test_prim_* routines they call (not defined in this part of the
 * file).
 */
static int
sysctl_turnstile_test_prim_lock SYSCTL_HANDLER_ARGS;
static int
sysctl_turnstile_test_prim_unlock SYSCTL_HANDLER_ARGS;
int
tstile_test_prim_lock(boolean_t use_hashtable);
int
tstile_test_prim_unlock(boolean_t use_hashtable);
5556
5557 static int
5558 sysctl_turnstile_test_prim_lock SYSCTL_HANDLER_ARGS
5559 {
5560 #pragma unused(arg1, arg2)
5561 int error, val = 0;
5562 error = sysctl_handle_int(oidp, &val, 0, req);
5563 if (error || val == 0) {
5564 return error;
5565 }
5566 switch (val) {
5567 case SYSCTL_TURNSTILE_TEST_USER_DEFAULT:
5568 case SYSCTL_TURNSTILE_TEST_USER_HASHTABLE:
5569 case SYSCTL_TURNSTILE_TEST_KERNEL_DEFAULT:
5570 case SYSCTL_TURNSTILE_TEST_KERNEL_HASHTABLE:
5571 return tstile_test_prim_lock(val);
5572 default:
5573 return error;
5574 }
5575 }
5576
5577 static int
5578 sysctl_turnstile_test_prim_unlock SYSCTL_HANDLER_ARGS
5579 {
5580 #pragma unused(arg1, arg2)
5581 int error, val = 0;
5582 error = sysctl_handle_int(oidp, &val, 0, req);
5583 if (error || val == 0) {
5584 return error;
5585 }
5586 switch (val) {
5587 case SYSCTL_TURNSTILE_TEST_USER_DEFAULT:
5588 case SYSCTL_TURNSTILE_TEST_USER_HASHTABLE:
5589 case SYSCTL_TURNSTILE_TEST_KERNEL_DEFAULT:
5590 case SYSCTL_TURNSTILE_TEST_KERNEL_HASHTABLE:
5591 return tstile_test_prim_unlock(val);
5592 default:
5593 return error;
5594 }
5595 }
5596
/*
 * Write-only test sysctls kern.turnstiles_test_lock and
 * kern.turnstiles_test_unlock, serviced by sysctl_turnstile_test_prim_lock()
 * and sysctl_turnstile_test_prim_unlock() respectively.
 */
SYSCTL_PROC(_kern, OID_AUTO, turnstiles_test_lock, CTLFLAG_WR | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
    0, 0, sysctl_turnstile_test_prim_lock, "I", "turnstiles test lock");

SYSCTL_PROC(_kern, OID_AUTO, turnstiles_test_unlock, CTLFLAG_WR | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
    0, 0, sysctl_turnstile_test_prim_unlock, "I", "turnstiles test unlock");
5602
/*
 * Declarations for the turnstile statistics sysctls: the two externally
 * defined stats routines (which take the sysctl request as an untyped
 * pointer), the local handlers that wrap them, and the two block counters
 * exported as 64-bit sysctls.
 */
int
turnstile_get_boost_stats_sysctl(void *req);
int
turnstile_get_unboost_stats_sysctl(void *req);
static int
sysctl_turnstile_boost_stats SYSCTL_HANDLER_ARGS;
static int
sysctl_turnstile_unboost_stats SYSCTL_HANDLER_ARGS;
extern uint64_t thread_block_on_turnstile_count;
extern uint64_t thread_block_on_regular_waitq_count;
5613
5614 static int
5615 sysctl_turnstile_boost_stats SYSCTL_HANDLER_ARGS
5616 {
5617 #pragma unused(arg1, arg2, oidp)
5618 return turnstile_get_boost_stats_sysctl(req);
5619 }
5620
5621 static int
5622 sysctl_turnstile_unboost_stats SYSCTL_HANDLER_ARGS
5623 {
5624 #pragma unused(arg1, arg2, oidp)
5625 return turnstile_get_unboost_stats_sysctl(req);
5626 }
5627
/*
 * Read-only turnstile statistics: two struct-typed sysctls backed by the
 * boost/unboost handlers, and two 64-bit counters of threads blocked on a
 * turnstile versus on a regular waitq.
 */
SYSCTL_PROC(_kern, OID_AUTO, turnstile_boost_stats, CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLTYPE_STRUCT,
    0, 0, sysctl_turnstile_boost_stats, "S", "turnstiles boost stats");
SYSCTL_PROC(_kern, OID_AUTO, turnstile_unboost_stats, CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLTYPE_STRUCT,
    0, 0, sysctl_turnstile_unboost_stats, "S", "turnstiles unboost stats");
SYSCTL_QUAD(_kern, OID_AUTO, thread_block_count_on_turnstile,
    CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
    &thread_block_on_turnstile_count, "thread blocked on turnstile count");
SYSCTL_QUAD(_kern, OID_AUTO, thread_block_count_on_reg_waitq,
    CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
    &thread_block_on_regular_waitq_count, "thread blocked on regular waitq count");
5638
5639 #if CONFIG_PV_TICKET
5640
/* kern.ticket_lock_spins: read-write view of the externally defined ticket_lock_spins. */
extern int ticket_lock_spins;
SYSCTL_INT(_kern, OID_AUTO, ticket_lock_spins,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    &ticket_lock_spins, 0, "loops before hypercall");
5645
5646 #if (DEBUG || DEVELOPMENT)
5647
/*
 * PV ticket lock stats.
 *
 * Each entry publishes one counter under the kern node; the counters
 * themselves are not defined in this part of the file.
 */

SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_kicks, ticket_kick_count,
    "ticket lock kicks");
SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_waits, ticket_wait_count,
    "ticket lock waits");
SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_already, ticket_already_count,
    "ticket lock already unlocked");
SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_just_unlock, ticket_just_unlock,
    "ticket unlock without kick");
SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_wflag_cleared, ticket_wflag_cleared,
    "ticket lock wait flag cleared");
SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_wflag_still, ticket_wflag_still,
    "ticket lock wait flag not cleared");
SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_spin_count, ticket_spin_count,
    "ticket lock spin count");
5664
5665 /* sysctl kern.hcall_probe=n -- does hypercall #n exist? */
5666
5667 static int
5668 sysctl_hcall_probe SYSCTL_HANDLER_ARGS
5669 {
5670 char instr[20];
5671
5672 if (!req->newptr) {
5673 return 0;
5674 }
5675 if (req->newlen >= sizeof(instr)) {
5676 return EOVERFLOW;
5677 }
5678
5679 int error = SYSCTL_IN(req, instr, req->newlen);
5680 if (error) {
5681 return error;
5682 }
5683 instr[req->newlen] = '\0';
5684
5685 int hcall = 0;
5686 error = sscanf(instr, "%d", &hcall);
5687 if (error != 1 || hcall < 0) {
5688 return EINVAL;
5689 }
5690 uprintf("%savailable\n",
5691 hvg_is_hcall_available((hvg_hcall_code_t)hcall) ? "" : "not ");
5692 return 0;
5693 }
5694
5695 SYSCTL_PROC(_kern, OID_AUTO, hcall_probe,
5696 CTLTYPE_STRING | CTLFLAG_WR | CTLFLAG_LOCKED | CTLFLAG_MASKED,
5697 0, 0, sysctl_hcall_probe, "A", "probe hypercall by id");
5698
5699 #endif /* (DEBUG || DEVELOPMENT) */
5700 #endif /* CONFIG_PV_TICKET */
5701
/*
 * kern.mutex_spin_abs: read-write 64-bit view of MutexSpin. The variable is
 * declared as uint64_t on x86_64 and as machine_timeout_t elsewhere; the
 * sysctl registration is the same in both cases.
 */
#if defined(__x86_64__)
extern uint64_t MutexSpin;

SYSCTL_QUAD(_kern, OID_AUTO, mutex_spin_abs, CTLFLAG_RW, &MutexSpin,
    "Spin time in abs for acquiring a kernel mutex");
#else
extern machine_timeout_t MutexSpin;

SYSCTL_QUAD(_kern, OID_AUTO, mutex_spin_abs, CTLFLAG_RW, &MutexSpin,
    "Spin time in abs for acquiring a kernel mutex");
#endif
5713
/*
 * Externally defined inputs to the mutex spin threshold sysctls. Note that
 * high_MutexSpin is signed while low_MutexSpin is unsigned.
 */
extern uint64_t low_MutexSpin;
extern int64_t high_MutexSpin;
extern unsigned int real_ncpus;

/* kern.low_mutex_spin_abs: read-write 64-bit view of low_MutexSpin. */
SYSCTL_QUAD(_kern, OID_AUTO, low_mutex_spin_abs, CTLFLAG_RW, &low_MutexSpin,
    "Low spin threshold in abs for acquiring a kernel mutex");
5720
5721 static int
5722 sysctl_high_mutex_spin_ns SYSCTL_HANDLER_ARGS
5723 {
5724 #pragma unused(oidp, arg1, arg2)
5725 int error;
5726 int64_t val = 0;
5727 int64_t res;
5728
5729 /* Check if the user is writing to high_MutexSpin, or just reading it */
5730 if (req->newptr) {
5731 error = SYSCTL_IN(req, &val, sizeof(val));
5732 if (error || (val < 0 && val != -1)) {
5733 return error;
5734 }
5735 high_MutexSpin = val;
5736 }
5737
5738 if (high_MutexSpin >= 0) {
5739 res = high_MutexSpin;
5740 } else {
5741 res = low_MutexSpin * real_ncpus;
5742 }
5743 return SYSCTL_OUT(req, &res, sizeof(res));
5744 }
5745 SYSCTL_PROC(_kern, OID_AUTO, high_mutex_spin_abs, CTLFLAG_RW | CTLTYPE_QUAD, 0, 0, sysctl_high_mutex_spin_ns, "I",
5746 "High spin threshold in abs for acquiring a kernel mutex");
5747
5748 #if defined (__x86_64__)
5749
/* Signalled by the child thread once it is in position for the panic test. */
semaphore_t sysctl_test_panic_with_thread_sem;

#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Winfinite-recursion" /* rdar://38801963 */
/*
 * Child entry point for the "spin" mode of kern.test_panic_with_thread.
 *
 * Calls itself while the static counter (initially 5) is positive,
 * decrementing it each time, so the innermost invocation sits under several
 * frames of this function -- presumably to give the backtrace some depth.
 * That innermost invocation signals the semaphore and spins forever, so no
 * invocation ever returns. Because the counter is static, it is not reset
 * between runs.
 */
__attribute__((noreturn))
static void
panic_thread_test_child_spin(void * arg, wait_result_t wres)
{
	static int panic_thread_recurse_count = 5;

	if (panic_thread_recurse_count > 0) {
		panic_thread_recurse_count--;
		panic_thread_test_child_spin(arg, wres);
	}

	/* Tell the sysctl handler that this thread is ready, then stay on-core */
	semaphore_signal(sysctl_test_panic_with_thread_sem);
	while (1) {
		;
	}
}
#pragma clang diagnostic pop
5771
/*
 * Child entry point for the "continuation" mode of
 * kern.test_panic_with_thread.
 *
 * Registers an uninterruptible wait on the address of a local variable,
 * signals the semaphore, and then blocks with this same function as its
 * continuation. The wait is asserted before the signal, so the handler is
 * only woken once the wait has been registered.
 */
static void
panic_thread_test_child_park(void * arg __unused, wait_result_t wres __unused)
{
	int event;

	assert_wait(&event, THREAD_UNINT);
	semaphore_signal(sysctl_test_panic_with_thread_sem);
	thread_block(panic_thread_test_child_park);
}
5781
5782 static int
5783 sysctl_test_panic_with_thread SYSCTL_HANDLER_ARGS
5784 {
5785 #pragma unused(arg1, arg2)
5786 int rval = 0;
5787 char str[16] = { '\0' };
5788 thread_t child_thread = THREAD_NULL;
5789
5790 rval = sysctl_handle_string(oidp, str, sizeof(str), req);
5791 if (rval != 0 || !req->newptr) {
5792 return EINVAL;
5793 }
5794
5795 semaphore_create(kernel_task, &sysctl_test_panic_with_thread_sem, SYNC_POLICY_FIFO, 0);
5796
5797 /* Create thread to spin or park in continuation */
5798 if (strncmp("spin", str, strlen("spin")) == 0) {
5799 if (kernel_thread_start(panic_thread_test_child_spin, NULL, &child_thread) != KERN_SUCCESS) {
5800 semaphore_destroy(kernel_task, sysctl_test_panic_with_thread_sem);
5801 return EBUSY;
5802 }
5803 } else if (strncmp("continuation", str, strlen("continuation")) == 0) {
5804 if (kernel_thread_start(panic_thread_test_child_park, NULL, &child_thread) != KERN_SUCCESS) {
5805 semaphore_destroy(kernel_task, sysctl_test_panic_with_thread_sem);
5806 return EBUSY;
5807 }
5808 } else {
5809 semaphore_destroy(kernel_task, sysctl_test_panic_with_thread_sem);
5810 return EINVAL;
5811 }
5812
5813 semaphore_wait(sysctl_test_panic_with_thread_sem);
5814
5815 panic_with_thread_context(0, NULL, 0, child_thread, "testing panic_with_thread_context for thread %p", child_thread);
5816
5817 /* Not reached */
5818 return EINVAL;
5819 }
5820
5821 SYSCTL_PROC(_kern, OID_AUTO, test_panic_with_thread,
5822 CTLFLAG_MASKED | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLFLAG_WR | CTLTYPE_STRING,
5823 0, 0, sysctl_test_panic_with_thread, "A", "test panic flow for backtracing a different thread");
5824 #endif /* defined (__x86_64__) */
5825
5826 #endif /* DEVELOPMENT || DEBUG */
5827
/*
 * Handler for vm.get_owned_vmobjects.
 *
 * The caller passes a task port name as the new value and, optionally, an
 * output buffer as the old value. The port name is resolved to a task and the
 * list of VM objects owned by that task is copied out. With no output buffer,
 * SYSCTL_OUT is invoked with a NULL source and the full list size.
 *
 * Live tasks and corpses take different paths: for a live task a temporary
 * kernel buffer is allocated, filled and freed here; for a corpse the list
 * obtained from task_get_corpse_vmobject_list() is copied out directly and is
 * not freed by this function.
 *
 * Returns:
 *   EINVAL  malformed request (wrong new-value size, missing new value,
 *           non-zero offsets, no process, or an output pointer with zero
 *           length)
 *   ESRCH   the port name does not resolve to a task
 *   ENOMEM  the output buffer cannot hold the list header plus one entry, or
 *           the temporary buffer could not be allocated
 *   otherwise the result of SYSCTL_IN / SYSCTL_OUT
 */
static int
sysctl_get_owned_vmobjects SYSCTL_HANDLER_ARGS
{
#pragma unused(oidp, arg1, arg2)

	/* validate */
	if (req->newlen != sizeof(mach_port_name_t) || req->newptr == USER_ADDR_NULL ||
	    req->oldidx != 0 || req->newidx != 0 || req->p == NULL ||
	    (req->oldlen == 0 && req->oldptr != USER_ADDR_NULL)) {
		return EINVAL;
	}

	int error;
	mach_port_name_t task_port_name;
	task_t task;
	/* zero means "size query only" */
	size_t buffer_size = (req->oldptr != USER_ADDR_NULL) ? req->oldlen : 0;
	vmobject_list_output_t buffer = NULL;
	size_t output_size;
	size_t entries;

	/* we have a "newptr" (for write) we get a task port name from the caller. */
	error = SYSCTL_IN(req, &task_port_name, sizeof(mach_port_name_t));

	if (error != 0) {
		goto sysctl_get_vmobject_list_exit;
	}

	task = port_name_to_task_read(task_port_name);
	if (task == TASK_NULL) {
		error = ESRCH;
		goto sysctl_get_vmobject_list_exit;
	}

	bool corpse = task_is_a_corpse(task);

	/* get the current size */
	size_t max_size;
	task_get_owned_vmobjects(task, 0, NULL, &max_size, &entries);

	/* a caller-supplied buffer must fit the header and at least one entry */
	if (buffer_size && (buffer_size < sizeof(*buffer) + sizeof(vm_object_query_data_t))) {
		error = ENOMEM;
		goto sysctl_get_vmobject_list_deallocate_and_exit;
	}

	if (corpse == false) {
		/* copy the vmobjects and vmobject data out of the task */
		if (buffer_size == 0) {
			output_size = max_size;
		} else {
			/*
			 * Clamp to what the task currently needs. buffer_size now also
			 * records the allocation size used by kfree_data() at exit.
			 */
			buffer_size = (buffer_size > max_size) ? max_size : buffer_size;
			buffer = (struct _vmobject_list_output_ *)kalloc_data(buffer_size, Z_WAITOK);

			if (!buffer) {
				error = ENOMEM;
				goto sysctl_get_vmobject_list_deallocate_and_exit;
			}

			task_get_owned_vmobjects(task, buffer_size, buffer, &output_size, &entries);
		}

		/* req->oldptr should be USER_ADDR_NULL if buffer == NULL and return the current size */
		/* otherwise copy buffer to oldptr and return the bytes copied */
		error = SYSCTL_OUT(req, (char *)buffer, output_size);
	} else {
		vmobject_list_output_t list;

		/* max_size is overwritten with the size reported for the corpse list */
		task_get_corpse_vmobject_list(task, &list, &max_size);
		assert(buffer == NULL);

		/* copy corpse_vmobject_list to output buffer to avoid double copy */
		if (buffer_size) {
			size_t temp_size;

			temp_size = buffer_size > max_size ? max_size : buffer_size;
			output_size = temp_size - sizeof(*buffer);
			/* whole multiple of vm_object_query_data_t */
			output_size = (output_size / sizeof(vm_object_query_data_t)) * sizeof(vm_object_query_data_t) + sizeof(*buffer);
			buffer = list;
		} else {
			output_size = max_size;
		}

		/* req->oldptr should be USER_ADDR_NULL if buffer == NULL and return the current size */
		/* otherwise copy buffer to oldptr and return the bytes copied */
		error = SYSCTL_OUT(req, (char*)buffer, output_size);
		/* the list was not allocated here; keep the exit path from freeing it */
		buffer = NULL;
	}

sysctl_get_vmobject_list_deallocate_and_exit:
	/* drop the task reference obtained from port_name_to_task_read() */
	task_deallocate(task);

sysctl_get_vmobject_list_exit:
	if (buffer) {
		kfree_data(buffer, buffer_size);
	}

	return error;
}

SYSCTL_PROC(_vm, OID_AUTO, get_owned_vmobjects,
    CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_WR | CTLFLAG_MASKED | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLFLAG_ANYBODY,
    0, 0, sysctl_get_owned_vmobjects, "A", "get owned vmobjects in task");
5930
/* kern.num_static_scalable_counters: read-only 64-bit view of the externally defined count. */
extern uint64_t num_static_scalable_counters;
SYSCTL_QUAD(_kern, OID_AUTO, num_static_scalable_counters, CTLFLAG_RD | CTLFLAG_LOCKED, &num_static_scalable_counters, "");
5933
/* Boolean tunable, only present when SCHED_HYGIENE_DEBUG is set. */
#if SCHED_HYGIENE_DEBUG
TUNABLE_DT(bool, sched_hygiene_nonspec_tb, "machine-timeouts", "nonspec-tb", "sched-hygiene-nonspec-tb", false, TUNABLE_DT_NONE);
#endif /* SCHED_HYGIENE_DEBUG */
5937
/*
 * Trial identifiers and the sysctls that expose them read-write:
 * kern.trial_treatment_id and kern.trial_experiment_id are UUID strings,
 * kern.trial_deployment_id is an int that starts out as -1.
 */
uuid_string_t trial_treatment_id;
uuid_string_t trial_experiment_id;
int trial_deployment_id = -1;

SYSCTL_STRING(_kern, OID_AUTO, trial_treatment_id, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY | CTLFLAG_EXPERIMENT, trial_treatment_id, sizeof(trial_treatment_id), "");
SYSCTL_STRING(_kern, OID_AUTO, trial_experiment_id, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY | CTLFLAG_EXPERIMENT, trial_experiment_id, sizeof(trial_experiment_id), "");
SYSCTL_INT(_kern, OID_AUTO, trial_deployment_id, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY | CTLFLAG_EXPERIMENT, &trial_deployment_id, 0, "");
5945
5946 #if (DEVELOPMENT || DEBUG)
/*
 * For unit testing setting factors & limits.
 * NOTE(review): the 5 and 10 passed below look like the lower and upper
 * limits of the factor -- confirm against EXPERIMENT_FACTOR_UINT.
 */
unsigned int testing_experiment_factor;
EXPERIMENT_FACTOR_UINT(_kern, testing_experiment_factor, &testing_experiment_factor, 5, 10, "");

/* debug.exception_log_max_pid: read-write view of the externally defined limit. */
extern int exception_log_max_pid;
SYSCTL_INT(_debug, OID_AUTO, exception_log_max_pid, CTLFLAG_RW | CTLFLAG_LOCKED, &exception_log_max_pid, 0, "Log exceptions for all processes up to this pid");
5953 #endif /* (DEVELOPMENT || DEBUG) */
5954
5955 #if DEVELOPMENT || DEBUG
5956 static int
5957 unlink_kernelcore_sysctl SYSCTL_HANDLER_ARGS
5958 {
5959 if (!req->newptr) {
5960 return EINVAL;
5961 }
5962 void IOBSDLowSpaceUnlinkKernelCore(void);
5963 IOBSDLowSpaceUnlinkKernelCore();
5964 return 0;
5965 }
5966
5967 SYSCTL_PROC(_kern, OID_AUTO, unlink_kernelcore,
5968 CTLTYPE_INT | CTLFLAG_WR | CTLFLAG_LOCKED | CTLFLAG_MASKED, 0, 0,
5969 unlink_kernelcore_sysctl, "-", "unlink the kernelcore file");
5970 #endif /* DEVELOPMENT || DEBUG */
5971
5972 #if CONFIG_IOTRACE
/*
 * debug.MMIOtrace: read-write view of mmiotrace_enabled. The cast to int *
 * is what needs -Wcast-qual silenced around the registration.
 */
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wcast-qual"
SYSCTL_INT(_debug, OID_AUTO, MMIOtrace,
    CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
    (int *)&mmiotrace_enabled, 0, "");
#pragma clang diagnostic pop
5979 #endif /* CONFIG_IOTRACE */
5980
5981 static int
5982 sysctl_page_protection_type SYSCTL_HANDLER_ARGS
5983 {
5984 #pragma unused(oidp, arg1, arg2)
5985 int value = ml_page_protection_type();
5986 return SYSCTL_OUT(req, &value, sizeof(value));
5987 }
5988
5989 SYSCTL_PROC(_kern, OID_AUTO, page_protection_type,
5990 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
5991 0, 0, sysctl_page_protection_type, "I", "Type of page protection that the system supports");
5992
/*
 * gpu_pmem_selector tunable and its read-only sysctl kern.gpu_pmem_selector.
 * The two registrations differ only in that kernels other than
 * DEVELOPMENT/DEBUG add CTLFLAG_MASKED.
 */
TUNABLE_DT(int, gpu_pmem_selector, "defaults", "kern.gpu_pmem_selector", "gpu-pmem-selector", 0, TUNABLE_DT_NONE);


#if (DEVELOPMENT || DEBUG)
SYSCTL_INT(_kern, OID_AUTO, gpu_pmem_selector,
    CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
    &gpu_pmem_selector, 0, "GPU wire down limit selector");
#else /* !(DEVELOPMENT || DEBUG) */
SYSCTL_INT(_kern, OID_AUTO, gpu_pmem_selector,
    CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN | CTLFLAG_MASKED,
    &gpu_pmem_selector, 0, "GPU wire down limit selector");
#endif /* (DEVELOPMENT || DEBUG) */
6005
6006 static int
6007 sysctl_exclaves_status SYSCTL_HANDLER_ARGS
6008 {
6009 int value = exclaves_get_status();
6010 return sysctl_io_number(req, value, sizeof(value), NULL, NULL);
6011 }
6012
6013 SYSCTL_PROC(_kern, OID_AUTO, exclaves_status,
6014 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
6015 0, 0, sysctl_exclaves_status, "I", "Running status of Exclaves");
6016
6017