1 /*
2 * Copyright (c) 2000-2021 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29 /*-
30 * Copyright (c) 1982, 1986, 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 *
33 * This code is derived from software contributed to Berkeley by
34 * Mike Karels at Berkeley Software Design, Inc.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
51 *
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
63 *
64 * @(#)kern_sysctl.c 8.4 (Berkeley) 4/14/94
65 */
66 /*
67 * NOTICE: This file was modified by SPARTA, Inc. in 2005 to introduce
68 * support for mandatory and extensible security protections. This notice
69 * is included in support of clause 2.2 (b) of the Apple Public License,
70 * Version 2.0.
71 */
72
73 /*
74 * DEPRECATED sysctl system call code
75 *
76 * Everything in this file is deprecated. Sysctls should be handled
77 * by the code in kern_newsysctl.c.
78 * The remaining "case" sections are supposed to be converted into
79 * SYSCTL_*-style definitions, and as soon as all of them are gone,
80 * this source file is supposed to die.
81 *
82 * DO NOT ADD ANY MORE "case" SECTIONS TO THIS FILE, instead define
83 * your sysctl with SYSCTL_INT, SYSCTL_PROC etc. in your source file.
84 */
85
86 #include <sys/param.h>
87 #include <sys/systm.h>
88 #include <sys/kernel.h>
89 #include <sys/malloc.h>
90 #include <sys/proc_internal.h>
91 #include <sys/kauth.h>
92 #include <sys/file_internal.h>
93 #include <sys/vnode_internal.h>
94 #include <sys/unistd.h>
95 #include <sys/buf.h>
96 #include <sys/ioctl.h>
97 #include <sys/namei.h>
98 #include <sys/tty.h>
99 #include <sys/disklabel.h>
100 #include <sys/vm.h>
101 #include <sys/sysctl.h>
102 #include <sys/user.h>
103 #include <sys/aio_kern.h>
104 #include <sys/reboot.h>
105 #include <sys/memory_maintenance.h>
106 #include <sys/priv.h>
107 #include <stdatomic.h>
108 #include <uuid/uuid.h>
109
110 #include <security/audit/audit.h>
111 #include <kern/kalloc.h>
112
113 #include <machine/smp.h>
114 #include <machine/atomic.h>
115 #include <machine/config.h>
116 #include <mach/machine.h>
117 #include <mach/mach_host.h>
118 #include <mach/mach_types.h>
119 #include <mach/processor_info.h>
120 #include <mach/vm_param.h>
121 #include <kern/debug.h>
122 #include <kern/mach_param.h>
123 #include <kern/task.h>
124 #include <kern/thread.h>
125 #include <kern/thread_group.h>
126 #include <kern/processor.h>
127 #include <kern/cpu_number.h>
128 #include <kern/cpu_quiesce.h>
129 #include <kern/sched_prim.h>
130 #include <kern/workload_config.h>
131 #include <kern/iotrace.h>
132 #include <vm/vm_kern.h>
133 #include <vm/vm_map.h>
134 #include <mach/host_info.h>
135 #include <kern/hvg_hypercall.h>
136
137 #include <sys/mount_internal.h>
138 #include <sys/kdebug.h>
139 #include <sys/kern_debug.h>
140 #include <sys/kern_sysctl.h>
141 #include <sys/variant_internal.h>
142
143 #include <IOKit/IOPlatformExpert.h>
144 #include <pexpert/pexpert.h>
145
146 #include <machine/machine_routines.h>
147 #include <machine/exec.h>
148
149 #include <nfs/nfs_conf.h>
150
151 #include <vm/vm_protos.h>
152 #include <vm/vm_pageout.h>
153 #include <vm/vm_compressor_algorithms.h>
154 #include <sys/imgsrc.h>
155 #include <kern/timer_call.h>
156 #include <sys/codesign.h>
157 #include <IOKit/IOBSD.h>
158 #if CONFIG_CSR
159 #include <sys/csr.h>
160 #endif
161
162 #if defined(__i386__) || defined(__x86_64__)
163 #include <i386/cpuid.h>
164 #endif
165
166 #if CONFIG_FREEZE
167 #include <sys/kern_memorystatus.h>
168 #endif
169
170 #if KPERF
171 #include <kperf/kperf.h>
172 #endif
173
174 #if HYPERVISOR
175 #include <kern/hv_support.h>
176 #endif
177
178
179 #include <corecrypto/ccsha2.h>
180
181 /*
182 * deliberately setting max requests to really high number
183 * so that runaway settings do not cause MALLOC overflows
184 */
185 #define AIO_MAX_REQUESTS (128 * CONFIG_AIO_MAX)
186
187 extern int aio_max_requests;
188 extern int aio_max_requests_per_process;
189 extern int aio_worker_threads;
190 extern int lowpri_IO_window_msecs;
191 extern int lowpri_IO_delay_msecs;
192 #if DEVELOPMENT || DEBUG
193 extern int nx_enabled;
194 #endif
195 extern int speculative_reads_disabled;
196 extern unsigned int speculative_prefetch_max;
197 extern unsigned int speculative_prefetch_max_iosize;
198 extern unsigned int preheat_max_bytes;
199 extern unsigned int preheat_min_bytes;
200 extern long numvnodes;
201 extern long freevnodes;
202 extern long num_recycledvnodes;
203
204 extern uuid_string_t bootsessionuuid_string;
205
206 extern unsigned int vm_max_delayed_work_limit;
207 extern unsigned int vm_max_batch;
208
209 extern unsigned int vm_page_free_min;
210 extern unsigned int vm_page_free_target;
211 extern unsigned int vm_page_free_reserved;
212
213 #if (DEVELOPMENT || DEBUG)
214 extern uint32_t vm_page_creation_throttled_hard;
215 extern uint32_t vm_page_creation_throttled_soft;
216 #endif /* DEVELOPMENT || DEBUG */
217
218 /*
219 * Conditionally allow dtrace to see these functions for debugging purposes.
220 */
221 #ifdef STATIC
222 #undef STATIC
223 #endif
224 #if 0
225 #define STATIC
226 #else
227 #define STATIC static
228 #endif
229
230 extern boolean_t mach_timer_coalescing_enabled;
231
232 extern uint64_t timer_deadline_tracking_bin_1, timer_deadline_tracking_bin_2;
233
234 STATIC void
235 fill_user32_eproc(proc_t, struct user32_eproc *__restrict);
236 STATIC void
237 fill_user32_externproc(proc_t, struct user32_extern_proc *__restrict);
238 STATIC void
239 fill_user64_eproc(proc_t, struct user64_eproc *__restrict);
240 STATIC void
241 fill_user64_proc(proc_t, struct user64_kinfo_proc *__restrict);
242 STATIC void
243 fill_user64_externproc(proc_t, struct user64_extern_proc *__restrict);
244 STATIC void
245 fill_user32_proc(proc_t, struct user32_kinfo_proc *__restrict);
246
247 #if CONFIG_NETBOOT
248 extern int
249 netboot_root(void);
250 #endif
251 int
252 sysctl_procargs(int *name, u_int namelen, user_addr_t where,
253 size_t *sizep, proc_t cur_proc);
254 STATIC int
255 sysctl_procargsx(int *name, u_int namelen, user_addr_t where, size_t *sizep,
256 proc_t cur_proc, int argc_yes);
257 int
258 sysctl_struct(user_addr_t oldp, size_t *oldlenp, user_addr_t newp,
259 size_t newlen, void *sp, int len);
260
261 STATIC int sysdoproc_filt_KERN_PROC_PID(proc_t p, void * arg);
262 STATIC int sysdoproc_filt_KERN_PROC_PGRP(proc_t p, void * arg);
263 STATIC int sysdoproc_filt_KERN_PROC_TTY(proc_t p, void * arg);
264 STATIC int sysdoproc_filt_KERN_PROC_UID(proc_t p, void * arg);
265 STATIC int sysdoproc_filt_KERN_PROC_RUID(proc_t p, void * arg);
266 int sysdoproc_callback(proc_t p, void *arg);
267
268 #if CONFIG_THREAD_GROUPS && (DEVELOPMENT || DEBUG)
269 STATIC int sysctl_get_thread_group_id SYSCTL_HANDLER_ARGS;
270 #endif
271
272 /* forward declarations for non-static STATIC */
273 STATIC void fill_loadavg64(struct loadavg *la, struct user64_loadavg *la64);
274 STATIC void fill_loadavg32(struct loadavg *la, struct user32_loadavg *la32);
275 STATIC int sysctl_handle_kern_threadname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
276 STATIC int sysctl_sched_stats(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
277 STATIC int sysctl_sched_stats_enable(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
278 #if COUNT_SYSCALLS
279 STATIC int sysctl_docountsyscalls SYSCTL_HANDLER_ARGS;
280 #endif /* COUNT_SYSCALLS */
281 #if defined(XNU_TARGET_OS_OSX)
282 STATIC int sysctl_doprocargs SYSCTL_HANDLER_ARGS;
283 #endif /* defined(XNU_TARGET_OS_OSX) */
284 STATIC int sysctl_doprocargs2 SYSCTL_HANDLER_ARGS;
285 STATIC int sysctl_prochandle SYSCTL_HANDLER_ARGS;
286 STATIC int sysctl_aiomax(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
287 STATIC int sysctl_aioprocmax(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
288 STATIC int sysctl_aiothreads(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
289 STATIC int sysctl_maxproc(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
290 STATIC int sysctl_osversion(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
291 STATIC int sysctl_sysctl_bootargs(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
292 STATIC int sysctl_maxvnodes(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
293 STATIC int sysctl_securelvl(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
294 STATIC int sysctl_domainname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
295 STATIC int sysctl_hostname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
296 STATIC int sysctl_procname(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
297 STATIC int sysctl_boottime(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
298 STATIC int sysctl_bootuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
299 STATIC int sysctl_symfile(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
300 #if CONFIG_NETBOOT
301 STATIC int sysctl_netboot(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
302 #endif
303 #ifdef CONFIG_IMGSRC_ACCESS
304 STATIC int sysctl_imgsrcdev(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
305 #endif
306 STATIC int sysctl_usrstack(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
307 STATIC int sysctl_usrstack64(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
308 #if CONFIG_COREDUMP
309 STATIC int sysctl_coredump(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
310 STATIC int sysctl_suid_coredump(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
311 #endif
312 STATIC int sysctl_delayterm(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
313 STATIC int sysctl_rage_vnode(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
314 STATIC int sysctl_kern_check_openevt(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
315 #if DEVELOPMENT || DEBUG
316 STATIC int sysctl_nx(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
317 #endif
318 STATIC int sysctl_loadavg(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
319 STATIC int sysctl_vm_toggle_address_reuse(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
320 STATIC int sysctl_swapusage(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
321 STATIC int fetch_process_cputype( proc_t cur_proc, int *name, u_int namelen, cpu_type_t *cputype);
322 STATIC int sysctl_sysctl_native(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
323 STATIC int sysctl_sysctl_cputype(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
324 STATIC int sysctl_safeboot(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
325 STATIC int sysctl_singleuser(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
326 STATIC int sysctl_minimalboot(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
327 STATIC int sysctl_slide(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
328
329 #ifdef CONFIG_XNUPOST
330 #include <tests/xnupost.h>
331
332 STATIC int sysctl_debug_test_oslog_ctl(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
333 STATIC int sysctl_debug_test_stackshot_mutex_owner(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
334 STATIC int sysctl_debug_test_stackshot_rwlck_owner(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req);
335 #endif
336
337 extern void IORegistrySetOSBuildVersion(char * build_version);
338 extern int IOParseWorkloadConfig(workload_config_ctx_t *ctx, const char * buffer, size_t size);
339 extern int IOUnparseWorkloadConfig(char *buffer, size_t *size);
340
341 STATIC void
fill_loadavg64(struct loadavg * la,struct user64_loadavg * la64)342 fill_loadavg64(struct loadavg *la, struct user64_loadavg *la64)
343 {
344 la64->ldavg[0] = la->ldavg[0];
345 la64->ldavg[1] = la->ldavg[1];
346 la64->ldavg[2] = la->ldavg[2];
347 la64->fscale = (user64_long_t)la->fscale;
348 }
349
350 STATIC void
fill_loadavg32(struct loadavg * la,struct user32_loadavg * la32)351 fill_loadavg32(struct loadavg *la, struct user32_loadavg *la32)
352 {
353 la32->ldavg[0] = la->ldavg[0];
354 la32->ldavg[1] = la->ldavg[1];
355 la32->ldavg[2] = la->ldavg[2];
356 la32->fscale = (user32_long_t)la->fscale;
357 }
358
359 #if COUNT_SYSCALLS
360 extern int do_count_syscalls;
361 #endif
362
363 #ifdef INSECURE
364 int securelevel = -1;
365 #else
366 int securelevel;
367 #endif
368
369 STATIC int
sysctl_handle_kern_threadname(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)370 sysctl_handle_kern_threadname( __unused struct sysctl_oid *oidp, __unused void *arg1,
371 __unused int arg2, struct sysctl_req *req)
372 {
373 int error;
374 struct uthread *ut = current_uthread();
375 user_addr_t oldp = 0, newp = 0;
376 size_t *oldlenp = NULL;
377 size_t newlen = 0;
378
379 oldp = req->oldptr;
380 oldlenp = &(req->oldlen);
381 newp = req->newptr;
382 newlen = req->newlen;
383
384 /* We want the current length, and maybe the string itself */
385 if (oldlenp) {
386 /* if we have no thread name yet tell'em we want MAXTHREADNAMESIZE - 1 */
387 size_t currlen = MAXTHREADNAMESIZE - 1;
388
389 if (ut->pth_name) {
390 /* use length of current thread name */
391 currlen = strlen(ut->pth_name);
392 }
393 if (oldp) {
394 if (*oldlenp < currlen) {
395 return ENOMEM;
396 }
397 /* NOTE - we do not copy the NULL terminator */
398 if (ut->pth_name) {
399 error = copyout(ut->pth_name, oldp, currlen);
400 if (error) {
401 return error;
402 }
403 }
404 }
405 /* return length of thread name minus NULL terminator (just like strlen) */
406 req->oldidx = currlen;
407 }
408
409 /* We want to set the name to something */
410 if (newp) {
411 if (newlen > (MAXTHREADNAMESIZE - 1)) {
412 return ENAMETOOLONG;
413 }
414 if (!ut->pth_name) {
415 char *tmp_pth_name = (char *)kalloc_data(MAXTHREADNAMESIZE,
416 Z_WAITOK | Z_ZERO);
417 if (!tmp_pth_name) {
418 return ENOMEM;
419 }
420 if (!OSCompareAndSwapPtr(NULL, tmp_pth_name, &ut->pth_name)) {
421 kfree_data(tmp_pth_name, MAXTHREADNAMESIZE);
422 return EBUSY;
423 }
424 } else {
425 kernel_debug_string_simple(TRACE_STRING_THREADNAME_PREV, ut->pth_name);
426 bzero(ut->pth_name, MAXTHREADNAMESIZE);
427 }
428 error = copyin(newp, ut->pth_name, newlen);
429 if (error) {
430 return error;
431 }
432
433 kernel_debug_string_simple(TRACE_STRING_THREADNAME, ut->pth_name);
434 }
435
436 return 0;
437 }
438
439 SYSCTL_PROC(_kern, KERN_THREADNAME, threadname, CTLFLAG_ANYBODY | CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, sysctl_handle_kern_threadname, "A", "");
440
441 #define WORKLOAD_CONFIG_MAX_SIZE (128 * 1024 * 1024)
442
443 /* Called locked - sysctl defined without CTLFLAG_LOCKED. */
444 static int
445 sysctl_workload_config SYSCTL_HANDLER_ARGS
446 {
447 #pragma unused(arg1, arg2)
448
449 char *plist_blob = NULL;
450 kern_return_t ret = KERN_FAILURE;
451 int error = -1;
452
453 /* Only allow reading of workload config on non-RELEASE kernels. */
454 #if DEVELOPMENT || DEBUG
455
456 const size_t buf_size = req->oldlen;
457
458 if (!req->oldptr) {
459 /* Just looking for the size to allocate. */
460 size_t size = 0;
461 ret = IOUnparseWorkloadConfig(NULL, &size);
462 if (ret != KERN_SUCCESS) {
463 return ENOMEM;
464 }
465
466 error = SYSCTL_OUT(req, NULL, size);
467 if (error) {
468 return error;
469 }
470 } else {
471 if (buf_size > (WORKLOAD_CONFIG_MAX_SIZE - 1) ||
472 buf_size == 0) {
473 return EINVAL;
474 }
475
476 plist_blob = kalloc_data(buf_size, Z_WAITOK | Z_ZERO);
477 if (!plist_blob) {
478 return ENOMEM;
479 }
480
481 size_t size = buf_size;
482 ret = IOUnparseWorkloadConfig(plist_blob, &size);
483 if (ret != KERN_SUCCESS) {
484 kfree_data(plist_blob, buf_size);
485 return ENOMEM;
486 }
487
488 error = SYSCTL_OUT(req, plist_blob, MIN(buf_size, size));
489
490 /* If the buffer was too small to fit the entire config. */
491 if (buf_size < size) {
492 error = ENOMEM;
493 }
494
495 kfree_data(plist_blob, buf_size);
496 if (error) {
497 return error;
498 }
499 }
500 #endif /* DEVELOPMENT || DEBUG */
501
502 if (req->newptr) {
503 size_t newlen = req->newlen;
504 if (newlen > (WORKLOAD_CONFIG_MAX_SIZE - 1)) {
505 return EINVAL;
506 }
507
508
509 workload_config_ctx_t *ctx = NULL;
510 /*
511 * Only allow workload_config_boot to be loaded once at boot by launchd.
512 */
513 if (current_proc() == initproc &&
514 !workload_config_initialized(&workload_config_boot)) {
515 ctx = &workload_config_boot;
516 } else {
517 #if DEVELOPMENT || DEBUG
518 /*
519 * Use the devel config context otherwise. If a devel config has been
520 * initialized it will be used for lookups in place of the boot config.
521 */
522 ctx = &workload_config_devel;
523 if (workload_config_initialized(ctx)) {
524 workload_config_free(ctx);
525 }
526
527 /* The devel context can be explicitly cleared by an empty string. */
528 if (newlen == 1) {
529 return 0;
530 }
531 #else
532 return EINVAL;
533 #endif
534 }
535
536 plist_blob = kalloc_data(newlen + 1, Z_WAITOK | Z_ZERO);
537 if (!plist_blob) {
538 return ENOMEM;
539 }
540 error = copyin(req->newptr, plist_blob, newlen);
541 if (error) {
542 kfree_data(plist_blob, newlen + 1);
543 return error;
544 }
545 plist_blob[newlen] = '\0';
546 ret = IOParseWorkloadConfig(ctx, plist_blob, newlen + 1);
547
548 kfree_data(plist_blob, newlen + 1);
549 return ret == KERN_SUCCESS ? 0 : EINVAL;
550 }
551
552 return 0;
553 }
554
555 SYSCTL_PROC(_kern, OID_AUTO, workload_config, CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_MASKED,
556 0, 0, sysctl_workload_config, "A", "global workgroup configuration plist load/unload");
557
558 #define BSD_HOST 1
559 STATIC int
sysctl_sched_stats(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)560 sysctl_sched_stats(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
561 {
562 host_basic_info_data_t hinfo;
563 kern_return_t kret;
564 uint32_t size;
565 uint32_t buf_size = 0;
566 int changed;
567 mach_msg_type_number_t count = HOST_BASIC_INFO_COUNT;
568 struct _processor_statistics_np *buf;
569 int error;
570
571 kret = host_info((host_t)BSD_HOST, HOST_BASIC_INFO, (host_info_t)&hinfo, &count);
572 if (kret != KERN_SUCCESS) {
573 return EINVAL;
574 }
575
576 size = sizeof(struct _processor_statistics_np) * (hinfo.logical_cpu_max + 2); /* One for RT Queue, One for Fair Share Queue */
577
578 if (req->oldlen < size) {
579 return EINVAL;
580 }
581
582 buf_size = size;
583 buf = (struct _processor_statistics_np *)kalloc_data(buf_size, Z_ZERO | Z_WAITOK);
584
585 kret = get_sched_statistics(buf, &size);
586 if (kret != KERN_SUCCESS) {
587 error = EINVAL;
588 goto out;
589 }
590
591 error = sysctl_io_opaque(req, buf, size, &changed);
592 if (error) {
593 goto out;
594 }
595
596 if (changed) {
597 panic("Sched info changed?!");
598 }
599 out:
600 kfree_data(buf, buf_size);
601 return error;
602 }
603
604 SYSCTL_PROC(_kern, OID_AUTO, sched_stats, CTLFLAG_LOCKED, 0, 0, sysctl_sched_stats, "-", "");
605
606 STATIC int
sysctl_sched_stats_enable(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,__unused struct sysctl_req * req)607 sysctl_sched_stats_enable(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, __unused struct sysctl_req *req)
608 {
609 boolean_t active;
610 int res;
611
612 if (req->newlen != sizeof(active)) {
613 return EINVAL;
614 }
615
616 res = copyin(req->newptr, &active, sizeof(active));
617 if (res != 0) {
618 return res;
619 }
620
621 return set_sched_stats_active(active);
622 }
623
624 SYSCTL_PROC(_kern, OID_AUTO, sched_stats_enable, CTLFLAG_LOCKED | CTLFLAG_WR, 0, 0, sysctl_sched_stats_enable, "-", "");
625
626 extern uint32_t sched_debug_flags;
627 SYSCTL_INT(_debug, OID_AUTO, sched, CTLFLAG_RW | CTLFLAG_LOCKED, &sched_debug_flags, 0, "scheduler debug");
628
629 #if (DEBUG || DEVELOPMENT)
630 extern boolean_t doprnt_hide_pointers;
631 SYSCTL_INT(_debug, OID_AUTO, hide_kernel_pointers, CTLFLAG_RW | CTLFLAG_LOCKED, &doprnt_hide_pointers, 0, "hide kernel pointers from log");
632 #endif
633
634
635 extern int get_kernel_symfile(proc_t, char **);
636
637 #if COUNT_SYSCALLS
638 #define KERN_COUNT_SYSCALLS (KERN_OSTYPE + 1000)
639
640 extern const unsigned int nsysent;
641 extern int syscalls_log[];
642 extern const char *syscallnames[];
643
644 STATIC int
645 sysctl_docountsyscalls SYSCTL_HANDLER_ARGS
646 {
647 __unused int cmd = oidp->oid_arg2; /* subcommand*/
648 __unused int *name = arg1; /* oid element argument vector */
649 __unused int namelen = arg2; /* number of oid element arguments */
650 int error, changed;
651
652 int tmp;
653
654 /* valid values passed in:
655 * = 0 means don't keep called counts for each bsd syscall
656 * > 0 means keep called counts for each bsd syscall
657 * = 2 means dump current counts to the system log
658 * = 3 means reset all counts
659 * for example, to dump current counts:
660 * sysctl -w kern.count_calls=2
661 */
662 error = sysctl_io_number(req, do_count_syscalls,
663 sizeof(do_count_syscalls), &tmp, &changed);
664
665 if (error != 0 || !changed) {
666 return error;
667 }
668
669 if (tmp == 1) {
670 do_count_syscalls = 1;
671 } else if (tmp == 0 || tmp == 2 || tmp == 3) {
672 for (int i = 0; i < nsysent; i++) {
673 if (syscalls_log[i] != 0) {
674 if (tmp == 2) {
675 printf("%d calls - name %s \n", syscalls_log[i], syscallnames[i]);
676 } else {
677 syscalls_log[i] = 0;
678 }
679 }
680 }
681 do_count_syscalls = (tmp != 0);
682 }
683
684 return error;
685 }
686 SYSCTL_PROC(_kern, KERN_COUNT_SYSCALLS, count_syscalls, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
687 0, /* Pointer argument (arg1) */
688 0, /* Integer argument (arg2) */
689 sysctl_docountsyscalls, /* Handler function */
690 NULL, /* Data pointer */
691 "");
692 #endif /* COUNT_SYSCALLS */
693
694 /*
695 * The following sysctl_* functions should not be used
696 * any more, as they can only cope with callers in
697 * user mode: Use new-style
698 * sysctl_io_number()
699 * sysctl_io_string()
700 * sysctl_io_opaque()
701 * instead.
702 */
703
704 STATIC int
sysdoproc_filt_KERN_PROC_PID(proc_t p,void * arg)705 sysdoproc_filt_KERN_PROC_PID(proc_t p, void * arg)
706 {
707 if (proc_getpid(p) != (pid_t)*(int*)arg) {
708 return 0;
709 } else {
710 return 1;
711 }
712 }
713
714 STATIC int
sysdoproc_filt_KERN_PROC_PGRP(proc_t p,void * arg)715 sysdoproc_filt_KERN_PROC_PGRP(proc_t p, void * arg)
716 {
717 if (p->p_pgrpid != (pid_t)*(int*)arg) {
718 return 0;
719 } else {
720 return 1;
721 }
722 }
723
724 STATIC int
sysdoproc_filt_KERN_PROC_TTY(proc_t p,void * arg)725 sysdoproc_filt_KERN_PROC_TTY(proc_t p, void * arg)
726 {
727 struct pgrp *pg;
728 dev_t dev = NODEV;
729
730 if ((p->p_flag & P_CONTROLT) && (pg = proc_pgrp(p, NULL)) != PGRP_NULL) {
731 dev = os_atomic_load(&pg->pg_session->s_ttydev, relaxed);
732 pgrp_rele(pg);
733 }
734
735 return dev != NODEV && dev == (dev_t)*(int *)arg;
736 }
737
738 STATIC int
sysdoproc_filt_KERN_PROC_UID(proc_t p,void * arg)739 sysdoproc_filt_KERN_PROC_UID(proc_t p, void * arg)
740 {
741 kauth_cred_t my_cred;
742 uid_t uid;
743
744 if (proc_ucred(p) == NULL) {
745 return 0;
746 }
747 my_cred = kauth_cred_proc_ref(p);
748 uid = kauth_cred_getuid(my_cred);
749 kauth_cred_unref(&my_cred);
750
751 if (uid != (uid_t)*(int*)arg) {
752 return 0;
753 } else {
754 return 1;
755 }
756 }
757
758
759 STATIC int
sysdoproc_filt_KERN_PROC_RUID(proc_t p,void * arg)760 sysdoproc_filt_KERN_PROC_RUID(proc_t p, void * arg)
761 {
762 kauth_cred_t my_cred;
763 uid_t ruid;
764
765 if (proc_ucred(p) == NULL) {
766 return 0;
767 }
768 my_cred = kauth_cred_proc_ref(p);
769 ruid = kauth_cred_getruid(my_cred);
770 kauth_cred_unref(&my_cred);
771
772 if (ruid != (uid_t)*(int*)arg) {
773 return 0;
774 } else {
775 return 1;
776 }
777 }
778
779 /*
780 * try over estimating by 5 procs
781 */
782 #define KERN_PROCSLOP (5 * sizeof(struct kinfo_proc))
783 struct sysdoproc_args {
784 size_t buflen;
785 void *kprocp;
786 boolean_t is_64_bit;
787 user_addr_t dp;
788 size_t needed;
789 unsigned int sizeof_kproc;
790 int *errorp;
791 int uidcheck;
792 int ruidcheck;
793 int ttycheck;
794 int uidval;
795 };
796
797 int
sysdoproc_callback(proc_t p,void * arg)798 sysdoproc_callback(proc_t p, void *arg)
799 {
800 struct sysdoproc_args *args = arg;
801
802 if (args->buflen >= args->sizeof_kproc) {
803 if ((args->ruidcheck != 0) && (sysdoproc_filt_KERN_PROC_RUID(p, &args->uidval) == 0)) {
804 return PROC_RETURNED;
805 }
806 if ((args->uidcheck != 0) && (sysdoproc_filt_KERN_PROC_UID(p, &args->uidval) == 0)) {
807 return PROC_RETURNED;
808 }
809 if ((args->ttycheck != 0) && (sysdoproc_filt_KERN_PROC_TTY(p, &args->uidval) == 0)) {
810 return PROC_RETURNED;
811 }
812
813 bzero(args->kprocp, args->sizeof_kproc);
814 if (args->is_64_bit) {
815 fill_user64_proc(p, args->kprocp);
816 } else {
817 fill_user32_proc(p, args->kprocp);
818 }
819 int error = copyout(args->kprocp, args->dp, args->sizeof_kproc);
820 if (error) {
821 *args->errorp = error;
822 return PROC_RETURNED_DONE;
823 }
824 args->dp += args->sizeof_kproc;
825 args->buflen -= args->sizeof_kproc;
826 }
827 args->needed += args->sizeof_kproc;
828 return PROC_RETURNED;
829 }
830
831 SYSCTL_NODE(_kern, KERN_PROC, proc, CTLFLAG_RD | CTLFLAG_LOCKED, 0, "");
832 STATIC int
833 sysctl_prochandle SYSCTL_HANDLER_ARGS
834 {
835 int cmd = oidp->oid_arg2; /* subcommand for multiple nodes */
836 int *name = arg1; /* oid element argument vector */
837 int namelen = arg2; /* number of oid element arguments */
838 user_addr_t where = req->oldptr;/* user buffer copy out address */
839
840 user_addr_t dp = where;
841 size_t needed = 0;
842 size_t buflen = where != USER_ADDR_NULL ? req->oldlen : 0;
843 int error = 0;
844 boolean_t is_64_bit = proc_is64bit(current_proc());
845 struct user32_kinfo_proc user32_kproc;
846 struct user64_kinfo_proc user_kproc;
847 int sizeof_kproc;
848 void *kprocp;
849 int (*filterfn)(proc_t, void *) = 0;
850 struct sysdoproc_args args;
851 int uidcheck = 0;
852 int ruidcheck = 0;
853 int ttycheck = 0;
854
855 if (namelen != 1 && !(namelen == 0 && cmd == KERN_PROC_ALL)) {
856 return EINVAL;
857 }
858
859 if (is_64_bit) {
860 sizeof_kproc = sizeof(user_kproc);
861 kprocp = &user_kproc;
862 } else {
863 sizeof_kproc = sizeof(user32_kproc);
864 kprocp = &user32_kproc;
865 }
866
867 switch (cmd) {
868 case KERN_PROC_PID:
869 filterfn = sysdoproc_filt_KERN_PROC_PID;
870 break;
871
872 case KERN_PROC_PGRP:
873 filterfn = sysdoproc_filt_KERN_PROC_PGRP;
874 break;
875
876 case KERN_PROC_TTY:
877 ttycheck = 1;
878 break;
879
880 case KERN_PROC_UID:
881 uidcheck = 1;
882 break;
883
884 case KERN_PROC_RUID:
885 ruidcheck = 1;
886 break;
887
888 case KERN_PROC_ALL:
889 break;
890
891 default:
892 /* must be kern.proc.<unknown> */
893 return ENOTSUP;
894 }
895
896 error = 0;
897 args.buflen = buflen;
898 args.kprocp = kprocp;
899 args.is_64_bit = is_64_bit;
900 args.dp = dp;
901 args.needed = needed;
902 args.errorp = &error;
903 args.uidcheck = uidcheck;
904 args.ruidcheck = ruidcheck;
905 args.ttycheck = ttycheck;
906 args.sizeof_kproc = sizeof_kproc;
907 if (namelen) {
908 args.uidval = name[0];
909 }
910
911 proc_iterate((PROC_ALLPROCLIST | PROC_ZOMBPROCLIST),
912 sysdoproc_callback, &args, filterfn, name);
913
914 if (error) {
915 return error;
916 }
917
918 dp = args.dp;
919 needed = args.needed;
920
921 if (where != USER_ADDR_NULL) {
922 req->oldlen = dp - where;
923 if (needed > req->oldlen) {
924 return ENOMEM;
925 }
926 } else {
927 needed += KERN_PROCSLOP;
928 req->oldlen = needed;
929 }
930 /* adjust index so we return the right required/consumed amount */
931 req->oldidx += req->oldlen;
932 return 0;
933 }
934
935
936 /*
937 * We specify the subcommand code for multiple nodes as the 'req->arg2' value
938 * in the sysctl declaration itself, which comes into the handler function
939 * as 'oidp->oid_arg2'.
940 *
941 * For these particular sysctls, since they have well known OIDs, we could
942 * have just obtained it from the '((int *)arg1)[0]' parameter, but that would
943 * not demonstrate how to handle multiple sysctls that used OID_AUTO instead
944 * of a well known value with a common handler function. This is desirable,
945 * because we want well known values to "go away" at some future date.
946 *
947 * It should be noted that the value of '((int *)arg1)[1]' is used for many
948 * an integer parameter to the subcommand for many of these sysctls; we'd
949 * rather have used '((int *)arg1)[0]' for that, or even better, an element
950 * in a structure passed in as the the 'newp' argument to sysctlbyname(3),
951 * and then use leaf-node permissions enforcement, but that would have
952 * necessitated modifying user space code to correspond to the interface
953 * change, and we are striving for binary backward compatibility here; even
954 * though these are SPI, and not intended for use by user space applications
955 * which are not themselves system tools or libraries, some applications
956 * have erroneously used them.
957 */
958 SYSCTL_PROC(_kern_proc, KERN_PROC_ALL, all, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
959 0, /* Pointer argument (arg1) */
960 KERN_PROC_ALL, /* Integer argument (arg2) */
961 sysctl_prochandle, /* Handler function */
962 NULL, /* Data is size variant on ILP32/LP64 */
963 "");
964 SYSCTL_PROC(_kern_proc, KERN_PROC_PID, pid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
965 0, /* Pointer argument (arg1) */
966 KERN_PROC_PID, /* Integer argument (arg2) */
967 sysctl_prochandle, /* Handler function */
968 NULL, /* Data is size variant on ILP32/LP64 */
969 "");
970 SYSCTL_PROC(_kern_proc, KERN_PROC_TTY, tty, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
971 0, /* Pointer argument (arg1) */
972 KERN_PROC_TTY, /* Integer argument (arg2) */
973 sysctl_prochandle, /* Handler function */
974 NULL, /* Data is size variant on ILP32/LP64 */
975 "");
976 SYSCTL_PROC(_kern_proc, KERN_PROC_PGRP, pgrp, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
977 0, /* Pointer argument (arg1) */
978 KERN_PROC_PGRP, /* Integer argument (arg2) */
979 sysctl_prochandle, /* Handler function */
980 NULL, /* Data is size variant on ILP32/LP64 */
981 "");
982 SYSCTL_PROC(_kern_proc, KERN_PROC_UID, uid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
983 0, /* Pointer argument (arg1) */
984 KERN_PROC_UID, /* Integer argument (arg2) */
985 sysctl_prochandle, /* Handler function */
986 NULL, /* Data is size variant on ILP32/LP64 */
987 "");
988 SYSCTL_PROC(_kern_proc, KERN_PROC_RUID, ruid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
989 0, /* Pointer argument (arg1) */
990 KERN_PROC_RUID, /* Integer argument (arg2) */
991 sysctl_prochandle, /* Handler function */
992 NULL, /* Data is size variant on ILP32/LP64 */
993 "");
994 SYSCTL_PROC(_kern_proc, KERN_PROC_LCID, lcid, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
995 0, /* Pointer argument (arg1) */
996 KERN_PROC_LCID, /* Integer argument (arg2) */
997 sysctl_prochandle, /* Handler function */
998 NULL, /* Data is size variant on ILP32/LP64 */
999 "");
1000
1001
1002 /*
1003 * Fill in non-zero fields of an eproc structure for the specified process.
1004 */
1005 STATIC void
fill_user32_eproc(proc_t p,struct user32_eproc * __restrict ep)1006 fill_user32_eproc(proc_t p, struct user32_eproc *__restrict ep)
1007 {
1008 struct pgrp *pg;
1009 struct session *sessp;
1010 kauth_cred_t my_cred;
1011
1012 pg = proc_pgrp(p, &sessp);
1013
1014 if (pg != PGRP_NULL) {
1015 ep->e_pgid = p->p_pgrpid;
1016 ep->e_jobc = pg->pg_jobc;
1017 if (sessp->s_ttyvp) {
1018 ep->e_flag = EPROC_CTTY;
1019 }
1020 }
1021
1022 ep->e_ppid = p->p_ppid;
1023 if (proc_ucred(p)) {
1024 my_cred = kauth_cred_proc_ref(p);
1025
1026 /* A fake historical pcred */
1027 ep->e_pcred.p_ruid = kauth_cred_getruid(my_cred);
1028 ep->e_pcred.p_svuid = kauth_cred_getsvuid(my_cred);
1029 ep->e_pcred.p_rgid = kauth_cred_getrgid(my_cred);
1030 ep->e_pcred.p_svgid = kauth_cred_getsvgid(my_cred);
1031
1032 /* A fake historical *kauth_cred_t */
1033 unsigned long refcnt = os_atomic_load(&my_cred->cr_ref, relaxed);
1034 ep->e_ucred.cr_ref = (uint32_t)MIN(refcnt, UINT32_MAX);
1035 ep->e_ucred.cr_uid = kauth_cred_getuid(my_cred);
1036 ep->e_ucred.cr_ngroups = (short)posix_cred_get(my_cred)->cr_ngroups;
1037 bcopy(posix_cred_get(my_cred)->cr_groups,
1038 ep->e_ucred.cr_groups, NGROUPS * sizeof(gid_t));
1039
1040 kauth_cred_unref(&my_cred);
1041 }
1042
1043 ep->e_tdev = NODEV;
1044 if (pg != PGRP_NULL) {
1045 if (p->p_flag & P_CONTROLT) {
1046 session_lock(sessp);
1047 ep->e_tdev = os_atomic_load(&sessp->s_ttydev, relaxed);
1048 ep->e_tpgid = sessp->s_ttypgrpid;
1049 session_unlock(sessp);
1050 }
1051 if (SESS_LEADER(p, sessp)) {
1052 ep->e_flag |= EPROC_SLEADER;
1053 }
1054 pgrp_rele(pg);
1055 }
1056 }
1057
1058 /*
1059 * Fill in non-zero fields of an LP64 eproc structure for the specified process.
1060 */
1061 STATIC void
fill_user64_eproc(proc_t p,struct user64_eproc * __restrict ep)1062 fill_user64_eproc(proc_t p, struct user64_eproc *__restrict ep)
1063 {
1064 struct pgrp *pg;
1065 struct session *sessp;
1066 kauth_cred_t my_cred;
1067
1068 pg = proc_pgrp(p, &sessp);
1069
1070 if (pg != PGRP_NULL) {
1071 ep->e_pgid = p->p_pgrpid;
1072 ep->e_jobc = pg->pg_jobc;
1073 if (sessp->s_ttyvp) {
1074 ep->e_flag = EPROC_CTTY;
1075 }
1076 }
1077
1078 ep->e_ppid = p->p_ppid;
1079 if (proc_ucred(p)) {
1080 my_cred = kauth_cred_proc_ref(p);
1081
1082 /* A fake historical pcred */
1083 ep->e_pcred.p_ruid = kauth_cred_getruid(my_cred);
1084 ep->e_pcred.p_svuid = kauth_cred_getsvuid(my_cred);
1085 ep->e_pcred.p_rgid = kauth_cred_getrgid(my_cred);
1086 ep->e_pcred.p_svgid = kauth_cred_getsvgid(my_cred);
1087
1088 /* A fake historical *kauth_cred_t */
1089 unsigned long refcnt = os_atomic_load(&my_cred->cr_ref, relaxed);
1090 ep->e_ucred.cr_ref = (uint32_t)MIN(refcnt, UINT32_MAX);
1091 ep->e_ucred.cr_uid = kauth_cred_getuid(my_cred);
1092 ep->e_ucred.cr_ngroups = (short)posix_cred_get(my_cred)->cr_ngroups;
1093 bcopy(posix_cred_get(my_cred)->cr_groups,
1094 ep->e_ucred.cr_groups, NGROUPS * sizeof(gid_t));
1095
1096 kauth_cred_unref(&my_cred);
1097 }
1098
1099 ep->e_tdev = NODEV;
1100 if (pg != PGRP_NULL) {
1101 if (p->p_flag & P_CONTROLT) {
1102 session_lock(sessp);
1103 ep->e_tdev = os_atomic_load(&sessp->s_ttydev, relaxed);
1104 ep->e_tpgid = sessp->s_ttypgrpid;
1105 session_unlock(sessp);
1106 }
1107 if (SESS_LEADER(p, sessp)) {
1108 ep->e_flag |= EPROC_SLEADER;
1109 }
1110 pgrp_rele(pg);
1111 }
1112 }
1113
1114 /*
1115 * Fill in an eproc structure for the specified process.
1116 * bzeroed by our caller, so only set non-zero fields.
1117 */
1118 STATIC void
fill_user32_externproc(proc_t p,struct user32_extern_proc * __restrict exp)1119 fill_user32_externproc(proc_t p, struct user32_extern_proc *__restrict exp)
1120 {
1121 exp->p_starttime.tv_sec = (user32_time_t)p->p_start.tv_sec;
1122 exp->p_starttime.tv_usec = p->p_start.tv_usec;
1123 exp->p_flag = p->p_flag;
1124 if (p->p_lflag & P_LTRACED) {
1125 exp->p_flag |= P_TRACED;
1126 }
1127 if (p->p_lflag & P_LPPWAIT) {
1128 exp->p_flag |= P_PPWAIT;
1129 }
1130 if (p->p_lflag & P_LEXIT) {
1131 exp->p_flag |= P_WEXIT;
1132 }
1133 exp->p_stat = p->p_stat;
1134 exp->p_pid = proc_getpid(p);
1135 exp->p_oppid = p->p_oppid;
1136 /* Mach related */
1137 exp->p_debugger = p->p_debugger;
1138 exp->sigwait = p->sigwait;
1139 /* scheduling */
1140 #ifdef _PROC_HAS_SCHEDINFO_
1141 exp->p_estcpu = p->p_estcpu;
1142 exp->p_pctcpu = p->p_pctcpu;
1143 exp->p_slptime = p->p_slptime;
1144 #endif
1145 exp->p_realtimer.it_interval.tv_sec =
1146 (user32_time_t)p->p_realtimer.it_interval.tv_sec;
1147 exp->p_realtimer.it_interval.tv_usec =
1148 (__int32_t)p->p_realtimer.it_interval.tv_usec;
1149
1150 exp->p_realtimer.it_value.tv_sec =
1151 (user32_time_t)p->p_realtimer.it_value.tv_sec;
1152 exp->p_realtimer.it_value.tv_usec =
1153 (__int32_t)p->p_realtimer.it_value.tv_usec;
1154
1155 exp->p_rtime.tv_sec = (user32_time_t)p->p_rtime.tv_sec;
1156 exp->p_rtime.tv_usec = (__int32_t)p->p_rtime.tv_usec;
1157
1158 exp->p_sigignore = p->p_sigignore;
1159 exp->p_sigcatch = p->p_sigcatch;
1160 exp->p_priority = p->p_priority;
1161 exp->p_nice = p->p_nice;
1162 bcopy(&p->p_comm, &exp->p_comm, MAXCOMLEN);
1163 exp->p_xstat = (u_short)MIN(p->p_xstat, USHRT_MAX);
1164 exp->p_acflag = p->p_acflag;
1165 }
1166
1167 /*
1168 * Fill in an LP64 version of extern_proc structure for the specified process.
1169 */
1170 STATIC void
fill_user64_externproc(proc_t p,struct user64_extern_proc * __restrict exp)1171 fill_user64_externproc(proc_t p, struct user64_extern_proc *__restrict exp)
1172 {
1173 exp->p_starttime.tv_sec = p->p_start.tv_sec;
1174 exp->p_starttime.tv_usec = p->p_start.tv_usec;
1175 exp->p_flag = p->p_flag;
1176 if (p->p_lflag & P_LTRACED) {
1177 exp->p_flag |= P_TRACED;
1178 }
1179 if (p->p_lflag & P_LPPWAIT) {
1180 exp->p_flag |= P_PPWAIT;
1181 }
1182 if (p->p_lflag & P_LEXIT) {
1183 exp->p_flag |= P_WEXIT;
1184 }
1185 exp->p_stat = p->p_stat;
1186 exp->p_pid = proc_getpid(p);
1187 exp->p_oppid = p->p_oppid;
1188 /* Mach related */
1189 exp->p_debugger = p->p_debugger;
1190 exp->sigwait = p->sigwait;
1191 /* scheduling */
1192 #ifdef _PROC_HAS_SCHEDINFO_
1193 exp->p_estcpu = p->p_estcpu;
1194 exp->p_pctcpu = p->p_pctcpu;
1195 exp->p_slptime = p->p_slptime;
1196 #endif
1197 exp->p_realtimer.it_interval.tv_sec = p->p_realtimer.it_interval.tv_sec;
1198 exp->p_realtimer.it_interval.tv_usec = p->p_realtimer.it_interval.tv_usec;
1199
1200 exp->p_realtimer.it_value.tv_sec = p->p_realtimer.it_value.tv_sec;
1201 exp->p_realtimer.it_value.tv_usec = p->p_realtimer.it_value.tv_usec;
1202
1203 exp->p_rtime.tv_sec = p->p_rtime.tv_sec;
1204 exp->p_rtime.tv_usec = p->p_rtime.tv_usec;
1205
1206 exp->p_sigignore = p->p_sigignore;
1207 exp->p_sigcatch = p->p_sigcatch;
1208 exp->p_priority = p->p_priority;
1209 exp->p_nice = p->p_nice;
1210 bcopy(&p->p_comm, &exp->p_comm, MAXCOMLEN);
1211 exp->p_xstat = (u_short)MIN(p->p_xstat, USHRT_MAX);
1212 exp->p_acflag = p->p_acflag;
1213 }
1214
1215 STATIC void
fill_user32_proc(proc_t p,struct user32_kinfo_proc * __restrict kp)1216 fill_user32_proc(proc_t p, struct user32_kinfo_proc *__restrict kp)
1217 {
1218 /* on a 64 bit kernel, 32 bit users get some truncated information */
1219 fill_user32_externproc(p, &kp->kp_proc);
1220 fill_user32_eproc(p, &kp->kp_eproc);
1221 }
1222
1223 STATIC void
fill_user64_proc(proc_t p,struct user64_kinfo_proc * __restrict kp)1224 fill_user64_proc(proc_t p, struct user64_kinfo_proc *__restrict kp)
1225 {
1226 fill_user64_externproc(p, &kp->kp_proc);
1227 fill_user64_eproc(p, &kp->kp_eproc);
1228 }
1229
1230 #if defined(XNU_TARGET_OS_OSX)
1231 /*
1232 * Return the top *sizep bytes of the user stack, or the entire area of the
1233 * user stack down through the saved exec_path, whichever is smaller.
1234 */
1235 STATIC int
1236 sysctl_doprocargs SYSCTL_HANDLER_ARGS
1237 {
1238 __unused int cmd = oidp->oid_arg2; /* subcommand*/
1239 int *name = arg1; /* oid element argument vector */
1240 int namelen = arg2; /* number of oid element arguments */
1241 user_addr_t oldp = req->oldptr; /* user buffer copy out address */
1242 size_t *oldlenp = &req->oldlen; /* user buffer copy out size */
1243 // user_addr_t newp = req->newptr; /* user buffer copy in address */
1244 // size_t newlen = req->newlen; /* user buffer copy in size */
1245 int error;
1246
1247 error = sysctl_procargsx( name, namelen, oldp, oldlenp, current_proc(), 0);
1248
1249 /* adjust index so we return the right required/consumed amount */
1250 if (!error) {
1251 req->oldidx += req->oldlen;
1252 }
1253
1254 return error;
1255 }
1256 SYSCTL_PROC(_kern, KERN_PROCARGS, procargs, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
1257 0, /* Pointer argument (arg1) */
1258 0, /* Integer argument (arg2) */
1259 sysctl_doprocargs, /* Handler function */
1260 NULL, /* Data pointer */
1261 "");
1262 #endif /* defined(XNU_TARGET_OS_OSX) */
1263
1264 STATIC int
1265 sysctl_doprocargs2 SYSCTL_HANDLER_ARGS
1266 {
1267 __unused int cmd = oidp->oid_arg2; /* subcommand*/
1268 int *name = arg1; /* oid element argument vector */
1269 int namelen = arg2; /* number of oid element arguments */
1270 user_addr_t oldp = req->oldptr; /* user buffer copy out address */
1271 size_t *oldlenp = &req->oldlen; /* user buffer copy out size */
1272 // user_addr_t newp = req->newptr; /* user buffer copy in address */
1273 // size_t newlen = req->newlen; /* user buffer copy in size */
1274 int error;
1275
1276 error = sysctl_procargsx( name, namelen, oldp, oldlenp, current_proc(), 1);
1277
1278 /* adjust index so we return the right required/consumed amount */
1279 if (!error) {
1280 req->oldidx += req->oldlen;
1281 }
1282
1283 return error;
1284 }
1285 SYSCTL_PROC(_kern, KERN_PROCARGS2, procargs2, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED,
1286 0, /* Pointer argument (arg1) */
1287 0, /* Integer argument (arg2) */
1288 sysctl_doprocargs2, /* Handler function */
1289 NULL, /* Data pointer */
1290 "");
1291
1292 #define SYSCTL_PROCARGS_READ_ENVVARS_ENTITLEMENT "com.apple.private.read-environment-variables"
1293 STATIC int
sysctl_procargsx(int * name,u_int namelen,user_addr_t where,size_t * sizep,proc_t cur_proc,int argc_yes)1294 sysctl_procargsx(int *name, u_int namelen, user_addr_t where,
1295 size_t *sizep, proc_t cur_proc, int argc_yes)
1296 {
1297 assert(sizep != NULL);
1298 proc_t p = NULL;
1299 size_t buflen = where != USER_ADDR_NULL ? *sizep : 0;
1300 int error = 0;
1301 struct _vm_map *proc_map = NULL;
1302 struct task * task;
1303 vm_map_copy_t tmp = NULL;
1304 user_addr_t arg_addr;
1305 size_t arg_size;
1306 caddr_t data;
1307 size_t argslen = 0;
1308 size_t size = 0;
1309 vm_offset_t copy_start = 0, copy_end;
1310 vm_offset_t smallbuffer_start;
1311 kern_return_t ret;
1312 int pid;
1313 kauth_cred_t my_cred;
1314 uid_t uid;
1315 int argc = -1;
1316 size_t argvsize;
1317 size_t remaining;
1318 size_t current_arg_index;
1319 size_t current_arg_len;
1320 const char * current_arg;
1321 bool omit_env_vars = true;
1322 user_addr_t user_stack;
1323 vm_map_offset_t effective_page_mask;
1324
1325 if (namelen < 1) {
1326 error = EINVAL;
1327 goto finish;
1328 }
1329
1330 if (argc_yes) {
1331 buflen -= sizeof(int); /* reserve first word to return argc */
1332 }
1333 /* we only care about buflen when where (oldp from sysctl) is not NULL. */
1334 /* when where (oldp from sysctl) is NULL and sizep (oldlenp from sysctl */
1335 /* is not NULL then the caller wants us to return the length needed to */
1336 /* hold the data we would return */
1337 if (where != USER_ADDR_NULL && (buflen <= 0 || buflen > ARG_MAX)) {
1338 error = EINVAL;
1339 goto finish;
1340 }
1341
1342 /*
1343 * Lookup process by pid
1344 */
1345 pid = name[0];
1346 p = proc_find(pid);
1347 if (p == NULL) {
1348 error = EINVAL;
1349 goto finish;
1350 }
1351
1352 /* Allow reading environment variables if any of the following are true:
1353 * - kernel is DEVELOPMENT || DEBUG
1354 * - target process is same as current_proc()
1355 * - target process is not cs_restricted
1356 * - SIP is off
1357 * - caller has an entitlement
1358 */
1359
1360 #if DEVELOPMENT || DEBUG
1361 omit_env_vars = false;
1362 #endif
1363 if (p == current_proc() ||
1364 !cs_restricted(p) ||
1365 #if CONFIG_CSR
1366 csr_check(CSR_ALLOW_UNRESTRICTED_DTRACE) == 0 ||
1367 #endif
1368 IOCurrentTaskHasEntitlement(SYSCTL_PROCARGS_READ_ENVVARS_ENTITLEMENT)
1369 ) {
1370 omit_env_vars = false;
1371 }
1372
1373 /*
1374 * Copy the top N bytes of the stack.
1375 * On all machines we have so far, the stack grows
1376 * downwards.
1377 *
1378 * If the user expects no more than N bytes of
1379 * argument list, use that as a guess for the
1380 * size.
1381 */
1382
1383 if (!p->user_stack) {
1384 error = EINVAL;
1385 goto finish;
1386 }
1387
1388 /* save off argc, argslen, user_stack before releasing the proc */
1389 argc = p->p_argc;
1390 argslen = p->p_argslen;
1391 user_stack = p->user_stack;
1392
1393 /*
1394 * When these sysctls were introduced, the first string in the strings
1395 * section was just the bare path of the executable. However, for security
1396 * reasons we now prefix this string with executable_path= so it can be
1397 * parsed getenv style. To avoid binary compatability issues with exising
1398 * callers of this sysctl, we strip it off here.
1399 * (rdar://problem/13746466)
1400 */
1401 #define EXECUTABLE_KEY "executable_path="
1402 argslen -= strlen(EXECUTABLE_KEY);
1403
1404 if (where == USER_ADDR_NULL && !omit_env_vars) {
1405 /* caller only wants to know length of proc args data.
1406 * If we don't need to omit environment variables, we can skip
1407 * copying the target process stack */
1408 goto calculate_size;
1409 }
1410
1411 my_cred = kauth_cred_proc_ref(p);
1412 uid = kauth_cred_getuid(my_cred);
1413 kauth_cred_unref(&my_cred);
1414
1415 if ((uid != kauth_cred_getuid(kauth_cred_get()))
1416 && suser(kauth_cred_get(), &cur_proc->p_acflag)) {
1417 error = EINVAL;
1418 goto finish;
1419 }
1420
1421 /*
1422 * Before we can block (any VM code), make another
1423 * reference to the map to keep it alive. We do
1424 * that by getting a reference on the task itself.
1425 */
1426 task = proc_task(p);
1427 if (task == NULL) {
1428 error = EINVAL;
1429 goto finish;
1430 }
1431
1432 /*
1433 * Once we have a task reference we can convert that into a
1434 * map reference, which we will use in the calls below. The
1435 * task/process may change its map after we take this reference
1436 * (see execve), but the worst that will happen then is a return
1437 * of stale info (which is always a possibility).
1438 */
1439 task_reference(task);
1440 proc_rele(p);
1441 p = NULL;
1442 proc_map = get_task_map_reference(task);
1443 task_deallocate(task);
1444
1445 if (proc_map == NULL) {
1446 error = EINVAL;
1447 goto finish;
1448 }
1449
1450 effective_page_mask = vm_map_page_mask(proc_map);
1451
1452 arg_size = vm_map_round_page(argslen, effective_page_mask);
1453
1454 arg_addr = user_stack - arg_size;
1455
1456 ret = kmem_alloc(kernel_map, ©_start, arg_size,
1457 KMA_DATA | KMA_ZERO, VM_KERN_MEMORY_BSD);
1458 if (ret != KERN_SUCCESS) {
1459 error = ENOMEM;
1460 goto finish;
1461 }
1462
1463 copy_end = copy_start + arg_size;
1464
1465 if (vm_map_copyin(proc_map, (vm_map_address_t)arg_addr,
1466 (vm_map_size_t)arg_size, FALSE, &tmp) != KERN_SUCCESS) {
1467 error = EIO;
1468 goto finish;
1469 }
1470
1471 /*
1472 * Now that we've done the copyin from the process'
1473 * map, we can release the reference to it.
1474 */
1475 vm_map_deallocate(proc_map);
1476 proc_map = NULL;
1477
1478 if (vm_map_copy_overwrite(kernel_map,
1479 (vm_map_address_t)copy_start,
1480 tmp, (vm_map_size_t) arg_size, FALSE) != KERN_SUCCESS) {
1481 error = EIO;
1482 goto finish;
1483 }
1484 /* tmp was consumed */
1485 tmp = NULL;
1486
1487 if (omit_env_vars) {
1488 argvsize = 0;
1489
1490 /* Iterate over everything in argv, plus one for the bare executable path */
1491 for (current_arg_index = 0; current_arg_index < argc + 1 && argvsize < argslen; ++current_arg_index) {
1492 current_arg = (const char *)(copy_end - argslen) + argvsize;
1493 remaining = argslen - argvsize;
1494 current_arg_len = strnlen(current_arg, remaining);
1495 if (current_arg_len < remaining) {
1496 /* We have space for the null terminator */
1497 current_arg_len += 1;
1498
1499 if (current_arg_index == 0) {
1500 /* The bare executable path may have multiple null bytes after it for alignment */
1501 while (current_arg_len < remaining && current_arg[current_arg_len] == 0) {
1502 current_arg_len += 1;
1503 }
1504 }
1505 }
1506 argvsize += current_arg_len;
1507 }
1508 assert(argvsize <= argslen);
1509
1510 /* Adjust argslen and copy_end to make the copyout range extend to the end of argv */
1511 copy_end = copy_end - argslen + argvsize;
1512 argslen = argvsize;
1513 }
1514
1515 if (where == USER_ADDR_NULL) {
1516 /* Skip copyout */
1517 goto calculate_size;
1518 }
1519
1520 if (buflen >= argslen) {
1521 data = (caddr_t) (copy_end - argslen);
1522 size = argslen;
1523 } else {
1524 /*
1525 * Before rdar://25397314, this function contained incorrect logic when buflen is less
1526 * than argslen. The problem was that it copied in `buflen` bytes from the end of the target
1527 * process user stack into the beginning of a buffer of size round_page(buflen), and then
1528 * copied out `buflen` bytes from the end of this buffer. The effect of this was that
1529 * the caller of this sysctl would get zeros at the end of their buffer.
1530 *
1531 * To preserve this behavior, bzero everything from copy_end-round_page(buflen)+buflen to the
1532 * end of the buffer. This emulates copying in only `buflen` bytes.
1533 *
1534 *
1535 * In the old code:
1536 *
1537 * copy_start .... size: round_page(buflen) .... copy_end
1538 * [---copied in data (size: buflen)---|--- zeros ----------]
1539 * ^
1540 * data = copy_end - buflen
1541 *
1542 *
1543 * In the new code:
1544 * copy_start .... size: round_page(p->argslen) .... full copy_end
1545 * ^ ....................... p->argslen ...............................^
1546 * ^ ^ truncated copy_end ^
1547 * ^ ^ ^ ^
1548 * ^ ................ argslen ........................ ^
1549 * ^ ^ ^ ^
1550 * [-------copied in data (size: round_page(p->argslen))-------:----env vars---]
1551 * ^ ^
1552 * ^ data = copy_end - buflen
1553 * smallbuffer_start = max(copy_end - round_page(buflen), copy_start)
1554 *
1555 *
1556 * Full copy_end: copy_end calculated from copy_start + round_page(p->argslen)
1557 * Truncated copy_end: copy_end after truncation to remove environment variables.
1558 *
1559 * If environment variables were omitted, then we use the truncated copy_end, otherwise
1560 * we use full copy_end.
1561 *
1562 * smallbuffer_start: represents where copy_start would be in the old code.
1563 * data: The beginning of the region we copyout
1564 */
1565 smallbuffer_start = copy_end - vm_map_round_page(buflen, effective_page_mask);
1566 if (smallbuffer_start < copy_start) {
1567 smallbuffer_start = copy_start;
1568 }
1569 bzero((void *)(smallbuffer_start + buflen), copy_end - (smallbuffer_start + buflen));
1570 data = (caddr_t) (copy_end - buflen);
1571 size = buflen;
1572 }
1573
1574 if (argc_yes) {
1575 /* Put processes argc as the first word in the copyout buffer */
1576 suword(where, argc);
1577 error = copyout(data, (where + sizeof(int)), size);
1578 size += sizeof(int);
1579 } else {
1580 error = copyout(data, where, size);
1581
1582 /*
1583 * Make the old PROCARGS work to return the executable's path
1584 * But, only if there is enough space in the provided buffer
1585 *
1586 * on entry: data [possibily] points to the beginning of the path
1587 *
1588 * Note: we keep all pointers&sizes aligned to word boundries
1589 */
1590 if ((!error) && (buflen > 0 && (u_int)buflen > size)) {
1591 int binPath_sz, alignedBinPath_sz = 0;
1592 int extraSpaceNeeded, addThis;
1593 user_addr_t placeHere;
1594 char * str = (char *) data;
1595 size_t max_len = size;
1596
1597 /* Some apps are really bad about messing up their stacks
1598 * So, we have to be extra careful about getting the length
1599 * of the executing binary. If we encounter an error, we bail.
1600 */
1601
1602 /* Limit ourselves to PATH_MAX paths */
1603 if (max_len > PATH_MAX) {
1604 max_len = PATH_MAX;
1605 }
1606
1607 binPath_sz = 0;
1608
1609 while ((binPath_sz < max_len - 1) && (*str++ != 0)) {
1610 binPath_sz++;
1611 }
1612
1613 /* If we have a NUL terminator, copy it, too */
1614 if (binPath_sz < max_len - 1) {
1615 binPath_sz += 1;
1616 }
1617
1618 /* Pre-Flight the space requiremnts */
1619
1620 /* Account for the padding that fills out binPath to the next word */
1621 alignedBinPath_sz += (binPath_sz & (sizeof(int) - 1)) ? (sizeof(int) - (binPath_sz & (sizeof(int) - 1))) : 0;
1622
1623 placeHere = where + size;
1624
1625 /* Account for the bytes needed to keep placeHere word aligned */
1626 addThis = (placeHere & (sizeof(int) - 1)) ? (sizeof(int) - (placeHere & (sizeof(int) - 1))) : 0;
1627
1628 /* Add up all the space that is needed */
1629 extraSpaceNeeded = alignedBinPath_sz + addThis + binPath_sz + (4 * sizeof(int));
1630
1631 /* is there is room to tack on argv[0]? */
1632 if ((buflen & ~(sizeof(int) - 1)) >= (size + extraSpaceNeeded)) {
1633 placeHere += addThis;
1634 suword(placeHere, 0);
1635 placeHere += sizeof(int);
1636 suword(placeHere, 0xBFFF0000);
1637 placeHere += sizeof(int);
1638 suword(placeHere, 0);
1639 placeHere += sizeof(int);
1640 error = copyout(data, placeHere, binPath_sz);
1641 if (!error) {
1642 placeHere += binPath_sz;
1643 suword(placeHere, 0);
1644 size += extraSpaceNeeded;
1645 }
1646 }
1647 }
1648 }
1649
1650 calculate_size:
1651 /* Size has already been calculated for the where != NULL case */
1652 if (where == USER_ADDR_NULL) {
1653 size = argslen;
1654 if (argc_yes) {
1655 size += sizeof(int);
1656 } else {
1657 /*
1658 * old PROCARGS will return the executable's path and plus some
1659 * extra space for work alignment and data tags
1660 */
1661 size += PATH_MAX + (6 * sizeof(int));
1662 }
1663 size += (size & (sizeof(int) - 1)) ? (sizeof(int) - (size & (sizeof(int) - 1))) : 0;
1664 }
1665
1666 *sizep = size;
1667
1668 finish:
1669 if (p != NULL) {
1670 proc_rele(p);
1671 }
1672 if (tmp != NULL) {
1673 vm_map_copy_discard(tmp);
1674 }
1675 if (proc_map != NULL) {
1676 vm_map_deallocate(proc_map);
1677 }
1678 if (copy_start != (vm_offset_t) 0) {
1679 kmem_free(kernel_map, copy_start, arg_size);
1680 }
1681 return error;
1682 }
1683
1684
1685 /*
1686 * Max number of concurrent aio requests
1687 */
1688 STATIC int
sysctl_aiomax(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)1689 sysctl_aiomax
1690 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1691 {
1692 int new_value, changed;
1693 int error = sysctl_io_number(req, aio_max_requests, sizeof(int), &new_value, &changed);
1694 if (changed) {
1695 /* make sure the system-wide limit is greater than the per process limit */
1696 if (new_value >= aio_max_requests_per_process && new_value <= AIO_MAX_REQUESTS) {
1697 aio_max_requests = new_value;
1698 } else {
1699 error = EINVAL;
1700 }
1701 }
1702 return error;
1703 }
1704
1705
1706 /*
1707 * Max number of concurrent aio requests per process
1708 */
1709 STATIC int
sysctl_aioprocmax(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)1710 sysctl_aioprocmax
1711 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1712 {
1713 int new_value, changed;
1714 int error = sysctl_io_number(req, aio_max_requests_per_process, sizeof(int), &new_value, &changed);
1715 if (changed) {
1716 /* make sure per process limit is less than the system-wide limit */
1717 if (new_value <= aio_max_requests && new_value >= AIO_LISTIO_MAX) {
1718 aio_max_requests_per_process = new_value;
1719 } else {
1720 error = EINVAL;
1721 }
1722 }
1723 return error;
1724 }
1725
1726
1727 /*
1728 * Max number of async IO worker threads
1729 */
1730 STATIC int
sysctl_aiothreads(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)1731 sysctl_aiothreads
1732 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1733 {
1734 int new_value, changed;
1735 int error = sysctl_io_number(req, aio_worker_threads, sizeof(int), &new_value, &changed);
1736 if (changed) {
1737 /* we only allow an increase in the number of worker threads */
1738 if (new_value > aio_worker_threads) {
1739 _aio_create_worker_threads((new_value - aio_worker_threads));
1740 aio_worker_threads = new_value;
1741 } else {
1742 error = EINVAL;
1743 }
1744 }
1745 return error;
1746 }
1747
1748
1749 /*
1750 * System-wide limit on the max number of processes
1751 */
1752 STATIC int
sysctl_maxproc(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)1753 sysctl_maxproc
1754 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1755 {
1756 int new_value, changed;
1757 int error = sysctl_io_number(req, maxproc, sizeof(int), &new_value, &changed);
1758 if (changed) {
1759 AUDIT_ARG(value32, new_value);
1760 /* make sure the system-wide limit is less than the configured hard
1761 * limit set at kernel compilation */
1762 if (new_value <= hard_maxproc && new_value > 0) {
1763 maxproc = new_value;
1764 } else {
1765 error = EINVAL;
1766 }
1767 }
1768 return error;
1769 }
1770
1771 extern int sched_enable_smt;
1772 STATIC int
sysctl_sched_enable_smt(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)1773 sysctl_sched_enable_smt
1774 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1775 {
1776 int new_value, changed;
1777 int error = sysctl_io_number(req, sched_enable_smt, sizeof(int), &new_value, &changed);
1778 if (error) {
1779 return error;
1780 }
1781 kern_return_t kret = KERN_SUCCESS;
1782 if (changed) {
1783 AUDIT_ARG(value32, new_value);
1784 if (new_value == 0) {
1785 sched_enable_smt = 0;
1786 kret = enable_smt_processors(false);
1787 } else {
1788 sched_enable_smt = 1;
1789 kret = enable_smt_processors(true);
1790 }
1791 }
1792 switch (kret) {
1793 case KERN_SUCCESS:
1794 error = 0;
1795 break;
1796 case KERN_INVALID_ARGUMENT:
1797 error = EINVAL;
1798 break;
1799 case KERN_FAILURE:
1800 error = EBUSY;
1801 break;
1802 default:
1803 error = ENOENT;
1804 break;
1805 }
1806
1807 return error;
1808 }
1809
1810 SYSCTL_STRING(_kern, KERN_OSTYPE, ostype,
1811 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1812 ostype, 0, "");
1813 SYSCTL_STRING(_kern, KERN_OSRELEASE, osrelease,
1814 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1815 osrelease, 0, "");
1816 SYSCTL_INT(_kern, KERN_OSREV, osrevision,
1817 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1818 (int *)NULL, BSD, "");
1819 SYSCTL_STRING(_kern, KERN_VERSION, version,
1820 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1821 version, 0, "");
1822 SYSCTL_STRING(_kern, OID_AUTO, uuid,
1823 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
1824 &kernel_uuid_string[0], 0, "");
1825
1826 SYSCTL_STRING(_kern, OID_AUTO, osbuildconfig,
1827 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLFLAG_MASKED,
1828 &osbuild_config[0], 0, "");
1829
1830 #if DEBUG
1831 #ifndef DKPR
1832 #define DKPR 1
1833 #endif
1834 #endif
1835
1836 #if DKPR
1837 int debug_kprint_syscall = 0;
1838 char debug_kprint_syscall_process[MAXCOMLEN + 1];
1839
1840 /* Thread safe: bits and string value are not used to reclaim state */
1841 SYSCTL_INT(_debug, OID_AUTO, kprint_syscall,
1842 CTLFLAG_RW | CTLFLAG_LOCKED, &debug_kprint_syscall, 0, "kprintf syscall tracing");
1843 SYSCTL_STRING(_debug, OID_AUTO, kprint_syscall_process,
1844 CTLFLAG_RW | CTLFLAG_LOCKED, debug_kprint_syscall_process, sizeof(debug_kprint_syscall_process),
1845 "name of process for kprintf syscall tracing");
1846
1847 int
debug_kprint_current_process(const char ** namep)1848 debug_kprint_current_process(const char **namep)
1849 {
1850 struct proc *p = current_proc();
1851
1852 if (p == NULL) {
1853 return 0;
1854 }
1855
1856 if (debug_kprint_syscall_process[0]) {
1857 /* user asked to scope tracing to a particular process name */
1858 if (0 == strncmp(debug_kprint_syscall_process,
1859 p->p_comm, sizeof(debug_kprint_syscall_process))) {
1860 /* no value in telling the user that we traced what they asked */
1861 if (namep) {
1862 *namep = NULL;
1863 }
1864
1865 return 1;
1866 } else {
1867 return 0;
1868 }
1869 }
1870
1871 /* trace all processes. Tell user what we traced */
1872 if (namep) {
1873 *namep = p->p_comm;
1874 }
1875
1876 return 1;
1877 }
1878 #endif
1879
1880 /* PR-5293665: need to use a callback function for kern.osversion to set
1881 * osversion in IORegistry */
1882
1883 STATIC int
sysctl_osversion(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)1884 sysctl_osversion(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
1885 {
1886 int rval = 0;
1887
1888 rval = sysctl_handle_string(oidp, arg1, arg2, req);
1889
1890 if (req->newptr) {
1891 IORegistrySetOSBuildVersion((char *)arg1);
1892 }
1893
1894 return rval;
1895 }
1896
1897 SYSCTL_PROC(_kern, KERN_OSVERSION, osversion,
1898 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
1899 osversion, 256 /* OSVERSIZE*/,
1900 sysctl_osversion, "A", "");
1901
1902 static bool
_already_set_or_not_launchd(struct sysctl_req * req,char * val)1903 _already_set_or_not_launchd(struct sysctl_req *req, char *val)
1904 {
1905 if (req->newptr != 0) {
1906 /*
1907 * Can only ever be set by launchd, and only once at boot.
1908 */
1909 if (proc_getpid(req->p) != 1 || val[0] != '\0') {
1910 return true;
1911 }
1912 }
1913 return false;
1914 }
1915
1916 #define kRootsInstalledReadWriteEntitlement "com.apple.private.roots-installed-read-write"
1917 #define kRootsInstalledReadOnlyEntitlement "com.apple.private.roots-installed-read-only"
1918 uint64_t roots_installed = 0;
1919
1920 static int
sysctl_roots_installed(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)1921 sysctl_roots_installed
1922 (__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
1923 {
1924 int error = 0;
1925
1926 if (req->newptr != 0) {
1927 /* a ReadWrite entitlement is required for updating this syscl
1928 * meanwhile, only allow write once
1929 */
1930 if (!IOCurrentTaskHasEntitlement(kRootsInstalledReadWriteEntitlement) || (roots_installed != 0)) {
1931 return EPERM;
1932 }
1933 } else {
1934 /* for reader of this sysctl, need either ReadWrite or ReadOnly entitlement */
1935 if (!IOCurrentTaskHasEntitlement(kRootsInstalledReadWriteEntitlement) &&
1936 !IOCurrentTaskHasEntitlement(kRootsInstalledReadOnlyEntitlement)) {
1937 return EPERM;
1938 }
1939 }
1940
1941 error = sysctl_handle_quad(oidp, arg1, arg2, req);
1942
1943 return error;
1944 }
1945
1946 SYSCTL_PROC(_kern, OID_AUTO, roots_installed,
1947 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
1948 &roots_installed, sizeof(roots_installed),
1949 sysctl_roots_installed, "Q", "");
1950
1951 #if XNU_TARGET_OS_OSX
1952 static int
sysctl_system_version_compat(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)1953 sysctl_system_version_compat
1954 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
1955 {
1956 int oldval = (task_has_system_version_compat_enabled(current_task()));
1957 int new_value = 0, changed = 0;
1958
1959 int error = sysctl_io_number(req, oldval, sizeof(int), &new_value, &changed);
1960 if (changed) {
1961 task_set_system_version_compat_enabled(current_task(), (new_value));
1962 }
1963 return error;
1964 }
1965
1966 SYSCTL_PROC(_kern, OID_AUTO, system_version_compat,
1967 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
1968 0, 0, sysctl_system_version_compat, "A", "");
1969
1970 char osproductversioncompat[48] = { '\0' };
1971
1972 static int
sysctl_osproductversioncompat(struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)1973 sysctl_osproductversioncompat(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
1974 {
1975 if (_already_set_or_not_launchd(req, osproductversioncompat)) {
1976 return EPERM;
1977 }
1978 return sysctl_handle_string(oidp, arg1, arg2, req);
1979 }
1980
1981
1982 SYSCTL_PROC(_kern, OID_AUTO, osproductversioncompat,
1983 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
1984 osproductversioncompat, sizeof(osproductversioncompat),
1985 sysctl_osproductversioncompat, "A", "The ProductVersion from SystemVersionCompat.plist");
1986 #endif
1987
1988 char osproductversion[48] = { '\0' };
1989
1990 static char iossupportversion_string[48] = { '\0' };
1991
1992 static int
sysctl_osproductversion(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)1993 sysctl_osproductversion(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
1994 {
1995 if (_already_set_or_not_launchd(req, osproductversion)) {
1996 return EPERM;
1997 }
1998
1999 #if XNU_TARGET_OS_OSX
2000 if (task_has_system_version_compat_enabled(current_task()) && (osproductversioncompat[0] != '\0')) {
2001 return sysctl_handle_string(oidp, osproductversioncompat, arg2, req);
2002 } else {
2003 return sysctl_handle_string(oidp, arg1, arg2, req);
2004 }
2005 #else
2006 return sysctl_handle_string(oidp, arg1, arg2, req);
2007 #endif
2008 }
2009
2010 #if XNU_TARGET_OS_OSX
2011 static_assert(sizeof(osproductversioncompat) == sizeof(osproductversion),
2012 "osproductversion size matches osproductversioncompat size");
2013 #endif
2014
2015 SYSCTL_PROC(_kern, OID_AUTO, osproductversion,
2016 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2017 osproductversion, sizeof(osproductversion),
2018 sysctl_osproductversion, "A", "The ProductVersion from SystemVersion.plist");
2019
2020 char osreleasetype[48] = { '\0' };
2021
2022 STATIC int
sysctl_osreleasetype(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2023 sysctl_osreleasetype(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2024 {
2025 if (_already_set_or_not_launchd(req, osreleasetype)) {
2026 return EPERM;
2027 }
2028 return sysctl_handle_string(oidp, arg1, arg2, req);
2029 }
2030
2031 void reset_osreleasetype(void);
2032
2033 void
reset_osreleasetype(void)2034 reset_osreleasetype(void)
2035 {
2036 memset(osreleasetype, 0, sizeof(osreleasetype));
2037 }
2038
2039 SYSCTL_PROC(_kern, OID_AUTO, osreleasetype,
2040 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2041 osreleasetype, sizeof(osreleasetype),
2042 sysctl_osreleasetype, "A", "The ReleaseType from SystemVersion.plist");
2043
2044 STATIC int
sysctl_iossupportversion(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2045 sysctl_iossupportversion(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2046 {
2047 if (_already_set_or_not_launchd(req, iossupportversion_string)) {
2048 return EPERM;
2049 }
2050
2051 return sysctl_handle_string(oidp, arg1, arg2, req);
2052 }
2053
2054 SYSCTL_PROC(_kern, OID_AUTO, iossupportversion,
2055 CTLFLAG_RW | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2056 iossupportversion_string, sizeof(iossupportversion_string),
2057 sysctl_iossupportversion, "A", "The iOSSupportVersion from SystemVersion.plist");
2058
2059 static uint64_t osvariant_status = 0;
2060
2061 STATIC int
sysctl_osvariant_status(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2062 sysctl_osvariant_status(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2063 {
2064 if (req->newptr != 0) {
2065 /*
2066 * Can only ever be set by launchd, and only once.
2067 * Reset by usrctl() -> reset_osvariant_status() during
2068 * userspace reboot, since userspace could reboot into
2069 * a different variant.
2070 */
2071 if (proc_getpid(req->p) != 1 || osvariant_status != 0) {
2072 return EPERM;
2073 }
2074 }
2075
2076 int err = sysctl_handle_quad(oidp, arg1, arg2, req);
2077
2078 reset_debug_syscall_rejection_mode();
2079
2080 return err;
2081 }
2082
2083 SYSCTL_PROC(_kern, OID_AUTO, osvariant_status,
2084 CTLFLAG_RW | CTLTYPE_QUAD | CTLFLAG_LOCKED | CTLFLAG_MASKED,
2085 &osvariant_status, sizeof(osvariant_status),
2086 sysctl_osvariant_status, "Q", "Opaque flags used to cache OS variant information");
2087
2088 static bool
_os_variant_check_disabled(enum os_variant_property property)2089 _os_variant_check_disabled(enum os_variant_property property)
2090 {
2091 return (osvariant_status >> (32 + property)) & 0x1;
2092 }
2093
2094 static bool
_os_variant_has(enum os_variant_status_flags_positions p)2095 _os_variant_has(enum os_variant_status_flags_positions p)
2096 {
2097 return ((osvariant_status >> (p * OS_VARIANT_STATUS_BIT_WIDTH)) & OS_VARIANT_STATUS_MASK) == OS_VARIANT_S_YES;
2098 }
2099
2100 bool
os_variant_has_internal_diagnostics(__unused const char * subsystem)2101 os_variant_has_internal_diagnostics(__unused const char *subsystem)
2102 {
2103 if (_os_variant_check_disabled(OS_VARIANT_PROPERTY_DIAGNOSTICS)) {
2104 return false;
2105 }
2106 #if XNU_TARGET_OS_OSX
2107 return _os_variant_has(OS_VARIANT_SFP_INTERNAL_CONTENT) || _os_variant_has(OS_VARIANT_SFP_INTERNAL_DIAGS_PROFILE);
2108 #else
2109 return _os_variant_has(OS_VARIANT_SFP_INTERNAL_RELEASE_TYPE);
2110 #endif /* XNU_TARGET_OS_OSX */
2111 }
2112
2113 void reset_osvariant_status(void);
2114
2115 void
reset_osvariant_status(void)2116 reset_osvariant_status(void)
2117 {
2118 osvariant_status = 0;
2119 reset_debug_syscall_rejection_mode();
2120 }
2121
2122 extern void commpage_update_dyld_flags(uint64_t);
2123 TUNABLE_WRITEABLE(uint64_t, dyld_flags, "dyld_flags", 0);
2124
2125 STATIC int
sysctl_dyld_flags(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2126 sysctl_dyld_flags(__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2127 {
2128 /*
2129 * Can only ever be set by launchd, possibly several times
2130 * as dyld may change its mind after a userspace reboot.
2131 */
2132 if (req->newptr != 0 && proc_getpid(req->p) != 1) {
2133 return EPERM;
2134 }
2135
2136 int res = sysctl_handle_quad(oidp, arg1, arg2, req);
2137 if (req->newptr && res == 0) {
2138 commpage_update_dyld_flags(dyld_flags);
2139 }
2140 return res;
2141 }
2142
2143 SYSCTL_PROC(_kern, OID_AUTO, dyld_flags,
2144 CTLFLAG_RW | CTLTYPE_QUAD | CTLFLAG_LOCKED | CTLFLAG_MASKED,
2145 &dyld_flags, sizeof(dyld_flags),
2146 sysctl_dyld_flags, "Q", "Opaque flags used to cache dyld system-wide configuration");
2147
2148 #if defined(XNU_TARGET_OS_BRIDGE)
2149 char macosproductversion[MACOS_VERS_LEN] = { '\0' };
2150
2151 SYSCTL_STRING(_kern, OID_AUTO, macosproductversion,
2152 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2153 &macosproductversion[0], MACOS_VERS_LEN, "The currently running macOS ProductVersion (from SystemVersion.plist on macOS)");
2154
2155 char macosversion[MACOS_VERS_LEN] = { '\0' };
2156
2157 SYSCTL_STRING(_kern, OID_AUTO, macosversion,
2158 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2159 &macosversion[0], MACOS_VERS_LEN, "The currently running macOS build version");
2160 #endif
2161
2162 STATIC int
sysctl_sysctl_bootargs(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2163 sysctl_sysctl_bootargs
2164 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2165 {
2166 int error;
2167 char buf[BOOT_LINE_LENGTH];
2168
2169 strlcpy(buf, PE_boot_args(), BOOT_LINE_LENGTH);
2170 error = sysctl_io_string(req, buf, BOOT_LINE_LENGTH, 0, NULL);
2171 return error;
2172 }
2173
2174 SYSCTL_PROC(_kern, OID_AUTO, bootargs,
2175 CTLFLAG_LOCKED | CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING,
2176 NULL, 0,
2177 sysctl_sysctl_bootargs, "A", "bootargs");
2178
2179 STATIC int
sysctl_kernelcacheuuid(struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2180 sysctl_kernelcacheuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2181 {
2182 int rval = ENOENT;
2183 if (kernelcache_uuid_valid) {
2184 rval = sysctl_handle_string(oidp, arg1, arg2, req);
2185 }
2186 return rval;
2187 }
2188
2189 SYSCTL_PROC(_kern, OID_AUTO, kernelcacheuuid,
2190 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2191 kernelcache_uuid_string, sizeof(kernelcache_uuid_string),
2192 sysctl_kernelcacheuuid, "A", "");
2193
2194 STATIC int
sysctl_systemfilesetuuid(struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2195 sysctl_systemfilesetuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2196 {
2197 int rval = ENOENT;
2198 if (pageablekc_uuid_valid) {
2199 rval = sysctl_handle_string(oidp, arg1, arg2, req);
2200 }
2201 return rval;
2202 }
2203
2204 SYSCTL_PROC(_kern, OID_AUTO, systemfilesetuuid,
2205 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2206 pageablekc_uuid_string, sizeof(pageablekc_uuid_string),
2207 sysctl_systemfilesetuuid, "A", "");
2208
2209 STATIC int
sysctl_auxiliaryfilesetuuid(struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2210 sysctl_auxiliaryfilesetuuid(struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2211 {
2212 int rval = ENOENT;
2213 if (auxkc_uuid_valid) {
2214 rval = sysctl_handle_string(oidp, arg1, arg2, req);
2215 }
2216 return rval;
2217 }
2218
2219 SYSCTL_PROC(_kern, OID_AUTO, auxiliaryfilesetuuid,
2220 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2221 auxkc_uuid_string, sizeof(auxkc_uuid_string),
2222 sysctl_auxiliaryfilesetuuid, "A", "");
2223
2224 STATIC int
sysctl_filesetuuid(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2225 sysctl_filesetuuid(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2226 {
2227 int rval = ENOENT;
2228 kc_format_t kcformat;
2229 kernel_mach_header_t *mh;
2230 void *uuid = NULL;
2231 unsigned long uuidlen = 0;
2232 uuid_string_t uuid_str;
2233
2234 if (!PE_get_primary_kc_format(&kcformat) || kcformat != KCFormatFileset) {
2235 return rval;
2236 }
2237
2238 mh = (kernel_mach_header_t *)PE_get_kc_header(KCKindPrimary);
2239 uuid = getuuidfromheader(mh, &uuidlen);
2240
2241 if ((uuid != NULL) && (uuidlen == sizeof(uuid_t))) {
2242 uuid_unparse_upper(*(uuid_t *)uuid, uuid_str);
2243 rval = sysctl_io_string(req, (char *)uuid_str, sizeof(uuid_str), 0, NULL);
2244 }
2245
2246 return rval;
2247 }
2248
2249 SYSCTL_PROC(_kern, OID_AUTO, filesetuuid,
2250 CTLFLAG_RD | CTLFLAG_KERN | CTLTYPE_STRING | CTLFLAG_LOCKED,
2251 NULL, 0,
2252 sysctl_filesetuuid, "A", "");
2253
2254
2255 SYSCTL_INT(_kern, KERN_MAXFILES, maxfiles,
2256 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2257 &maxfiles, 0, "");
2258 SYSCTL_INT(_kern, KERN_ARGMAX, argmax,
2259 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2260 (int *)NULL, ARG_MAX, "");
2261 SYSCTL_INT(_kern, KERN_POSIX1, posix1version,
2262 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2263 (int *)NULL, _POSIX_VERSION, "");
2264 SYSCTL_INT(_kern, KERN_NGROUPS, ngroups,
2265 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2266 (int *)NULL, NGROUPS_MAX, "");
2267 SYSCTL_INT(_kern, KERN_JOB_CONTROL, job_control,
2268 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2269 (int *)NULL, 1, "");
2270 #if 1 /* _POSIX_SAVED_IDS from <unistd.h> */
2271 SYSCTL_INT(_kern, KERN_SAVED_IDS, saved_ids,
2272 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2273 (int *)NULL, 1, "");
2274 #else
2275 SYSCTL_INT(_kern, KERN_SAVED_IDS, saved_ids,
2276 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
2277 NULL, 0, "");
2278 #endif
2279 SYSCTL_INT(_kern, OID_AUTO, num_files,
2280 CTLFLAG_RD | CTLFLAG_LOCKED,
2281 &nfiles, 0, "");
2282 SYSCTL_COMPAT_INT(_kern, OID_AUTO, num_vnodes,
2283 CTLFLAG_RD | CTLFLAG_LOCKED,
2284 &numvnodes, 0, "");
2285 SYSCTL_INT(_kern, OID_AUTO, num_tasks,
2286 CTLFLAG_RD | CTLFLAG_LOCKED,
2287 &task_max, 0, "");
2288 SYSCTL_INT(_kern, OID_AUTO, num_threads,
2289 CTLFLAG_RD | CTLFLAG_LOCKED,
2290 &thread_max, 0, "");
2291 SYSCTL_INT(_kern, OID_AUTO, num_taskthreads,
2292 CTLFLAG_RD | CTLFLAG_LOCKED,
2293 &task_threadmax, 0, "");
2294 SYSCTL_LONG(_kern, OID_AUTO, num_recycledvnodes,
2295 CTLFLAG_RD | CTLFLAG_LOCKED,
2296 &num_recycledvnodes, "");
2297 SYSCTL_COMPAT_INT(_kern, OID_AUTO, free_vnodes,
2298 CTLFLAG_RD | CTLFLAG_LOCKED,
2299 &freevnodes, 0, "");
2300
2301 STATIC int
sysctl_maxvnodes(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2302 sysctl_maxvnodes(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2303 {
2304 int oldval = desiredvnodes;
2305 int error = sysctl_io_number(req, desiredvnodes, sizeof(int), &desiredvnodes, NULL);
2306
2307 if (oldval != desiredvnodes) {
2308 resize_namecache(desiredvnodes);
2309 }
2310
2311 return error;
2312 }
2313
2314 SYSCTL_INT(_kern, OID_AUTO, namecache_disabled,
2315 CTLFLAG_RW | CTLFLAG_LOCKED,
2316 &nc_disabled, 0, "");
2317
2318 SYSCTL_PROC(_kern, KERN_MAXVNODES, maxvnodes,
2319 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2320 0, 0, sysctl_maxvnodes, "I", "");
2321
2322 SYSCTL_PROC(_kern, KERN_MAXPROC, maxproc,
2323 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2324 0, 0, sysctl_maxproc, "I", "");
2325
2326 SYSCTL_PROC(_kern, KERN_AIOMAX, aiomax,
2327 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2328 0, 0, sysctl_aiomax, "I", "");
2329
2330 SYSCTL_PROC(_kern, KERN_AIOPROCMAX, aioprocmax,
2331 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2332 0, 0, sysctl_aioprocmax, "I", "");
2333
2334 SYSCTL_PROC(_kern, KERN_AIOTHREADS, aiothreads,
2335 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2336 0, 0, sysctl_aiothreads, "I", "");
2337
2338 SYSCTL_PROC(_kern, OID_AUTO, sched_enable_smt,
2339 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_KERN,
2340 0, 0, sysctl_sched_enable_smt, "I", "");
2341
2342 extern int sched_allow_NO_SMT_threads;
2343 SYSCTL_INT(_kern, OID_AUTO, sched_allow_NO_SMT_threads,
2344 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2345 &sched_allow_NO_SMT_threads, 0, "");
2346
2347 extern int sched_avoid_cpu0;
2348 SYSCTL_INT(_kern, OID_AUTO, sched_rt_avoid_cpu0,
2349 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2350 &sched_avoid_cpu0, 0, "If 1, choose cpu0 after all other primaries; if 2, choose cpu0 and cpu1 last, after all other cpus including secondaries");
2351
2352 #if (DEVELOPMENT || DEBUG)
2353
2354 static int
sysctl_kern_max_unsafe_rt_quanta(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2355 sysctl_kern_max_unsafe_rt_quanta(__unused struct sysctl_oid *oidp,
2356 __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2357 {
2358 extern void sched_set_max_unsafe_rt_quanta(int);
2359 extern int max_unsafe_rt_quanta;
2360
2361 int new_value, changed;
2362 int old_value = max_unsafe_rt_quanta;
2363 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value,
2364 &changed);
2365 if (changed) {
2366 sched_set_max_unsafe_rt_quanta(new_value);
2367 }
2368
2369 return error;
2370 }
2371
2372 SYSCTL_PROC(_kern, OID_AUTO, max_unsafe_rt_quanta,
2373 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2374 0, 0, sysctl_kern_max_unsafe_rt_quanta, "I",
2375 "Number of quanta to allow a realtime "
2376 "thread to run before being penalized");
2377
2378 static int
sysctl_kern_max_unsafe_fixed_quanta(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2379 sysctl_kern_max_unsafe_fixed_quanta(__unused struct sysctl_oid *oidp,
2380 __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2381 {
2382 extern void sched_set_max_unsafe_fixed_quanta(int);
2383 extern int max_unsafe_fixed_quanta;
2384
2385 int new_value, changed;
2386 int old_value = max_unsafe_fixed_quanta;
2387 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value,
2388 &changed);
2389 if (changed) {
2390 sched_set_max_unsafe_fixed_quanta(new_value);
2391 }
2392
2393 return error;
2394 }
2395
2396 SYSCTL_PROC(_kern, OID_AUTO, max_unsafe_fixed_quanta,
2397 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2398 0, 0, sysctl_kern_max_unsafe_fixed_quanta, "I",
2399 "Number of quanta to allow a fixed sched mode "
2400 "thread to run before being penalized");
2401
2402 static int
sysctl_kern_quantum_us(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2403 sysctl_kern_quantum_us(__unused struct sysctl_oid *oidp, __unused void *arg1,
2404 __unused int arg2, struct sysctl_req *req)
2405 {
2406 extern uint64_t sysctl_get_quantum_us(void);
2407 const uint64_t quantum_us = sysctl_get_quantum_us();
2408
2409 return sysctl_io_number(req, quantum_us, sizeof(quantum_us), NULL, NULL);
2410 }
2411
2412 SYSCTL_PROC(_kern, OID_AUTO, quantum_us,
2413 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
2414 0, 0, sysctl_kern_quantum_us, "Q",
2415 "Length of scheduling quantum in microseconds");
2416
2417 extern int smt_sched_bonus_16ths;
2418 SYSCTL_INT(_kern, OID_AUTO, smt_sched_bonus_16ths,
2419 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2420 &smt_sched_bonus_16ths, 0, "");
2421
2422 extern int smt_timeshare_enabled;
2423 SYSCTL_INT(_kern, OID_AUTO, sched_smt_timeshare_enable,
2424 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2425 &smt_timeshare_enabled, 0, "");
2426
2427 extern int sched_smt_balance;
2428 SYSCTL_INT(_kern, OID_AUTO, sched_smt_balance,
2429 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2430 &sched_smt_balance, 0, "");
2431 extern int sched_allow_rt_smt;
2432 SYSCTL_INT(_kern, OID_AUTO, sched_allow_rt_smt,
2433 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2434 &sched_allow_rt_smt, 0, "");
2435 extern int sched_allow_rt_steal;
2436 SYSCTL_INT(_kern, OID_AUTO, sched_allow_rt_steal,
2437 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2438 &sched_allow_rt_steal, 0, "");
2439 extern int sched_backup_cpu_timeout_count;
2440 SYSCTL_INT(_kern, OID_AUTO, sched_backup_cpu_timeout_count,
2441 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2442 &sched_backup_cpu_timeout_count, 0, "The maximum number of 10us delays before allowing a backup cpu to select a thread");
2443 #if __arm64__
2444 extern uint32_t perfcontrol_requested_recommended_cores;
2445 SYSCTL_UINT(_kern, OID_AUTO, sched_recommended_cores,
2446 CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2447 &perfcontrol_requested_recommended_cores, 0, "");
2448
2449 /* Scheduler perfcontrol callouts sysctls */
2450 SYSCTL_DECL(_kern_perfcontrol_callout);
2451 SYSCTL_NODE(_kern, OID_AUTO, perfcontrol_callout, CTLFLAG_RW | CTLFLAG_LOCKED, 0,
2452 "scheduler perfcontrol callouts");
2453
2454 extern int perfcontrol_callout_stats_enabled;
2455 SYSCTL_INT(_kern_perfcontrol_callout, OID_AUTO, stats_enabled,
2456 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2457 &perfcontrol_callout_stats_enabled, 0, "");
2458
2459 extern uint64_t perfcontrol_callout_stat_avg(perfcontrol_callout_type_t type,
2460 perfcontrol_callout_stat_t stat);
2461
2462 /* On-Core Callout */
2463 STATIC int
sysctl_perfcontrol_callout_stat(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)2464 sysctl_perfcontrol_callout_stat
2465 (__unused struct sysctl_oid *oidp, void *arg1, int arg2, struct sysctl_req *req)
2466 {
2467 perfcontrol_callout_stat_t stat = (perfcontrol_callout_stat_t)arg1;
2468 perfcontrol_callout_type_t type = (perfcontrol_callout_type_t)arg2;
2469 return sysctl_io_number(req, (int)perfcontrol_callout_stat_avg(type, stat),
2470 sizeof(int), NULL, NULL);
2471 }
2472
2473 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, oncore_instr,
2474 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2475 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_ON_CORE,
2476 sysctl_perfcontrol_callout_stat, "I", "");
2477 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, oncore_cycles,
2478 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2479 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_ON_CORE,
2480 sysctl_perfcontrol_callout_stat, "I", "");
2481 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, offcore_instr,
2482 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2483 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_OFF_CORE,
2484 sysctl_perfcontrol_callout_stat, "I", "");
2485 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, offcore_cycles,
2486 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2487 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_OFF_CORE,
2488 sysctl_perfcontrol_callout_stat, "I", "");
2489 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, context_instr,
2490 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2491 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_CONTEXT,
2492 sysctl_perfcontrol_callout_stat, "I", "");
2493 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, context_cycles,
2494 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2495 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_CONTEXT,
2496 sysctl_perfcontrol_callout_stat, "I", "");
2497 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, update_instr,
2498 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2499 (void *)PERFCONTROL_STAT_INSTRS, PERFCONTROL_CALLOUT_STATE_UPDATE,
2500 sysctl_perfcontrol_callout_stat, "I", "");
2501 SYSCTL_PROC(_kern_perfcontrol_callout, OID_AUTO, update_cycles,
2502 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2503 (void *)PERFCONTROL_STAT_CYCLES, PERFCONTROL_CALLOUT_STATE_UPDATE,
2504 sysctl_perfcontrol_callout_stat, "I", "");
2505
2506 #if __AMP__
2507 extern int sched_amp_idle_steal;
2508 SYSCTL_INT(_kern, OID_AUTO, sched_amp_idle_steal,
2509 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2510 &sched_amp_idle_steal, 0, "");
2511 extern int sched_amp_spill_steal;
2512 SYSCTL_INT(_kern, OID_AUTO, sched_amp_spill_steal,
2513 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2514 &sched_amp_spill_steal, 0, "");
2515 extern int sched_amp_spill_count;
2516 SYSCTL_INT(_kern, OID_AUTO, sched_amp_spill_count,
2517 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2518 &sched_amp_spill_count, 0, "");
2519 extern int sched_amp_spill_deferred_ipi;
2520 SYSCTL_INT(_kern, OID_AUTO, sched_amp_spill_deferred_ipi,
2521 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2522 &sched_amp_spill_deferred_ipi, 0, "");
2523 extern int sched_amp_pcores_preempt_immediate_ipi;
2524 SYSCTL_INT(_kern, OID_AUTO, sched_amp_pcores_preempt_immediate_ipi,
2525 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2526 &sched_amp_pcores_preempt_immediate_ipi, 0, "");
2527 #endif /* __AMP__ */
2528 #endif /* __arm64__ */
2529
2530 #if __arm64__
2531 extern int legacy_footprint_entitlement_mode;
2532 SYSCTL_INT(_kern, OID_AUTO, legacy_footprint_entitlement_mode,
2533 CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2534 &legacy_footprint_entitlement_mode, 0, "");
2535 #endif /* __arm64__ */
2536
2537 /*
2538 * Realtime threads are ordered by highest priority first then,
2539 * for threads of the same priority, by earliest deadline first.
2540 * But if sched_rt_runq_strict_priority is false (the default),
2541 * a lower priority thread with an earlier deadline will be preferred
2542 * over a higher priority thread with a later deadline, as long as
2543 * both threads' computations will fit before the later deadline.
2544 */
2545 extern int sched_rt_runq_strict_priority;
2546 SYSCTL_INT(_kern, OID_AUTO, sched_rt_runq_strict_priority,
2547 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2548 &sched_rt_runq_strict_priority, 0, "");
2549
2550 static int
sysctl_kern_sched_rt_n_backup_processors(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2551 sysctl_kern_sched_rt_n_backup_processors(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2552 {
2553 int new_value, changed;
2554 int old_value = sched_get_rt_n_backup_processors();
2555 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2556 if (changed) {
2557 sched_set_rt_n_backup_processors(new_value);
2558 }
2559
2560 return error;
2561 }
2562
2563 SYSCTL_PROC(_kern, OID_AUTO, sched_rt_n_backup_processors,
2564 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2565 0, 0, sysctl_kern_sched_rt_n_backup_processors, "I", "");
2566
2567 static int
sysctl_kern_sched_rt_deadline_epsilon_us(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2568 sysctl_kern_sched_rt_deadline_epsilon_us(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2569 {
2570 int new_value, changed;
2571 int old_value = sched_get_rt_deadline_epsilon();
2572 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2573 if (changed) {
2574 sched_set_rt_deadline_epsilon(new_value);
2575 }
2576
2577 return error;
2578 }
2579
2580 SYSCTL_PROC(_kern, OID_AUTO, sched_rt_deadline_epsilon_us,
2581 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2582 0, 0, sysctl_kern_sched_rt_deadline_epsilon_us, "I", "");
2583
2584 extern int sched_idle_delay_cpuid;
2585 SYSCTL_INT(_kern, OID_AUTO, sched_idle_delay_cpuid,
2586 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
2587 &sched_idle_delay_cpuid, 0, "This cpuid will be delayed by 500us on exiting idle, to simulate interrupt or preemption delays when testing the scheduler");
2588
2589 static int
sysctl_kern_sched_powered_cores(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2590 sysctl_kern_sched_powered_cores(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2591 {
2592 int new_value, changed;
2593 int old_value = sched_get_powered_cores();
2594 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2595 if (changed) {
2596 sched_set_powered_cores(new_value);
2597 }
2598
2599 return error;
2600 }
2601
2602 SYSCTL_PROC(_kern, OID_AUTO, sched_powered_cores,
2603 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2604 0, 0, sysctl_kern_sched_powered_cores, "I", "");
2605
2606 #endif /* (DEVELOPMENT || DEBUG) */
2607
2608 static int
sysctl_kern_suspend_cluster_powerdown(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2609 sysctl_kern_suspend_cluster_powerdown(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2610 {
2611 int new_value, changed;
2612 int old_value = get_cluster_powerdown_user_suspended();
2613 int error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
2614 if (!error && changed) {
2615 if (new_value > 0) {
2616 error = suspend_cluster_powerdown_from_user();
2617 } else {
2618 error = resume_cluster_powerdown_from_user();
2619 }
2620 if (error) {
2621 error = EALREADY;
2622 }
2623 }
2624
2625 return error;
2626 }
2627
2628 SYSCTL_PROC(_kern, OID_AUTO, suspend_cluster_powerdown,
2629 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2630 0, 0, sysctl_kern_suspend_cluster_powerdown, "I", "");
2631
2632
2633 STATIC int
sysctl_securelvl(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2634 sysctl_securelvl
2635 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2636 {
2637 int new_value, changed;
2638 int error = sysctl_io_number(req, securelevel, sizeof(int), &new_value, &changed);
2639 if (changed) {
2640 if (!(new_value < securelevel && proc_getpid(req->p) != 1)) {
2641 proc_list_lock();
2642 securelevel = new_value;
2643 proc_list_unlock();
2644 } else {
2645 error = EPERM;
2646 }
2647 }
2648 return error;
2649 }
2650
2651 SYSCTL_PROC(_kern, KERN_SECURELVL, securelevel,
2652 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
2653 0, 0, sysctl_securelvl, "I", "");
2654
2655
2656 STATIC int
sysctl_domainname(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2657 sysctl_domainname
2658 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2659 {
2660 int error, changed;
2661 char tmpname[MAXHOSTNAMELEN] = {};
2662
2663 lck_mtx_lock(&domainname_lock);
2664 strlcpy(tmpname, domainname, sizeof(tmpname));
2665 lck_mtx_unlock(&domainname_lock);
2666
2667 error = sysctl_io_string(req, tmpname, sizeof(tmpname), 0, &changed);
2668 if (!error && changed) {
2669 lck_mtx_lock(&hostname_lock);
2670 strlcpy(domainname, tmpname, sizeof(domainname));
2671 lck_mtx_unlock(&hostname_lock);
2672 }
2673 return error;
2674 }
2675
2676 SYSCTL_PROC(_kern, KERN_DOMAINNAME, nisdomainname,
2677 CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_LOCKED,
2678 0, 0, sysctl_domainname, "A", "");
2679
2680 SYSCTL_COMPAT_INT(_kern, KERN_HOSTID, hostid,
2681 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2682 &hostid, 0, "");
2683
2684 STATIC int
sysctl_hostname(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2685 sysctl_hostname
2686 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2687 {
2688 int error, changed;
2689 char tmpname[MAXHOSTNAMELEN] = {};
2690
2691 lck_mtx_lock(&hostname_lock);
2692 strlcpy(tmpname, hostname, sizeof(tmpname));
2693 lck_mtx_unlock(&hostname_lock);
2694
2695 error = sysctl_io_string(req, tmpname, sizeof(tmpname), 1, &changed);
2696 if (!error && changed) {
2697 lck_mtx_lock(&hostname_lock);
2698 strlcpy(hostname, tmpname, sizeof(hostname));
2699 lck_mtx_unlock(&hostname_lock);
2700 }
2701 return error;
2702 }
2703
2704 SYSCTL_PROC(_kern, KERN_HOSTNAME, hostname,
2705 CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_LOCKED,
2706 0, 0, sysctl_hostname, "A", "");
2707
2708 STATIC int
sysctl_procname(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2709 sysctl_procname
2710 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2711 {
2712 /* Original code allowed writing, I'm copying this, although this all makes
2713 * no sense to me. Besides, this sysctl is never used. */
2714 return sysctl_io_string(req, &req->p->p_name[0], (2 * MAXCOMLEN + 1), 1, NULL);
2715 }
2716
2717 SYSCTL_PROC(_kern, KERN_PROCNAME, procname,
2718 CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
2719 0, 0, sysctl_procname, "A", "");
2720
2721 SYSCTL_INT(_kern, KERN_SPECULATIVE_READS, speculative_reads_disabled,
2722 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2723 &speculative_reads_disabled, 0, "");
2724
2725 SYSCTL_UINT(_kern, OID_AUTO, preheat_max_bytes,
2726 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2727 &preheat_max_bytes, 0, "");
2728
2729 SYSCTL_UINT(_kern, OID_AUTO, preheat_min_bytes,
2730 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2731 &preheat_min_bytes, 0, "");
2732
2733 SYSCTL_UINT(_kern, OID_AUTO, speculative_prefetch_max,
2734 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2735 &speculative_prefetch_max, 0, "");
2736
2737 SYSCTL_UINT(_kern, OID_AUTO, speculative_prefetch_max_iosize,
2738 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2739 &speculative_prefetch_max_iosize, 0, "");
2740
2741 SYSCTL_UINT(_kern, OID_AUTO, vm_page_free_target,
2742 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2743 &vm_page_free_target, 0, "");
2744
2745 SYSCTL_UINT(_kern, OID_AUTO, vm_page_free_min,
2746 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2747 &vm_page_free_min, 0, "");
2748
2749 SYSCTL_UINT(_kern, OID_AUTO, vm_page_free_reserved,
2750 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2751 &vm_page_free_reserved, 0, "");
2752
2753 SYSCTL_UINT(_kern, OID_AUTO, vm_page_speculative_percentage,
2754 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2755 &vm_pageout_state.vm_page_speculative_percentage, 0, "");
2756
2757 SYSCTL_UINT(_kern, OID_AUTO, vm_page_speculative_q_age_ms,
2758 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2759 &vm_pageout_state.vm_page_speculative_q_age_ms, 0, "");
2760
2761 SYSCTL_UINT(_kern, OID_AUTO, vm_max_delayed_work_limit,
2762 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2763 &vm_max_delayed_work_limit, 0, "");
2764
2765 SYSCTL_UINT(_kern, OID_AUTO, vm_max_batch,
2766 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
2767 &vm_max_batch, 0, "");
2768
2769 SYSCTL_STRING(_kern, OID_AUTO, bootsessionuuid,
2770 CTLFLAG_RD | CTLFLAG_LOCKED,
2771 &bootsessionuuid_string, sizeof(bootsessionuuid_string), "");
2772
2773
2774 STATIC int
sysctl_boottime(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2775 sysctl_boottime
2776 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2777 {
2778 struct timeval tv;
2779 boottime_timeval(&tv);
2780 struct proc *p = req->p;
2781
2782 if (proc_is64bit(p)) {
2783 struct user64_timeval t = {};
2784 t.tv_sec = tv.tv_sec;
2785 t.tv_usec = tv.tv_usec;
2786 return sysctl_io_opaque(req, &t, sizeof(t), NULL);
2787 } else {
2788 struct user32_timeval t = {};
2789 t.tv_sec = (user32_time_t)tv.tv_sec;
2790 t.tv_usec = tv.tv_usec;
2791 return sysctl_io_opaque(req, &t, sizeof(t), NULL);
2792 }
2793 }
2794
2795 SYSCTL_PROC(_kern, KERN_BOOTTIME, boottime,
2796 CTLTYPE_STRUCT | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2797 0, 0, sysctl_boottime, "S,timeval", "");
2798
2799 extern bool IOGetBootUUID(char *);
2800
2801 /* non-static: written by imageboot.c */
2802 uuid_string_t fake_bootuuid;
2803
2804 STATIC int
sysctl_bootuuid(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2805 sysctl_bootuuid
2806 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2807 {
2808 int error = ENOENT;
2809
2810 /* check the first byte to see if the string has been
2811 * populated. this is a uuid_STRING_t, this check would
2812 * not work with a uuid_t.
2813 */
2814 if (fake_bootuuid[0] != '\0') {
2815 error = sysctl_io_string(req, fake_bootuuid, 0, 0, NULL);
2816 goto out;
2817 }
2818
2819 uuid_string_t uuid_string;
2820 if (IOGetBootUUID(uuid_string)) {
2821 uuid_t boot_uuid;
2822 error = uuid_parse(uuid_string, boot_uuid);
2823 if (!error) {
2824 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2825 }
2826 }
2827
2828 out:
2829 return error;
2830 }
2831
2832 SYSCTL_PROC(_kern, OID_AUTO, bootuuid,
2833 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2834 0, 0, sysctl_bootuuid, "A", "");
2835
2836
2837 extern bool IOGetApfsPrebootUUID(char *);
2838 extern bool IOGetAssociatedApfsVolgroupUUID(char *);
2839
2840 STATIC int
sysctl_apfsprebootuuid(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2841 sysctl_apfsprebootuuid
2842 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2843 {
2844 int error = ENOENT;
2845
2846 uuid_string_t uuid_string;
2847 if (IOGetApfsPrebootUUID(uuid_string)) {
2848 uuid_t apfs_preboot_uuid;
2849 error = uuid_parse(uuid_string, apfs_preboot_uuid);
2850 if (!error) {
2851 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2852 }
2853 }
2854
2855 return error;
2856 }
2857
2858 SYSCTL_PROC(_kern, OID_AUTO, apfsprebootuuid,
2859 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2860 0, 0, sysctl_apfsprebootuuid, "A", "");
2861
2862 STATIC int
sysctl_targetsystemvolgroupuuid(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2863 sysctl_targetsystemvolgroupuuid
2864 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2865 {
2866 int error = ENOENT;
2867
2868 uuid_string_t uuid_string;
2869 if (IOGetApfsPrebootUUID(uuid_string)) {
2870 uuid_t apfs_preboot_uuid;
2871 error = uuid_parse(uuid_string, apfs_preboot_uuid);
2872 if (!error) {
2873 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2874 }
2875 } else {
2876 /*
2877 * In special boot modes, such as kcgen-mode, the
2878 * apfs-preboot-uuid property will not be set. Instead, a
2879 * different property, associated-volume-group, will be set
2880 * which indicates the UUID of the VolumeGroup containing the
2881 * system volume into which you will boot.
2882 */
2883 if (IOGetAssociatedApfsVolgroupUUID(uuid_string)) {
2884 uuid_t apfs_preboot_uuid;
2885 error = uuid_parse(uuid_string, apfs_preboot_uuid);
2886 if (!error) {
2887 error = sysctl_io_string(req, __DECONST(char *, uuid_string), 0, 0, NULL);
2888 }
2889 }
2890 }
2891
2892 return error;
2893 }
2894
2895 SYSCTL_PROC(_kern, OID_AUTO, targetsystemvolgroupuuid,
2896 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_MASKED | CTLFLAG_LOCKED,
2897 0, 0, sysctl_targetsystemvolgroupuuid, "A", "");
2898
2899
2900 extern bool IOGetBootManifestHash(char *, size_t *);
2901 extern bool IOGetBootObjectsPath(char *);
2902
2903 STATIC int
sysctl_bootobjectspath(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2904 sysctl_bootobjectspath
2905 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2906 {
2907 int error = ENOENT;
2908
2909 #if defined(__x86_64__)
2910 /* auth-root-dmg is used for the Intel BaseSystem in some flows,
2911 * e.g. createinstallmedia and as part of upgrading from 10.15 or earlier
2912 * under these scenarios, set_fake_bootuuid will be called when pivoting to
2913 * the new root filesystem. need honor the fake bootuuid.
2914 */
2915 if (fake_bootuuid[0] != '\0') {
2916 error = sysctl_io_string(req, fake_bootuuid, 0, 0, NULL);
2917 } else {
2918 /* for intel mac, boot objects reside in [preboot volume]/[bootuuid]
2919 * bootuuid and apfsprebootuuid are populated by efiboot and they are alias.
2920 */
2921 uuid_string_t uuid_string;
2922 if (IOGetBootUUID(uuid_string)) {
2923 uuid_t boot_uuid;
2924 error = uuid_parse(uuid_string, boot_uuid);
2925 if (!error) {
2926 error = sysctl_io_string(req, (char *)uuid_string, 0, 0, NULL);
2927 }
2928 }
2929 }
2930 #else
2931 char boot_obj_path[MAXPATHLEN] = { "\0" };
2932 static const char kAsciiHexChars[] = "0123456789ABCDEF";
2933 unsigned int i, j;
2934
2935 /* Hashed with SHA2-384 or SHA1, boot manifest hash is 48 bytes or 20 bytes
2936 * hence, need a 97 bytes char array for the string.
2937 */
2938 size_t hash_data_size = CCSHA384_OUTPUT_SIZE;
2939 char hash_data[CCSHA384_OUTPUT_SIZE] = { "\0" };
2940 char boot_manifest_hash[CCSHA384_OUTPUT_SIZE * 2 + 1] = { "\0" };;
2941
2942 /* for Apple Silicon Macs, there is a boot-objects-path under IODeviceTree:/chosen
2943 * and boot objects reside in [preboot volume]/[boot-objects-path]
2944 * for embedded platforms, there would be a boot-manifest-hash under IODeviceTree:/chosen
2945 * and boot objects reside in [preboot volume]/[boot-manifest-hash]
2946 */
2947 if (IOGetBootObjectsPath(boot_obj_path)) {
2948 error = sysctl_io_string(req, (char *)boot_obj_path, 0, 0, NULL);
2949 } else if (IOGetBootManifestHash(hash_data, &hash_data_size)) {
2950 j = 0;
2951 for (i = 0; i < hash_data_size; ++i) {
2952 char octet = hash_data[i];
2953 boot_manifest_hash[j++] = kAsciiHexChars[((octet & 0xF0) >> 4)];
2954 boot_manifest_hash[j++] = kAsciiHexChars[(octet & 0x0F)];
2955 }
2956 /* make sure string has null termination */
2957 boot_manifest_hash[j] = '\0';
2958 error = sysctl_io_string(req, (char *)boot_manifest_hash, 0, 0, NULL);
2959 }
2960 #endif
2961 return error;
2962 }
2963
2964 SYSCTL_PROC(_kern, OID_AUTO, bootobjectspath,
2965 CTLTYPE_STRING | CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
2966 0, 0, sysctl_bootobjectspath, "A", "");
2967
2968
2969 STATIC int
sysctl_symfile(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2970 sysctl_symfile
2971 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2972 {
2973 char *str;
2974 int error = get_kernel_symfile(req->p, &str);
2975 if (error) {
2976 return error;
2977 }
2978 return sysctl_io_string(req, str, 0, 0, NULL);
2979 }
2980
2981
2982 SYSCTL_PROC(_kern, KERN_SYMFILE, symfile,
2983 CTLTYPE_STRING | CTLFLAG_RD | CTLFLAG_LOCKED,
2984 0, 0, sysctl_symfile, "A", "");
2985
2986 #if CONFIG_NETBOOT
2987 STATIC int
sysctl_netboot(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)2988 sysctl_netboot
2989 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
2990 {
2991 return sysctl_io_number(req, netboot_root(), sizeof(int), NULL, NULL);
2992 }
2993
2994 SYSCTL_PROC(_kern, KERN_NETBOOT, netboot,
2995 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
2996 0, 0, sysctl_netboot, "I", "");
2997 #endif
2998
2999 #ifdef CONFIG_IMGSRC_ACCESS
3000 /*
3001 * Legacy--act as if only one layer of nesting is possible.
3002 */
3003 STATIC int
sysctl_imgsrcdev(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3004 sysctl_imgsrcdev
3005 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3006 {
3007 vfs_context_t ctx = vfs_context_current();
3008 vnode_t devvp;
3009 int result;
3010
3011 if (!vfs_context_issuser(ctx)) {
3012 return EPERM;
3013 }
3014
3015 if (imgsrc_rootvnodes[0] == NULL) {
3016 return ENOENT;
3017 }
3018
3019 result = vnode_getwithref(imgsrc_rootvnodes[0]);
3020 if (result != 0) {
3021 return result;
3022 }
3023
3024 devvp = vnode_mount(imgsrc_rootvnodes[0])->mnt_devvp;
3025 result = vnode_getwithref(devvp);
3026 if (result != 0) {
3027 goto out;
3028 }
3029
3030 result = sysctl_io_number(req, vnode_specrdev(devvp), sizeof(dev_t), NULL, NULL);
3031
3032 vnode_put(devvp);
3033 out:
3034 vnode_put(imgsrc_rootvnodes[0]);
3035 return result;
3036 }
3037
3038 SYSCTL_PROC(_kern, OID_AUTO, imgsrcdev,
3039 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
3040 0, 0, sysctl_imgsrcdev, "I", "");
3041
3042 STATIC int
sysctl_imgsrcinfo(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3043 sysctl_imgsrcinfo
3044 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3045 {
3046 int error;
3047 struct imgsrc_info info[MAX_IMAGEBOOT_NESTING] = {}; /* 2 for now, no problem */
3048 uint32_t i;
3049 vnode_t rvp, devvp;
3050
3051 if (imgsrc_rootvnodes[0] == NULLVP) {
3052 return ENXIO;
3053 }
3054
3055 for (i = 0; i < MAX_IMAGEBOOT_NESTING; i++) {
3056 /*
3057 * Go get the root vnode.
3058 */
3059 rvp = imgsrc_rootvnodes[i];
3060 if (rvp == NULLVP) {
3061 break;
3062 }
3063
3064 error = vnode_get(rvp);
3065 if (error != 0) {
3066 return error;
3067 }
3068
3069 /*
3070 * For now, no getting at a non-local volume.
3071 */
3072 devvp = vnode_mount(rvp)->mnt_devvp;
3073 if (devvp == NULL) {
3074 vnode_put(rvp);
3075 return EINVAL;
3076 }
3077
3078 error = vnode_getwithref(devvp);
3079 if (error != 0) {
3080 vnode_put(rvp);
3081 return error;
3082 }
3083
3084 /*
3085 * Fill in info.
3086 */
3087 info[i].ii_dev = vnode_specrdev(devvp);
3088 info[i].ii_flags = 0;
3089 info[i].ii_height = i;
3090 bzero(info[i].ii_reserved, sizeof(info[i].ii_reserved));
3091
3092 vnode_put(devvp);
3093 vnode_put(rvp);
3094 }
3095
3096 return sysctl_io_opaque(req, info, i * sizeof(info[0]), NULL);
3097 }
3098
3099 SYSCTL_PROC(_kern, OID_AUTO, imgsrcinfo,
3100 CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_LOCKED,
3101 0, 0, sysctl_imgsrcinfo, "I", "");
3102
3103 #endif /* CONFIG_IMGSRC_ACCESS */
3104
3105
3106 SYSCTL_DECL(_kern_timer);
3107 SYSCTL_NODE(_kern, OID_AUTO, timer, CTLFLAG_RW | CTLFLAG_LOCKED, 0, "timer");
3108
3109
3110 SYSCTL_INT(_kern_timer, OID_AUTO, coalescing_enabled,
3111 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
3112 &mach_timer_coalescing_enabled, 0, "");
3113
3114 SYSCTL_QUAD(_kern_timer, OID_AUTO, deadline_tracking_bin_1,
3115 CTLFLAG_RW | CTLFLAG_LOCKED,
3116 &timer_deadline_tracking_bin_1, "");
3117 SYSCTL_QUAD(_kern_timer, OID_AUTO, deadline_tracking_bin_2,
3118 CTLFLAG_RW | CTLFLAG_LOCKED,
3119 &timer_deadline_tracking_bin_2, "");
3120
3121 SYSCTL_DECL(_kern_timer_longterm);
3122 SYSCTL_NODE(_kern_timer, OID_AUTO, longterm, CTLFLAG_RW | CTLFLAG_LOCKED, 0, "longterm");
3123
3124
3125 /* Must match definition in osfmk/kern/timer_call.c */
3126 enum {
3127 THRESHOLD, QCOUNT,
3128 ENQUEUES, DEQUEUES, ESCALATES, SCANS, PREEMPTS,
3129 LATENCY, LATENCY_MIN, LATENCY_MAX, LONG_TERM_SCAN_LIMIT,
3130 LONG_TERM_SCAN_INTERVAL, LONG_TERM_SCAN_PAUSES,
3131 SCAN_LIMIT, SCAN_INTERVAL, SCAN_PAUSES, SCAN_POSTPONES,
3132 };
3133 extern uint64_t timer_sysctl_get(int);
3134 extern int timer_sysctl_set(int, uint64_t);
3135
3136 STATIC int
sysctl_timer(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3137 sysctl_timer
3138 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3139 {
3140 int oid = (int)arg1;
3141 uint64_t value = timer_sysctl_get(oid);
3142 uint64_t new_value;
3143 int error;
3144 int changed;
3145
3146 error = sysctl_io_number(req, value, sizeof(value), &new_value, &changed);
3147 if (changed) {
3148 error = timer_sysctl_set(oid, new_value);
3149 }
3150
3151 return error;
3152 }
3153
3154 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, threshold,
3155 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3156 (void *) THRESHOLD, 0, sysctl_timer, "Q", "");
3157 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scan_limit,
3158 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3159 (void *) LONG_TERM_SCAN_LIMIT, 0, sysctl_timer, "Q", "");
3160 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scan_interval,
3161 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3162 (void *) LONG_TERM_SCAN_INTERVAL, 0, sysctl_timer, "Q", "");
3163
3164 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, qlen,
3165 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3166 (void *) QCOUNT, 0, sysctl_timer, "Q", "");
3167 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scan_pauses,
3168 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3169 (void *) LONG_TERM_SCAN_PAUSES, 0, sysctl_timer, "Q", "");
3170
3171 #if DEBUG
3172 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, enqueues,
3173 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3174 (void *) ENQUEUES, 0, sysctl_timer, "Q", "");
3175 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, dequeues,
3176 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3177 (void *) DEQUEUES, 0, sysctl_timer, "Q", "");
3178 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, escalates,
3179 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3180 (void *) ESCALATES, 0, sysctl_timer, "Q", "");
3181 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, scans,
3182 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3183 (void *) SCANS, 0, sysctl_timer, "Q", "");
3184 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, preempts,
3185 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3186 (void *) PREEMPTS, 0, sysctl_timer, "Q", "");
3187 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, latency,
3188 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3189 (void *) LATENCY, 0, sysctl_timer, "Q", "");
3190 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, latency_min,
3191 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3192 (void *) LATENCY_MIN, 0, sysctl_timer, "Q", "");
3193 SYSCTL_PROC(_kern_timer_longterm, OID_AUTO, latency_max,
3194 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3195 (void *) LATENCY_MAX, 0, sysctl_timer, "Q", "");
3196 #endif /* DEBUG */
3197
3198 SYSCTL_PROC(_kern_timer, OID_AUTO, scan_limit,
3199 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3200 (void *) SCAN_LIMIT, 0, sysctl_timer, "Q", "");
3201 SYSCTL_PROC(_kern_timer, OID_AUTO, scan_interval,
3202 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3203 (void *) SCAN_INTERVAL, 0, sysctl_timer, "Q", "");
3204 SYSCTL_PROC(_kern_timer, OID_AUTO, scan_pauses,
3205 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3206 (void *) SCAN_PAUSES, 0, sysctl_timer, "Q", "");
3207 SYSCTL_PROC(_kern_timer, OID_AUTO, scan_postpones,
3208 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3209 (void *) SCAN_POSTPONES, 0, sysctl_timer, "Q", "");
3210
3211 STATIC int
sysctl_usrstack(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3212 sysctl_usrstack
3213 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3214 {
3215 return sysctl_io_number(req, (int)req->p->user_stack, sizeof(int), NULL, NULL);
3216 }
3217
3218 SYSCTL_PROC(_kern, KERN_USRSTACK32, usrstack,
3219 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
3220 0, 0, sysctl_usrstack, "I", "");
3221
3222 STATIC int
sysctl_usrstack64(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3223 sysctl_usrstack64
3224 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3225 {
3226 return sysctl_io_number(req, req->p->user_stack, sizeof(req->p->user_stack), NULL, NULL);
3227 }
3228
3229 SYSCTL_PROC(_kern, KERN_USRSTACK64, usrstack64,
3230 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED,
3231 0, 0, sysctl_usrstack64, "Q", "");
3232
3233 #if CONFIG_COREDUMP
3234
3235 SYSCTL_STRING(_kern, KERN_COREFILE, corefile,
3236 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
3237 corefilename, sizeof(corefilename), "");
3238
3239 SYSCTL_STRING(_kern, OID_AUTO, drivercorefile,
3240 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
3241 drivercorefilename, sizeof(drivercorefilename), "");
3242
3243 STATIC int
sysctl_coredump(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3244 sysctl_coredump
3245 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3246 {
3247 #ifdef SECURE_KERNEL
3248 (void)req;
3249 return ENOTSUP;
3250 #else
3251 int new_value, changed;
3252 int error = sysctl_io_number(req, do_coredump, sizeof(int), &new_value, &changed);
3253 if (changed) {
3254 if ((new_value == 0) || (new_value == 1)) {
3255 do_coredump = new_value;
3256 } else {
3257 error = EINVAL;
3258 }
3259 }
3260 return error;
3261 #endif
3262 }
3263
3264 SYSCTL_PROC(_kern, KERN_COREDUMP, coredump,
3265 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
3266 0, 0, sysctl_coredump, "I", "");
3267
3268 STATIC int
sysctl_suid_coredump(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3269 sysctl_suid_coredump
3270 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3271 {
3272 #ifdef SECURE_KERNEL
3273 (void)req;
3274 return ENOTSUP;
3275 #else
3276 int new_value, changed;
3277 int error = sysctl_io_number(req, sugid_coredump, sizeof(int), &new_value, &changed);
3278 if (changed) {
3279 if ((new_value == 0) || (new_value == 1)) {
3280 sugid_coredump = new_value;
3281 } else {
3282 error = EINVAL;
3283 }
3284 }
3285 return error;
3286 #endif
3287 }
3288
3289 SYSCTL_PROC(_kern, KERN_SUGID_COREDUMP, sugid_coredump,
3290 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
3291 0, 0, sysctl_suid_coredump, "I", "");
3292
3293 #endif /* CONFIG_COREDUMP */
3294
3295 STATIC int
sysctl_delayterm(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3296 sysctl_delayterm
3297 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3298 {
3299 struct proc *p = req->p;
3300 int new_value, changed;
3301 int error = sysctl_io_number(req, (req->p->p_lflag & P_LDELAYTERM)? 1: 0, sizeof(int), &new_value, &changed);
3302 if (changed) {
3303 proc_lock(p);
3304 if (new_value) {
3305 req->p->p_lflag |= P_LDELAYTERM;
3306 } else {
3307 req->p->p_lflag &= ~P_LDELAYTERM;
3308 }
3309 proc_unlock(p);
3310 }
3311 return error;
3312 }
3313
3314 SYSCTL_PROC(_kern, KERN_PROCDELAYTERM, delayterm,
3315 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
3316 0, 0, sysctl_delayterm, "I", "");
3317
3318
3319 STATIC int
sysctl_rage_vnode(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3320 sysctl_rage_vnode
3321 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3322 {
3323 struct proc *p = req->p;
3324 struct uthread *ut;
3325 int new_value, old_value, changed;
3326 int error;
3327
3328 ut = current_uthread();
3329
3330 if (ut->uu_flag & UT_RAGE_VNODES) {
3331 old_value = KERN_RAGE_THREAD;
3332 } else if (p->p_lflag & P_LRAGE_VNODES) {
3333 old_value = KERN_RAGE_PROC;
3334 } else {
3335 old_value = 0;
3336 }
3337
3338 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
3339
3340 if ((error == 0) && (changed != 0)) {
3341 switch (new_value) {
3342 case KERN_RAGE_PROC:
3343 proc_lock(p);
3344 p->p_lflag |= P_LRAGE_VNODES;
3345 proc_unlock(p);
3346 break;
3347 case KERN_UNRAGE_PROC:
3348 proc_lock(p);
3349 p->p_lflag &= ~P_LRAGE_VNODES;
3350 proc_unlock(p);
3351 break;
3352
3353 case KERN_RAGE_THREAD:
3354 ut->uu_flag |= UT_RAGE_VNODES;
3355 break;
3356 case KERN_UNRAGE_THREAD:
3357 ut = current_uthread();
3358 ut->uu_flag &= ~UT_RAGE_VNODES;
3359 break;
3360 }
3361 }
3362 return error;
3363 }
3364
3365 SYSCTL_PROC(_kern, KERN_RAGEVNODE, rage_vnode,
3366 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
3367 0, 0, sysctl_rage_vnode, "I", "");
3368
3369 /* XXX until filecoordinationd fixes a bit of inverted logic. */
3370 STATIC int
sysctl_vfsnspace(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3371 sysctl_vfsnspace
3372 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3373 {
3374 int old_value = 0, new_value, changed;
3375
3376 return sysctl_io_number(req, old_value, sizeof(int), &new_value,
3377 &changed);
3378 }
3379
3380 SYSCTL_PROC(_kern, OID_AUTO, vfsnspace,
3381 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
3382 0, 0, sysctl_vfsnspace, "I", "");
3383
3384 /* XXX move this interface into libproc and remove this sysctl */
3385 STATIC int
sysctl_setthread_cpupercent(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3386 sysctl_setthread_cpupercent
3387 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3388 {
3389 int new_value, old_value;
3390 int error = 0;
3391 kern_return_t kret = KERN_SUCCESS;
3392 uint8_t percent = 0;
3393 int ms_refill = 0;
3394
3395 if (!req->newptr) {
3396 return 0;
3397 }
3398
3399 old_value = 0;
3400
3401 if ((error = sysctl_io_number(req, old_value, sizeof(old_value), &new_value, NULL)) != 0) {
3402 return error;
3403 }
3404
3405 percent = new_value & 0xff; /* low 8 bytes for perent */
3406 ms_refill = (new_value >> 8) & 0xffffff; /* upper 24bytes represent ms refill value */
3407 if (percent > 100) {
3408 return EINVAL;
3409 }
3410
3411 /*
3412 * If the caller is specifying a percentage of 0, this will unset the CPU limit, if present.
3413 */
3414 if ((kret = thread_set_cpulimit(THREAD_CPULIMIT_BLOCK, percent, ms_refill * (int)NSEC_PER_MSEC)) != 0) {
3415 return EIO;
3416 }
3417
3418 return 0;
3419 }
3420
3421 SYSCTL_PROC(_kern, OID_AUTO, setthread_cpupercent,
3422 CTLTYPE_INT | CTLFLAG_WR | CTLFLAG_ANYBODY,
3423 0, 0, sysctl_setthread_cpupercent, "I", "set thread cpu percentage limit");
3424
3425
3426 STATIC int
sysctl_kern_check_openevt(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3427 sysctl_kern_check_openevt
3428 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3429 {
3430 struct proc *p = req->p;
3431 int new_value, old_value, changed;
3432 int error;
3433
3434 if (p->p_flag & P_CHECKOPENEVT) {
3435 old_value = KERN_OPENEVT_PROC;
3436 } else {
3437 old_value = 0;
3438 }
3439
3440 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
3441
3442 if ((error == 0) && (changed != 0)) {
3443 switch (new_value) {
3444 case KERN_OPENEVT_PROC:
3445 OSBitOrAtomic(P_CHECKOPENEVT, &p->p_flag);
3446 break;
3447
3448 case KERN_UNOPENEVT_PROC:
3449 OSBitAndAtomic(~((uint32_t)P_CHECKOPENEVT), &p->p_flag);
3450 break;
3451
3452 default:
3453 error = EINVAL;
3454 }
3455 }
3456 return error;
3457 }
3458
3459 SYSCTL_PROC(_kern, KERN_CHECKOPENEVT, check_openevt, CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED,
3460 0, 0, sysctl_kern_check_openevt, "I", "set the per-process check-open-evt flag");
3461
3462
3463 #if DEVELOPMENT || DEBUG
3464 STATIC int
sysctl_nx(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3465 sysctl_nx
3466 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3467 {
3468 #ifdef SECURE_KERNEL
3469 (void)req;
3470 return ENOTSUP;
3471 #else
3472 int new_value, changed;
3473 int error;
3474
3475 error = sysctl_io_number(req, nx_enabled, sizeof(nx_enabled), &new_value, &changed);
3476 if (error) {
3477 return error;
3478 }
3479
3480 if (changed) {
3481 #if defined(__x86_64__)
3482 /*
3483 * Only allow setting if NX is supported on the chip
3484 */
3485 if (!(cpuid_extfeatures() & CPUID_EXTFEATURE_XD)) {
3486 return ENOTSUP;
3487 }
3488 #endif
3489 nx_enabled = new_value;
3490 }
3491 return error;
3492 #endif /* SECURE_KERNEL */
3493 }
3494 #endif
3495
3496 #if DEVELOPMENT || DEBUG
3497 SYSCTL_PROC(_kern, KERN_NX_PROTECTION, nx,
3498 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
3499 0, 0, sysctl_nx, "I", "");
3500 #endif
3501
3502 STATIC int
sysctl_loadavg(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3503 sysctl_loadavg
3504 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3505 {
3506 if (proc_is64bit(req->p)) {
3507 struct user64_loadavg loadinfo64 = {};
3508 fill_loadavg64(&averunnable, &loadinfo64);
3509 return sysctl_io_opaque(req, &loadinfo64, sizeof(loadinfo64), NULL);
3510 } else {
3511 struct user32_loadavg loadinfo32 = {};
3512 fill_loadavg32(&averunnable, &loadinfo32);
3513 return sysctl_io_opaque(req, &loadinfo32, sizeof(loadinfo32), NULL);
3514 }
3515 }
3516
3517 SYSCTL_PROC(_vm, VM_LOADAVG, loadavg,
3518 CTLTYPE_STRUCT | CTLFLAG_RD | CTLFLAG_LOCKED,
3519 0, 0, sysctl_loadavg, "S,loadavg", "");
3520
3521 /*
3522 * Note: Thread safe; vm_map_lock protects in vm_toggle_entry_reuse()
3523 */
3524 STATIC int
sysctl_vm_toggle_address_reuse(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3525 sysctl_vm_toggle_address_reuse(__unused struct sysctl_oid *oidp, __unused void *arg1,
3526 __unused int arg2, struct sysctl_req *req)
3527 {
3528 int old_value = 0, new_value = 0, error = 0;
3529
3530 if (vm_toggle_entry_reuse( VM_TOGGLE_GETVALUE, &old_value )) {
3531 return error;
3532 }
3533 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, NULL);
3534 if (!error) {
3535 return vm_toggle_entry_reuse(new_value, NULL);
3536 }
3537 return error;
3538 }
3539
3540 SYSCTL_PROC(_debug, OID_AUTO, toggle_address_reuse, CTLFLAG_ANYBODY | CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, sysctl_vm_toggle_address_reuse, "I", "");
3541
3542 #ifdef CONFIG_XNUPOST
3543
3544 extern uint32_t xnupost_get_estimated_testdata_size(void);
3545 extern int xnupost_reset_all_tests(void);
3546
3547 STATIC int
3548 sysctl_handle_xnupost_get_tests SYSCTL_HANDLER_ARGS
3549 {
3550 /* fixup unused arguments warnings */
3551 __unused int _oa2 = arg2;
3552 __unused void * _oa1 = arg1;
3553 __unused struct sysctl_oid * _oidp = oidp;
3554
3555 int error = 0;
3556 user_addr_t oldp = 0;
3557 user_addr_t newp = 0;
3558 uint32_t usedbytes = 0;
3559
3560 oldp = req->oldptr;
3561 newp = req->newptr;
3562
3563 if (newp) {
3564 return ENOTSUP;
3565 }
3566
3567 if ((void *)oldp == NULL) {
3568 /* return estimated size for second call where info can be placed */
3569 req->oldidx = xnupost_get_estimated_testdata_size();
3570 } else {
3571 error = xnupost_export_testdata((void *)oldp, req->oldlen, &usedbytes);
3572 req->oldidx = usedbytes;
3573 }
3574
3575 return error;
3576 }
3577
3578 SYSCTL_PROC(_debug,
3579 OID_AUTO,
3580 xnupost_get_tests,
3581 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_LOCKED,
3582 0,
3583 0,
3584 sysctl_handle_xnupost_get_tests,
3585 "-",
3586 "read xnupost test data in kernel");
3587
3588 STATIC int
3589 sysctl_debug_xnupost_ctl SYSCTL_HANDLER_ARGS
3590 {
3591 /* fixup unused arguments warnings */
3592 __unused int _oa2 = arg2;
3593 __unused void * _oa1 = arg1;
3594 __unused struct sysctl_oid * _oidp = oidp;
3595
3596 #define ARRCOUNT 4
3597 /*
3598 * INPUT: ACTION, PARAM1, PARAM2, PARAM3
3599 * OUTPUT: RESULTCODE, ADDITIONAL DATA
3600 */
3601 int32_t outval[ARRCOUNT] = {0};
3602 int32_t input[ARRCOUNT] = {0};
3603 int32_t out_size = sizeof(outval);
3604 int32_t in_size = sizeof(input);
3605 int error = 0;
3606
3607 /* if this is NULL call to find out size, send out size info */
3608 if (!req->newptr) {
3609 goto out;
3610 }
3611
3612 /* pull in provided value from userspace */
3613 error = SYSCTL_IN(req, &input[0], in_size);
3614 if (error) {
3615 return error;
3616 }
3617
3618 if (input[0] == XTCTL_RESET_TESTDATA) {
3619 outval[0] = xnupost_reset_all_tests();
3620 goto out;
3621 }
3622
3623 out:
3624 error = SYSCTL_OUT(req, &outval[0], out_size);
3625 return error;
3626 }
3627
3628 SYSCTL_PROC(_debug,
3629 OID_AUTO,
3630 xnupost_testctl,
3631 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_OPAQUE | CTLFLAG_RW | CTLFLAG_LOCKED,
3632 0,
3633 0,
3634 sysctl_debug_xnupost_ctl,
3635 "I",
3636 "xnupost control for kernel testing");
3637
3638 extern void test_oslog_handleOSLogCtl(int32_t * in, int32_t * out, int32_t arraycount);
3639
3640 STATIC int
sysctl_debug_test_oslog_ctl(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3641 sysctl_debug_test_oslog_ctl(__unused struct sysctl_oid * oidp, __unused void * arg1, __unused int arg2, struct sysctl_req * req)
3642 {
3643 #define ARRCOUNT 4
3644 int32_t outval[ARRCOUNT] = {0};
3645 int32_t input[ARRCOUNT] = {0};
3646 int32_t size_outval = sizeof(outval);
3647 int32_t size_inval = sizeof(input);
3648 int32_t error;
3649
3650 /* if this is NULL call to find out size, send out size info */
3651 if (!req->newptr) {
3652 error = SYSCTL_OUT(req, &outval[0], size_outval);
3653 return error;
3654 }
3655
3656 /* pull in provided value from userspace */
3657 error = SYSCTL_IN(req, &input[0], size_inval);
3658 if (error) {
3659 return error;
3660 }
3661
3662 test_oslog_handleOSLogCtl(input, outval, ARRCOUNT);
3663
3664 error = SYSCTL_OUT(req, &outval[0], size_outval);
3665
3666 return error;
3667 }
3668
3669 SYSCTL_PROC(_debug,
3670 OID_AUTO,
3671 test_OSLogCtl,
3672 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_OPAQUE | CTLFLAG_RW | CTLFLAG_LOCKED,
3673 0,
3674 0,
3675 sysctl_debug_test_oslog_ctl,
3676 "I",
3677 "testing oslog in kernel");
3678
3679 #include <mach/task.h>
3680 #include <mach/semaphore.h>
3681
3682 static LCK_GRP_DECLARE(sysctl_debug_test_stackshot_owner_grp, "test-stackshot-owner-grp");
3683 static LCK_MTX_DECLARE(sysctl_debug_test_stackshot_owner_init_mtx,
3684 &sysctl_debug_test_stackshot_owner_grp);
3685
3686 /* This is a sysctl for testing collection of owner info on a lock in kernel space. A multi-threaded
3687 * test from userland sets this sysctl in such a way that a thread blocks in kernel mode, and a
3688 * stackshot is taken to see if the owner of the lock can be identified.
3689 *
3690 * We can't return to userland with a kernel lock held, so be sure to unlock before we leave.
3691 * the semaphores allow us to artificially create cases where the lock is being held and the
3692 * thread is hanging / taking a long time to do something. */
3693
3694 volatile char sysctl_debug_test_stackshot_mtx_inited = 0;
3695 semaphore_t sysctl_debug_test_stackshot_mutex_sem;
3696 lck_mtx_t sysctl_debug_test_stackshot_owner_lck;
3697
3698 #define SYSCTL_DEBUG_MTX_ACQUIRE_WAIT 1
3699 #define SYSCTL_DEBUG_MTX_ACQUIRE_NOWAIT 2
3700 #define SYSCTL_DEBUG_MTX_SIGNAL 3
3701 #define SYSCTL_DEBUG_MTX_TEARDOWN 4
3702
3703 STATIC int
sysctl_debug_test_stackshot_mutex_owner(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3704 sysctl_debug_test_stackshot_mutex_owner(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3705 {
3706 long long option = -1;
3707 /* if the user tries to read the sysctl, we tell them what the address of the lock is (to test against stackshot's output) */
3708 long long mtx_unslid_addr = (long long)VM_KERNEL_UNSLIDE_OR_PERM(&sysctl_debug_test_stackshot_owner_lck);
3709 int error = sysctl_io_number(req, mtx_unslid_addr, sizeof(long long), (void*)&option, NULL);
3710
3711 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);
3712 if (!sysctl_debug_test_stackshot_mtx_inited) {
3713 lck_mtx_init(&sysctl_debug_test_stackshot_owner_lck,
3714 &sysctl_debug_test_stackshot_owner_grp,
3715 LCK_ATTR_NULL);
3716 semaphore_create(kernel_task,
3717 &sysctl_debug_test_stackshot_mutex_sem,
3718 SYNC_POLICY_FIFO, 0);
3719 sysctl_debug_test_stackshot_mtx_inited = 1;
3720 }
3721 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);
3722
3723 if (!error) {
3724 switch (option) {
3725 case SYSCTL_DEBUG_MTX_ACQUIRE_NOWAIT:
3726 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_lck);
3727 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_lck);
3728 break;
3729 case SYSCTL_DEBUG_MTX_ACQUIRE_WAIT:
3730 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_lck);
3731 semaphore_wait(sysctl_debug_test_stackshot_mutex_sem);
3732 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_lck);
3733 break;
3734 case SYSCTL_DEBUG_MTX_SIGNAL:
3735 semaphore_signal(sysctl_debug_test_stackshot_mutex_sem);
3736 break;
3737 case SYSCTL_DEBUG_MTX_TEARDOWN:
3738 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);
3739
3740 lck_mtx_destroy(&sysctl_debug_test_stackshot_owner_lck,
3741 &sysctl_debug_test_stackshot_owner_grp);
3742 semaphore_destroy(kernel_task,
3743 sysctl_debug_test_stackshot_mutex_sem);
3744 sysctl_debug_test_stackshot_mtx_inited = 0;
3745
3746 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);
3747 break;
3748 case -1: /* user just wanted to read the value, so do nothing */
3749 break;
3750 default:
3751 error = EINVAL;
3752 break;
3753 }
3754 }
3755 return error;
3756 }
3757
3758 /* we can't return to userland with a kernel rwlock held, so be sure to unlock before we leave.
3759 * the semaphores allow us to artificially create cases where the lock is being held and the
3760 * thread is hanging / taking a long time to do something. */
3761
3762 SYSCTL_PROC(_debug,
3763 OID_AUTO,
3764 test_MutexOwnerCtl,
3765 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3766 0,
3767 0,
3768 sysctl_debug_test_stackshot_mutex_owner,
3769 "-",
3770 "Testing mutex owner in kernel");
3771
3772 volatile char sysctl_debug_test_stackshot_rwlck_inited = 0;
3773 lck_rw_t sysctl_debug_test_stackshot_owner_rwlck;
3774 semaphore_t sysctl_debug_test_stackshot_rwlck_sem;
3775
3776 #define SYSCTL_DEBUG_KRWLCK_RACQUIRE_NOWAIT 1
3777 #define SYSCTL_DEBUG_KRWLCK_RACQUIRE_WAIT 2
3778 #define SYSCTL_DEBUG_KRWLCK_WACQUIRE_NOWAIT 3
3779 #define SYSCTL_DEBUG_KRWLCK_WACQUIRE_WAIT 4
3780 #define SYSCTL_DEBUG_KRWLCK_SIGNAL 5
3781 #define SYSCTL_DEBUG_KRWLCK_TEARDOWN 6
3782
3783 STATIC int
sysctl_debug_test_stackshot_rwlck_owner(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3784 sysctl_debug_test_stackshot_rwlck_owner(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3785 {
3786 long long option = -1;
3787 /* if the user tries to read the sysctl, we tell them what the address of the lock is
3788 * (to test against stackshot's output) */
3789 long long rwlck_unslid_addr = (long long)VM_KERNEL_UNSLIDE_OR_PERM(&sysctl_debug_test_stackshot_owner_rwlck);
3790 int error = sysctl_io_number(req, rwlck_unslid_addr, sizeof(long long), (void*)&option, NULL);
3791
3792 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);
3793 if (!sysctl_debug_test_stackshot_rwlck_inited) {
3794 lck_rw_init(&sysctl_debug_test_stackshot_owner_rwlck,
3795 &sysctl_debug_test_stackshot_owner_grp,
3796 LCK_ATTR_NULL);
3797 semaphore_create(kernel_task,
3798 &sysctl_debug_test_stackshot_rwlck_sem,
3799 SYNC_POLICY_FIFO,
3800 0);
3801 sysctl_debug_test_stackshot_rwlck_inited = 1;
3802 }
3803 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);
3804
3805 if (!error) {
3806 switch (option) {
3807 case SYSCTL_DEBUG_KRWLCK_RACQUIRE_NOWAIT:
3808 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3809 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3810 break;
3811 case SYSCTL_DEBUG_KRWLCK_RACQUIRE_WAIT:
3812 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3813 semaphore_wait(sysctl_debug_test_stackshot_rwlck_sem);
3814 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_SHARED);
3815 break;
3816 case SYSCTL_DEBUG_KRWLCK_WACQUIRE_NOWAIT:
3817 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3818 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3819 break;
3820 case SYSCTL_DEBUG_KRWLCK_WACQUIRE_WAIT:
3821 lck_rw_lock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3822 semaphore_wait(sysctl_debug_test_stackshot_rwlck_sem);
3823 lck_rw_unlock(&sysctl_debug_test_stackshot_owner_rwlck, LCK_RW_TYPE_EXCLUSIVE);
3824 break;
3825 case SYSCTL_DEBUG_KRWLCK_SIGNAL:
3826 semaphore_signal(sysctl_debug_test_stackshot_rwlck_sem);
3827 break;
3828 case SYSCTL_DEBUG_KRWLCK_TEARDOWN:
3829 lck_mtx_lock(&sysctl_debug_test_stackshot_owner_init_mtx);
3830
3831 lck_rw_destroy(&sysctl_debug_test_stackshot_owner_rwlck,
3832 &sysctl_debug_test_stackshot_owner_grp);
3833 semaphore_destroy(kernel_task,
3834 sysctl_debug_test_stackshot_rwlck_sem);
3835 sysctl_debug_test_stackshot_rwlck_inited = 0;
3836
3837 lck_mtx_unlock(&sysctl_debug_test_stackshot_owner_init_mtx);
3838 break;
3839 case -1: /* user just wanted to read the value, so do nothing */
3840 break;
3841 default:
3842 error = EINVAL;
3843 break;
3844 }
3845 }
3846 return error;
3847 }
3848
3849
3850 SYSCTL_PROC(_debug,
3851 OID_AUTO,
3852 test_RWLockOwnerCtl,
3853 CTLFLAG_MASKED | CTLFLAG_ANYBODY | CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
3854 0,
3855 0,
3856 sysctl_debug_test_stackshot_rwlck_owner,
3857 "-",
3858 "Testing rwlock owner in kernel");
3859 #endif /* !CONFIG_XNUPOST */
3860
3861 STATIC int
sysctl_swapusage(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)3862 sysctl_swapusage
3863 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
3864 {
3865 int error;
3866 uint64_t swap_total;
3867 uint64_t swap_avail;
3868 vm_size_t swap_pagesize;
3869 boolean_t swap_encrypted;
3870 struct xsw_usage xsu = {};
3871
3872 error = macx_swapinfo(&swap_total,
3873 &swap_avail,
3874 &swap_pagesize,
3875 &swap_encrypted);
3876 if (error) {
3877 return error;
3878 }
3879
3880 xsu.xsu_total = swap_total;
3881 xsu.xsu_avail = swap_avail;
3882 xsu.xsu_used = swap_total - swap_avail;
3883 xsu.xsu_pagesize = (u_int32_t)MIN(swap_pagesize, UINT32_MAX);
3884 xsu.xsu_encrypted = swap_encrypted;
3885 return sysctl_io_opaque(req, &xsu, sizeof(xsu), NULL);
3886 }
3887
3888
3889
3890 SYSCTL_PROC(_vm, VM_SWAPUSAGE, swapusage,
3891 CTLTYPE_STRUCT | CTLFLAG_RD | CTLFLAG_LOCKED,
3892 0, 0, sysctl_swapusage, "S,xsw_usage", "");
3893
3894 #if DEVELOPMENT || DEBUG
3895 extern int vm_num_swap_files_config;
3896 extern int vm_num_swap_files;
3897 extern lck_mtx_t vm_swap_data_lock;
3898 #define VM_MAX_SWAP_FILE_NUM 100
3899
3900 static int
3901 sysctl_vm_config_num_swap_files SYSCTL_HANDLER_ARGS
3902 {
3903 #pragma unused(arg1, arg2)
3904 int error = 0, val = vm_num_swap_files_config;
3905
3906 error = sysctl_handle_int(oidp, &val, 0, req);
3907 if (error || !req->newptr) {
3908 goto out;
3909 }
3910
3911 if (!VM_CONFIG_SWAP_IS_ACTIVE && !VM_CONFIG_FREEZER_SWAP_IS_ACTIVE) {
3912 printf("Swap is disabled\n");
3913 error = EINVAL;
3914 goto out;
3915 }
3916
3917 lck_mtx_lock(&vm_swap_data_lock);
3918
3919 if (val < vm_num_swap_files) {
3920 printf("Cannot configure fewer swap files than already exist.\n");
3921 error = EINVAL;
3922 lck_mtx_unlock(&vm_swap_data_lock);
3923 goto out;
3924 }
3925
3926 if (val > VM_MAX_SWAP_FILE_NUM) {
3927 printf("Capping number of swap files to upper bound.\n");
3928 val = VM_MAX_SWAP_FILE_NUM;
3929 }
3930
3931 vm_num_swap_files_config = val;
3932 lck_mtx_unlock(&vm_swap_data_lock);
3933 out:
3934
3935 return 0;
3936 }
3937
3938 SYSCTL_PROC(_debug, OID_AUTO, num_swap_files_configured, CTLFLAG_ANYBODY | CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, sysctl_vm_config_num_swap_files, "I", "");
3939 #endif /* DEVELOPMENT || DEBUG */
3940
3941 /* this kernel does NOT implement shared_region_make_private_np() */
3942 SYSCTL_INT(_kern, KERN_SHREG_PRIVATIZABLE, shreg_private,
3943 CTLFLAG_RD | CTLFLAG_LOCKED,
3944 (int *)NULL, 0, "");
3945
3946 STATIC int
fetch_process_cputype(proc_t cur_proc,int * name,u_int namelen,cpu_type_t * cputype)3947 fetch_process_cputype(
3948 proc_t cur_proc,
3949 int *name,
3950 u_int namelen,
3951 cpu_type_t *cputype)
3952 {
3953 proc_t p = PROC_NULL;
3954 int refheld = 0;
3955 cpu_type_t ret = 0;
3956 int error = 0;
3957
3958 if (namelen == 0) {
3959 p = cur_proc;
3960 } else if (namelen == 1) {
3961 p = proc_find(name[0]);
3962 if (p == NULL) {
3963 return EINVAL;
3964 }
3965 refheld = 1;
3966 } else {
3967 error = EINVAL;
3968 goto out;
3969 }
3970
3971 ret = cpu_type() & ~CPU_ARCH_MASK;
3972 if (IS_64BIT_PROCESS(p)) {
3973 ret |= CPU_ARCH_ABI64;
3974 }
3975
3976 *cputype = ret;
3977
3978 if (refheld != 0) {
3979 proc_rele(p);
3980 }
3981 out:
3982 return error;
3983 }
3984
3985
3986 STATIC int
sysctl_sysctl_native(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)3987 sysctl_sysctl_native(__unused struct sysctl_oid *oidp, void *arg1, int arg2,
3988 struct sysctl_req *req)
3989 {
3990 int error;
3991 cpu_type_t proc_cputype = 0;
3992 if ((error = fetch_process_cputype(req->p, (int *)arg1, arg2, &proc_cputype)) != 0) {
3993 return error;
3994 }
3995 int res = 1;
3996 if ((proc_cputype & ~CPU_ARCH_MASK) != (cpu_type() & ~CPU_ARCH_MASK)) {
3997 res = 0;
3998 }
3999 return SYSCTL_OUT(req, &res, sizeof(res));
4000 }
4001 SYSCTL_PROC(_sysctl, OID_AUTO, proc_native, CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, sysctl_sysctl_native, "I", "proc_native");
4002
4003 STATIC int
sysctl_sysctl_cputype(__unused struct sysctl_oid * oidp,void * arg1,int arg2,struct sysctl_req * req)4004 sysctl_sysctl_cputype(__unused struct sysctl_oid *oidp, void *arg1, int arg2,
4005 struct sysctl_req *req)
4006 {
4007 int error;
4008 cpu_type_t proc_cputype = 0;
4009 if ((error = fetch_process_cputype(req->p, (int *)arg1, arg2, &proc_cputype)) != 0) {
4010 return error;
4011 }
4012 return SYSCTL_OUT(req, &proc_cputype, sizeof(proc_cputype));
4013 }
4014 SYSCTL_PROC(_sysctl, OID_AUTO, proc_cputype, CTLTYPE_NODE | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, sysctl_sysctl_cputype, "I", "proc_cputype");
4015
4016 STATIC int
sysctl_safeboot(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4017 sysctl_safeboot
4018 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4019 {
4020 return sysctl_io_number(req, boothowto & RB_SAFEBOOT ? 1 : 0, sizeof(int), NULL, NULL);
4021 }
4022
4023 SYSCTL_PROC(_kern, KERN_SAFEBOOT, safeboot,
4024 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4025 0, 0, sysctl_safeboot, "I", "");
4026
4027 STATIC int
sysctl_singleuser(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4028 sysctl_singleuser
4029 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4030 {
4031 return sysctl_io_number(req, boothowto & RB_SINGLE ? 1 : 0, sizeof(int), NULL, NULL);
4032 }
4033
4034 SYSCTL_PROC(_kern, OID_AUTO, singleuser,
4035 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4036 0, 0, sysctl_singleuser, "I", "");
4037
4038 STATIC int
sysctl_minimalboot(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4039 sysctl_minimalboot
4040 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4041 {
4042 return sysctl_io_number(req, minimalboot, sizeof(int), NULL, NULL);
4043 }
4044
4045 SYSCTL_PROC(_kern, OID_AUTO, minimalboot,
4046 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4047 0, 0, sysctl_minimalboot, "I", "");
4048
4049 /*
4050 * Controls for debugging affinity sets - see osfmk/kern/affinity.c
4051 */
4052 extern boolean_t affinity_sets_enabled;
4053 extern int affinity_sets_mapping;
4054
4055 SYSCTL_INT(_kern, OID_AUTO, affinity_sets_enabled,
4056 CTLFLAG_RW | CTLFLAG_LOCKED, (int *) &affinity_sets_enabled, 0, "hinting enabled");
4057 SYSCTL_INT(_kern, OID_AUTO, affinity_sets_mapping,
4058 CTLFLAG_RW | CTLFLAG_LOCKED, &affinity_sets_mapping, 0, "mapping policy");
4059
4060 /*
4061 * Boolean indicating if KASLR is active.
4062 */
4063 STATIC int
sysctl_slide(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4064 sysctl_slide
4065 (__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4066 {
4067 uint32_t slide;
4068
4069 slide = vm_kernel_slide ? 1 : 0;
4070
4071 return sysctl_io_number( req, slide, sizeof(int), NULL, NULL);
4072 }
4073
4074 SYSCTL_PROC(_kern, OID_AUTO, slide,
4075 CTLTYPE_INT | CTLFLAG_RD | CTLFLAG_LOCKED,
4076 0, 0, sysctl_slide, "I", "");
4077
4078 #if DEBUG || DEVELOPMENT
4079 #if defined(__arm64__)
4080 extern vm_offset_t segTEXTEXECB;
4081
4082 static int
4083 sysctl_kernel_text_exec_base_slide SYSCTL_HANDLER_ARGS
4084 {
4085 #pragma unused(arg1, arg2, oidp)
4086 unsigned long slide = 0;
4087 kc_format_t kc_format;
4088
4089 PE_get_primary_kc_format(&kc_format);
4090
4091 if (kc_format == KCFormatFileset) {
4092 void *kch = PE_get_kc_header(KCKindPrimary);
4093 slide = (unsigned long)segTEXTEXECB - (unsigned long)kch + vm_kernel_slide;
4094 }
4095 return SYSCTL_OUT(req, &slide, sizeof(slide));
4096 }
4097
4098 SYSCTL_QUAD(_kern, OID_AUTO, kernel_slide, CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED, &vm_kernel_slide, "");
4099 SYSCTL_QUAD(_kern, OID_AUTO, kernel_text_exec_base, CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED, &segTEXTEXECB, "");
4100 SYSCTL_PROC(_kern, OID_AUTO, kernel_text_exec_base_slide, CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, sysctl_kernel_text_exec_base_slide, "Q", "");
4101 #endif /* defined(__arm64__) */
4102
4103 /* User address of the PFZ */
4104 extern user32_addr_t commpage_text32_location;
4105 extern user64_addr_t commpage_text64_location;
4106
4107 STATIC int
4108 sysctl_pfz_start SYSCTL_HANDLER_ARGS
4109 {
4110 #pragma unused(oidp, arg1, arg2)
4111
4112 #ifdef __LP64__
4113 return sysctl_io_number(req, commpage_text64_location, sizeof(user64_addr_t), NULL, NULL);
4114 #else
4115 return sysctl_io_number(req, commpage_text32_location, sizeof(user32_addr_t), NULL, NULL);
4116 #endif
4117 }
4118
4119 SYSCTL_PROC(_kern, OID_AUTO, pfz,
4120 CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_MASKED,
4121 0, 0, sysctl_pfz_start, "I", "");
4122 #endif
4123
4124
4125 /*
4126 * Limit on total memory users can wire.
4127 *
4128 * vm_global_user_wire_limit - system wide limit on wired memory from all processes combined.
4129 *
4130 * vm_per_task_user_wire_limit - per address space limit on wired memory. This puts a cap on the process's rlimit value.
4131 *
4132 * These values are initialized to reasonable defaults at boot time based on the available physical memory in
4133 * kmem_init().
4134 *
4135 * All values are in bytes.
4136 */
4137
4138 vm_map_size_t vm_global_user_wire_limit;
4139 vm_map_size_t vm_per_task_user_wire_limit;
4140 extern uint64_t max_mem_actual, max_mem;
4141
4142 uint64_t vm_add_wire_count_over_global_limit;
4143 uint64_t vm_add_wire_count_over_user_limit;
4144 /*
4145 * We used to have a global in the kernel called vm_global_no_user_wire_limit which was the inverse
4146 * of vm_global_user_wire_limit. But maintaining both of those is silly, and vm_global_user_wire_limit is the
4147 * real limit.
4148 * This function is for backwards compatibility with userspace
4149 * since we exposed the old global via a sysctl.
4150 */
4151 STATIC int
sysctl_global_no_user_wire_amount(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4152 sysctl_global_no_user_wire_amount(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4153 {
4154 vm_map_size_t old_value;
4155 vm_map_size_t new_value;
4156 int changed;
4157 int error;
4158 uint64_t config_memsize = max_mem;
4159 #if defined(XNU_TARGET_OS_OSX)
4160 config_memsize = max_mem_actual;
4161 #endif /* defined(XNU_TARGET_OS_OSX) */
4162
4163 old_value = (vm_map_size_t)(config_memsize - vm_global_user_wire_limit);
4164 error = sysctl_io_number(req, old_value, sizeof(vm_map_size_t), &new_value, &changed);
4165 if (changed) {
4166 if ((uint64_t)new_value > config_memsize) {
4167 error = EINVAL;
4168 } else {
4169 vm_global_user_wire_limit = (vm_map_size_t)(config_memsize - new_value);
4170 }
4171 }
4172 return error;
4173 }
4174 /*
4175 * There needs to be a more automatic/elegant way to do this
4176 */
4177 SYSCTL_QUAD(_vm, OID_AUTO, global_user_wire_limit, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_global_user_wire_limit, "");
4178 SYSCTL_QUAD(_vm, OID_AUTO, user_wire_limit, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_per_task_user_wire_limit, "");
4179 SYSCTL_PROC(_vm, OID_AUTO, global_no_user_wire_amount, CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED, 0, 0, &sysctl_global_no_user_wire_amount, "Q", "");
4180
4181 /*
4182 * Relaxed atomic RW of a 64bit value via sysctl.
4183 */
4184 STATIC int
sysctl_r_64bit_atomic(uint64_t * ptr,struct sysctl_req * req)4185 sysctl_r_64bit_atomic(uint64_t *ptr, struct sysctl_req *req)
4186 {
4187 uint64_t old_value;
4188 uint64_t new_value;
4189 int error;
4190
4191 old_value = os_atomic_load_wide(ptr, relaxed);
4192 error = sysctl_io_number(req, old_value, sizeof(vm_map_size_t), &new_value, NULL);
4193 return error;
4194 }
4195 STATIC int
sysctl_add_wire_count_over_global_limit(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4196 sysctl_add_wire_count_over_global_limit(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4197 {
4198 return sysctl_r_64bit_atomic(&vm_add_wire_count_over_global_limit, req);
4199 }
4200 STATIC int
sysctl_add_wire_count_over_user_limit(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4201 sysctl_add_wire_count_over_user_limit(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4202 {
4203 return sysctl_r_64bit_atomic(&vm_add_wire_count_over_user_limit, req);
4204 }
4205
4206 SYSCTL_PROC(_vm, OID_AUTO, add_wire_count_over_global_limit, CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, &sysctl_add_wire_count_over_global_limit, "Q", "");
4207 SYSCTL_PROC(_vm, OID_AUTO, add_wire_count_over_user_limit, CTLTYPE_QUAD | CTLFLAG_RD | CTLFLAG_LOCKED, 0, 0, &sysctl_add_wire_count_over_user_limit, "Q", "");
4208
4209 #if DEVELOPMENT || DEBUG
4210 /* These sysctls are used to test the wired limit. */
4211 extern unsigned int vm_page_wire_count;
4212 extern uint32_t vm_lopage_free_count;
4213 SYSCTL_INT(_vm, OID_AUTO, page_wire_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_wire_count, 0, "");
4214 SYSCTL_INT(_vm, OID_AUTO, lopage_free_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_lopage_free_count, 0, "");
4215
4216 /*
4217 * Setting the per task variable exclude_physfootprint_ledger to 1 will allow the calling task to exclude memory entries that are
4218 * tagged by VM_LEDGER_TAG_DEFAULT and flagged by VM_LEDGER_FLAG_EXCLUDE_FOOTPRINT_DEBUG from its phys_footprint ledger.
4219 */
4220
4221 STATIC int
sysctl_rw_task_no_footprint_for_debug(struct sysctl_oid * oidp __unused,void * arg1 __unused,int arg2 __unused,struct sysctl_req * req)4222 sysctl_rw_task_no_footprint_for_debug(struct sysctl_oid *oidp __unused, void *arg1 __unused, int arg2 __unused, struct sysctl_req *req)
4223 {
4224 int error;
4225 int value;
4226 proc_t p = current_proc();
4227
4228 if (req->newptr) {
4229 // Write request
4230 error = SYSCTL_IN(req, &value, sizeof(value));
4231 if (!error) {
4232 if (value == 1) {
4233 task_set_no_footprint_for_debug(proc_task(p), TRUE);
4234 } else if (value == 0) {
4235 task_set_no_footprint_for_debug(proc_task(p), FALSE);
4236 } else {
4237 error = EINVAL;
4238 }
4239 }
4240 } else {
4241 // Read request
4242 value = task_get_no_footprint_for_debug(proc_task(p));
4243 error = SYSCTL_OUT(req, &value, sizeof(value));
4244 }
4245 return error;
4246 }
4247
4248 SYSCTL_PROC(_vm, OID_AUTO, task_no_footprint_for_debug,
4249 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY,
4250 0, 0, &sysctl_rw_task_no_footprint_for_debug, "I", "Allow debug memory to be excluded from this task's memory footprint (debug only)");
4251
4252 #endif /* DEVELOPMENT || DEBUG */
4253
4254
4255 extern int vm_map_copy_overwrite_aligned_src_not_internal;
4256 extern int vm_map_copy_overwrite_aligned_src_not_symmetric;
4257 extern int vm_map_copy_overwrite_aligned_src_large;
4258 SYSCTL_INT(_vm, OID_AUTO, vm_copy_src_not_internal, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_map_copy_overwrite_aligned_src_not_internal, 0, "");
4259 SYSCTL_INT(_vm, OID_AUTO, vm_copy_src_not_symmetric, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_map_copy_overwrite_aligned_src_not_symmetric, 0, "");
4260 SYSCTL_INT(_vm, OID_AUTO, vm_copy_src_large, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_map_copy_overwrite_aligned_src_large, 0, "");
4261
4262
4263 extern uint32_t vm_page_external_count;
4264
4265 SYSCTL_INT(_vm, OID_AUTO, vm_page_external_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_external_count, 0, "");
4266
4267 SYSCTL_INT(_vm, OID_AUTO, vm_page_filecache_min, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_filecache_min, 0, "");
4268 SYSCTL_INT(_vm, OID_AUTO, vm_page_xpmapped_min, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_xpmapped_min, 0, "");
4269
4270 #if DEVELOPMENT || DEBUG
4271 SYSCTL_INT(_vm, OID_AUTO, vm_page_filecache_min_divisor, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_filecache_min_divisor, 0, "");
4272 SYSCTL_INT(_vm, OID_AUTO, vm_page_xpmapped_min_divisor, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_state.vm_page_xpmapped_min_divisor, 0, "");
4273 extern boolean_t vps_yield_for_pgqlockwaiters;
4274 SYSCTL_INT(_vm, OID_AUTO, vm_pageoutscan_yields_for_pageQlockwaiters, CTLFLAG_RW | CTLFLAG_LOCKED, &vps_yield_for_pgqlockwaiters, 0, "");
4275 #endif
4276
4277 extern int vm_compressor_mode;
4278 extern int vm_compressor_is_active;
4279 extern int vm_compressor_available;
4280 extern uint32_t c_seg_bufsize;
4281 extern uint64_t compressor_pool_size;
4282 extern uint32_t vm_ripe_target_age;
4283 extern uint32_t swapout_target_age;
4284 extern int64_t compressor_bytes_used;
4285 extern int64_t c_segment_input_bytes;
4286 extern int64_t c_segment_compressed_bytes;
4287 extern uint32_t compressor_eval_period_in_msecs;
4288 extern uint32_t compressor_sample_min_in_msecs;
4289 extern uint32_t compressor_sample_max_in_msecs;
4290 extern uint32_t compressor_thrashing_threshold_per_10msecs;
4291 extern uint32_t compressor_thrashing_min_per_10msecs;
4292 extern uint32_t vm_compressor_time_thread;
4293
4294 #if DEVELOPMENT || DEBUG
4295 extern uint32_t vm_compressor_minorcompact_threshold_divisor;
4296 extern uint32_t vm_compressor_majorcompact_threshold_divisor;
4297 extern uint32_t vm_compressor_unthrottle_threshold_divisor;
4298 extern uint32_t vm_compressor_catchup_threshold_divisor;
4299
4300 extern uint32_t vm_compressor_minorcompact_threshold_divisor_overridden;
4301 extern uint32_t vm_compressor_majorcompact_threshold_divisor_overridden;
4302 extern uint32_t vm_compressor_unthrottle_threshold_divisor_overridden;
4303 extern uint32_t vm_compressor_catchup_threshold_divisor_overridden;
4304
4305 extern vmct_stats_t vmct_stats;
4306
4307
4308 STATIC int
sysctl_minorcompact_threshold_divisor(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4309 sysctl_minorcompact_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4310 {
4311 int new_value, changed;
4312 int error = sysctl_io_number(req, vm_compressor_minorcompact_threshold_divisor, sizeof(int), &new_value, &changed);
4313
4314 if (changed) {
4315 vm_compressor_minorcompact_threshold_divisor = new_value;
4316 vm_compressor_minorcompact_threshold_divisor_overridden = 1;
4317 }
4318 return error;
4319 }
4320
4321 SYSCTL_PROC(_vm, OID_AUTO, compressor_minorcompact_threshold_divisor,
4322 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4323 0, 0, sysctl_minorcompact_threshold_divisor, "I", "");
4324
4325
4326 STATIC int
sysctl_majorcompact_threshold_divisor(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4327 sysctl_majorcompact_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4328 {
4329 int new_value, changed;
4330 int error = sysctl_io_number(req, vm_compressor_majorcompact_threshold_divisor, sizeof(int), &new_value, &changed);
4331
4332 if (changed) {
4333 vm_compressor_majorcompact_threshold_divisor = new_value;
4334 vm_compressor_majorcompact_threshold_divisor_overridden = 1;
4335 }
4336 return error;
4337 }
4338
4339 SYSCTL_PROC(_vm, OID_AUTO, compressor_majorcompact_threshold_divisor,
4340 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4341 0, 0, sysctl_majorcompact_threshold_divisor, "I", "");
4342
4343
4344 STATIC int
sysctl_unthrottle_threshold_divisor(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4345 sysctl_unthrottle_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4346 {
4347 int new_value, changed;
4348 int error = sysctl_io_number(req, vm_compressor_unthrottle_threshold_divisor, sizeof(int), &new_value, &changed);
4349
4350 if (changed) {
4351 vm_compressor_unthrottle_threshold_divisor = new_value;
4352 vm_compressor_unthrottle_threshold_divisor_overridden = 1;
4353 }
4354 return error;
4355 }
4356
4357 SYSCTL_PROC(_vm, OID_AUTO, compressor_unthrottle_threshold_divisor,
4358 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4359 0, 0, sysctl_unthrottle_threshold_divisor, "I", "");
4360
4361
4362 STATIC int
sysctl_catchup_threshold_divisor(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4363 sysctl_catchup_threshold_divisor(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4364 {
4365 int new_value, changed;
4366 int error = sysctl_io_number(req, vm_compressor_catchup_threshold_divisor, sizeof(int), &new_value, &changed);
4367
4368 if (changed) {
4369 vm_compressor_catchup_threshold_divisor = new_value;
4370 vm_compressor_catchup_threshold_divisor_overridden = 1;
4371 }
4372 return error;
4373 }
4374
4375 SYSCTL_PROC(_vm, OID_AUTO, compressor_catchup_threshold_divisor,
4376 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4377 0, 0, sysctl_catchup_threshold_divisor, "I", "");
4378 #endif
4379
4380
4381 SYSCTL_QUAD(_vm, OID_AUTO, compressor_input_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &c_segment_input_bytes, "");
4382 SYSCTL_QUAD(_vm, OID_AUTO, compressor_compressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &c_segment_compressed_bytes, "");
4383 SYSCTL_QUAD(_vm, OID_AUTO, compressor_bytes_used, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_bytes_used, "");
4384
4385 SYSCTL_INT(_vm, OID_AUTO, compressor_mode, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_mode, 0, "");
4386 SYSCTL_INT(_vm, OID_AUTO, compressor_is_active, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_is_active, 0, "");
4387 SYSCTL_INT(_vm, OID_AUTO, compressor_swapout_target_age, CTLFLAG_RD | CTLFLAG_LOCKED, &swapout_target_age, 0, "");
4388 SYSCTL_INT(_vm, OID_AUTO, compressor_available, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_available, 0, "");
4389 SYSCTL_INT(_vm, OID_AUTO, compressor_segment_buffer_size, CTLFLAG_RD | CTLFLAG_LOCKED, &c_seg_bufsize, 0, "");
4390 SYSCTL_QUAD(_vm, OID_AUTO, compressor_pool_size, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_pool_size, "");
4391
4392 extern int min_csegs_per_major_compaction;
4393 SYSCTL_INT(_vm, OID_AUTO, compressor_min_csegs_per_major_compaction, CTLFLAG_RW | CTLFLAG_LOCKED, &min_csegs_per_major_compaction, 0, "");
4394
4395 SYSCTL_INT(_vm, OID_AUTO, vm_ripe_target_age_in_secs, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_ripe_target_age, 0, "");
4396
4397 SYSCTL_INT(_vm, OID_AUTO, compressor_eval_period_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_eval_period_in_msecs, 0, "");
4398 SYSCTL_INT(_vm, OID_AUTO, compressor_sample_min_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_sample_min_in_msecs, 0, "");
4399 SYSCTL_INT(_vm, OID_AUTO, compressor_sample_max_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_sample_max_in_msecs, 0, "");
4400 SYSCTL_INT(_vm, OID_AUTO, compressor_thrashing_threshold_per_10msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_thrashing_threshold_per_10msecs, 0, "");
4401 SYSCTL_INT(_vm, OID_AUTO, compressor_thrashing_min_per_10msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &compressor_thrashing_min_per_10msecs, 0, "");
4402
4403 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapouts_under_30s, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.unripe_under_30s, "");
4404 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapouts_under_60s, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.unripe_under_60s, "");
4405 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapouts_under_300s, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.unripe_under_300s, "");
4406 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_reclaim_swapins, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.reclaim_swapins, "");
4407 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_defrag_swapins, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.defrag_swapins, "");
4408 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_threshold_exceeded, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.compressor_swap_threshold_exceeded, "");
4409 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_fileq_throttled, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.external_q_throttled, "");
4410 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_free_count_low, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.free_count_below_reserve, "");
4411 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_thrashing_detected, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.thrashing_detected, "");
4412 SYSCTL_QUAD(_vm, OID_AUTO, compressor_swapper_swapout_fragmentation_detected, CTLFLAG_RD | CTLFLAG_LOCKED, &vmcs_stats.fragmentation_detected, "");
4413
4414 SYSCTL_STRING(_vm, OID_AUTO, swapfileprefix, CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED, swapfilename, sizeof(swapfilename) - SWAPFILENAME_INDEX_LEN, "");
4415
4416 SYSCTL_INT(_vm, OID_AUTO, compressor_timing_enabled, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_time_thread, 0, "");
4417
4418 #if DEVELOPMENT || DEBUG
4419 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_runtime0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_runtimes[0], "");
4420 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_runtime1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_runtimes[1], "");
4421
4422 SYSCTL_QUAD(_vm, OID_AUTO, compressor_threads_total_execution_time, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_cthreads_total, "");
4423
4424 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_pages0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_pages[0], "");
4425 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_pages1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_pages[1], "");
4426
4427 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_iterations0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_iterations[0], "");
4428 SYSCTL_QUAD(_vm, OID_AUTO, compressor_thread_iterations1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_iterations[1], "");
4429
4430 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_minpages0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_minpages[0], 0, "");
4431 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_minpages1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_minpages[1], 0, "");
4432
4433 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_maxpages0, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_maxpages[0], 0, "");
4434 SYSCTL_INT(_vm, OID_AUTO, compressor_thread_maxpages1, CTLFLAG_RD | CTLFLAG_LOCKED, &vmct_stats.vmct_maxpages[1], 0, "");
4435
4436 int vm_compressor_injected_error_count;
4437
4438 SYSCTL_INT(_vm, OID_AUTO, compressor_injected_error_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_compressor_injected_error_count, 0, "");
4439
4440 static int
sysctl_compressor_inject_error(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4441 sysctl_compressor_inject_error(__unused struct sysctl_oid *oidp,
4442 __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4443 {
4444 int result;
4445 vm_address_t va = 0;
4446 int changed;
4447
4448 result = sysctl_io_number(req, va, sizeof(va), &va, &changed);
4449 if (result == 0 && changed) {
4450 result = vm_map_inject_error(current_map(), va);
4451 if (result == 0) {
4452 /*
4453 * Count the number of errors injected successfully to detect
4454 * situations where corruption was caused by improper use of this
4455 * sysctl.
4456 */
4457 os_atomic_inc(&vm_compressor_injected_error_count, relaxed);
4458 }
4459 }
4460 return result;
4461 }
4462
4463 SYSCTL_PROC(_vm, OID_AUTO, compressor_inject_error, CTLTYPE_QUAD | CTLFLAG_LOCKED | CTLFLAG_RW,
4464 0, 0, sysctl_compressor_inject_error, "Q", "flips a bit in a compressed page for the current task");
4465
4466 /*
4467 * Opt a process in/out of self donation mode.
4468 */
4469 static int
4470 sysctl_vm_pid_toggle_selfdonate_pages SYSCTL_HANDLER_ARGS
4471 {
4472 #pragma unused(arg1, arg2)
4473 int error, pid = 0;
4474 proc_t p;
4475
4476 error = sysctl_handle_int(oidp, &pid, 0, req);
4477 if (error || !req->newptr) {
4478 return error;
4479 }
4480
4481 p = proc_find(pid);
4482 if (p != NULL) {
4483 (void) vm_toggle_task_selfdonate_pages(proc_task(p));
4484 proc_rele(p);
4485 return error;
4486 } else {
4487 printf("sysctl_vm_pid_selfdonate_pages: Invalid process\n");
4488 }
4489
4490 return EINVAL;
4491 }
4492 SYSCTL_PROC(_vm, OID_AUTO, pid_toggle_selfdonate_pages, CTLTYPE_INT | CTLFLAG_WR | CTLFLAG_LOCKED | CTLFLAG_MASKED,
4493 0, 0, &sysctl_vm_pid_toggle_selfdonate_pages, "I", "");
4494 #endif
4495 extern uint32_t vm_page_donate_mode;
4496 extern uint32_t vm_page_donate_target_high, vm_page_donate_target_low;
4497 SYSCTL_INT(_vm, OID_AUTO, vm_page_donate_mode, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_donate_mode, 0, "");
4498 SYSCTL_INT(_vm, OID_AUTO, vm_page_donate_target_high, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_donate_target_high, 0, "");
4499 SYSCTL_INT(_vm, OID_AUTO, vm_page_donate_target_low, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_donate_target_low, 0, "");
4500
4501 SYSCTL_QUAD(_vm, OID_AUTO, lz4_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_compressions, "");
4502 SYSCTL_QUAD(_vm, OID_AUTO, lz4_compression_failures, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_compression_failures, "");
4503 SYSCTL_QUAD(_vm, OID_AUTO, lz4_compressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_compressed_bytes, "");
4504 SYSCTL_QUAD(_vm, OID_AUTO, lz4_wk_compression_delta, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_wk_compression_delta, "");
4505 SYSCTL_QUAD(_vm, OID_AUTO, lz4_wk_compression_negative_delta, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_wk_compression_negative_delta, "");
4506
4507 SYSCTL_QUAD(_vm, OID_AUTO, lz4_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_decompressions, "");
4508 SYSCTL_QUAD(_vm, OID_AUTO, lz4_decompressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.lz4_decompressed_bytes, "");
4509
4510 SYSCTL_QUAD(_vm, OID_AUTO, uc_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.uc_decompressions, "");
4511
4512 SYSCTL_QUAD(_vm, OID_AUTO, wk_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressions, "");
4513
4514 SYSCTL_QUAD(_vm, OID_AUTO, wk_catime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_cabstime, "");
4515
4516 SYSCTL_QUAD(_vm, OID_AUTO, wkh_catime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_cabstime, "");
4517 SYSCTL_QUAD(_vm, OID_AUTO, wkh_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_compressions, "");
4518
4519 SYSCTL_QUAD(_vm, OID_AUTO, wks_catime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_cabstime, "");
4520 SYSCTL_QUAD(_vm, OID_AUTO, wks_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_compressions, "");
4521
4522 SYSCTL_QUAD(_vm, OID_AUTO, wk_compressions_exclusive, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressions_exclusive, "");
4523 SYSCTL_QUAD(_vm, OID_AUTO, wk_sv_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_sv_compressions, "");
4524 SYSCTL_QUAD(_vm, OID_AUTO, wk_mzv_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_mzv_compressions, "");
4525 SYSCTL_QUAD(_vm, OID_AUTO, wk_compression_failures, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compression_failures, "");
4526 SYSCTL_QUAD(_vm, OID_AUTO, wk_compressed_bytes_exclusive, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressed_bytes_exclusive, "");
4527 SYSCTL_QUAD(_vm, OID_AUTO, wk_compressed_bytes_total, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_compressed_bytes_total, "");
4528
4529 SYSCTL_QUAD(_vm, OID_AUTO, wks_compressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_compressed_bytes, "");
4530 SYSCTL_QUAD(_vm, OID_AUTO, wks_compression_failures, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_compression_failures, "");
4531 SYSCTL_QUAD(_vm, OID_AUTO, wks_sv_compressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_sv_compressions, "");
4532
4533
4534 SYSCTL_QUAD(_vm, OID_AUTO, wk_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_decompressions, "");
4535
4536 SYSCTL_QUAD(_vm, OID_AUTO, wk_datime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_dabstime, "");
4537
4538 SYSCTL_QUAD(_vm, OID_AUTO, wkh_datime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_dabstime, "");
4539 SYSCTL_QUAD(_vm, OID_AUTO, wkh_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wkh_decompressions, "");
4540
4541 SYSCTL_QUAD(_vm, OID_AUTO, wks_datime, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_dabstime, "");
4542 SYSCTL_QUAD(_vm, OID_AUTO, wks_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wks_decompressions, "");
4543
4544 SYSCTL_QUAD(_vm, OID_AUTO, wk_decompressed_bytes, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_decompressed_bytes, "");
4545 SYSCTL_QUAD(_vm, OID_AUTO, wk_sv_decompressions, CTLFLAG_RD | CTLFLAG_LOCKED, &compressor_stats.wk_sv_decompressions, "");
4546
4547 SYSCTL_INT(_vm, OID_AUTO, lz4_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_threshold, 0, "");
4548 SYSCTL_INT(_vm, OID_AUTO, wkdm_reeval_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.wkdm_reeval_threshold, 0, "");
4549 SYSCTL_INT(_vm, OID_AUTO, lz4_max_failure_skips, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_max_failure_skips, 0, "");
4550 SYSCTL_INT(_vm, OID_AUTO, lz4_max_failure_run_length, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_max_failure_run_length, 0, "");
4551 SYSCTL_INT(_vm, OID_AUTO, lz4_max_preselects, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_max_preselects, 0, "");
4552 SYSCTL_INT(_vm, OID_AUTO, lz4_run_preselection_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_run_preselection_threshold, 0, "");
4553 SYSCTL_INT(_vm, OID_AUTO, lz4_run_continue_bytes, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_run_continue_bytes, 0, "");
4554 SYSCTL_INT(_vm, OID_AUTO, lz4_profitable_bytes, CTLFLAG_RW | CTLFLAG_LOCKED, &vmctune.lz4_profitable_bytes, 0, "");
4555 #if DEVELOPMENT || DEBUG
4556 extern int vm_compressor_current_codec;
4557 extern int vm_compressor_test_seg_wp;
4558 extern boolean_t vm_compressor_force_sw_wkdm;
4559 SYSCTL_INT(_vm, OID_AUTO, compressor_codec, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_current_codec, 0, "");
4560 SYSCTL_INT(_vm, OID_AUTO, compressor_test_wp, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_test_seg_wp, 0, "");
4561
4562 SYSCTL_INT(_vm, OID_AUTO, wksw_force, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_compressor_force_sw_wkdm, 0, "");
4563 extern int precompy, wkswhw;
4564
4565 SYSCTL_INT(_vm, OID_AUTO, precompy, CTLFLAG_RW | CTLFLAG_LOCKED, &precompy, 0, "");
4566 SYSCTL_INT(_vm, OID_AUTO, wkswhw, CTLFLAG_RW | CTLFLAG_LOCKED, &wkswhw, 0, "");
4567 extern unsigned int vm_ktrace_enabled;
4568 SYSCTL_INT(_vm, OID_AUTO, vm_ktrace, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_ktrace_enabled, 0, "");
4569 #endif
4570
4571 #if CONFIG_PHANTOM_CACHE
4572 extern uint32_t phantom_cache_thrashing_threshold;
4573 extern uint32_t phantom_cache_eval_period_in_msecs;
4574 extern uint32_t phantom_cache_thrashing_threshold_ssd;
4575
4576
4577 SYSCTL_INT(_vm, OID_AUTO, phantom_cache_eval_period_in_msecs, CTLFLAG_RW | CTLFLAG_LOCKED, &phantom_cache_eval_period_in_msecs, 0, "");
4578 SYSCTL_INT(_vm, OID_AUTO, phantom_cache_thrashing_threshold, CTLFLAG_RW | CTLFLAG_LOCKED, &phantom_cache_thrashing_threshold, 0, "");
4579 SYSCTL_INT(_vm, OID_AUTO, phantom_cache_thrashing_threshold_ssd, CTLFLAG_RW | CTLFLAG_LOCKED, &phantom_cache_thrashing_threshold_ssd, 0, "");
4580 #endif
4581
4582 #if defined(__LP64__)
4583 extern uint32_t vm_page_background_count;
4584 extern uint32_t vm_page_background_target;
4585 extern uint32_t vm_page_background_internal_count;
4586 extern uint32_t vm_page_background_external_count;
4587 extern uint32_t vm_page_background_mode;
4588 extern uint32_t vm_page_background_exclude_external;
4589 extern uint64_t vm_page_background_promoted_count;
4590 extern uint64_t vm_pageout_rejected_bq_internal;
4591 extern uint64_t vm_pageout_rejected_bq_external;
4592
4593 SYSCTL_INT(_vm, OID_AUTO, vm_page_background_mode, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_background_mode, 0, "");
4594 SYSCTL_INT(_vm, OID_AUTO, vm_page_background_exclude_external, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_background_exclude_external, 0, "");
4595 SYSCTL_INT(_vm, OID_AUTO, vm_page_background_target, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_page_background_target, 0, "");
4596 SYSCTL_INT(_vm, OID_AUTO, vm_page_background_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_count, 0, "");
4597 SYSCTL_INT(_vm, OID_AUTO, vm_page_background_internal_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_internal_count, 0, "");
4598 SYSCTL_INT(_vm, OID_AUTO, vm_page_background_external_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_external_count, 0, "");
4599
4600 SYSCTL_QUAD(_vm, OID_AUTO, vm_page_background_promoted_count, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_background_promoted_count, "");
4601 SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_considered_bq_internal, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_vminfo.vm_pageout_considered_bq_internal, "");
4602 SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_considered_bq_external, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_vminfo.vm_pageout_considered_bq_external, "");
4603 SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_rejected_bq_internal, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_rejected_bq_internal, "");
4604 SYSCTL_QUAD(_vm, OID_AUTO, vm_pageout_rejected_bq_external, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_rejected_bq_external, "");
4605
4606 #endif /* __LP64__ */
4607
4608 extern void vm_update_darkwake_mode(boolean_t);
4609 extern boolean_t vm_darkwake_mode;
4610
4611 STATIC int
sysctl_toggle_darkwake_mode(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)4612 sysctl_toggle_darkwake_mode(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
4613 {
4614 int new_value, changed;
4615 int error = sysctl_io_number(req, vm_darkwake_mode, sizeof(int), &new_value, &changed);
4616
4617 if (!error && changed) {
4618 if (new_value != 0 && new_value != 1) {
4619 printf("Error: Invalid value passed to darkwake sysctl. Acceptable: 0 or 1.\n");
4620 error = EINVAL;
4621 } else {
4622 vm_update_darkwake_mode((boolean_t) new_value);
4623 }
4624 }
4625
4626 return error;
4627 }
4628
4629 SYSCTL_PROC(_vm, OID_AUTO, darkwake_mode,
4630 CTLTYPE_INT | CTLFLAG_LOCKED | CTLFLAG_RW,
4631 0, 0, sysctl_toggle_darkwake_mode, "I", "");
4632
4633 #if (DEVELOPMENT || DEBUG)
4634
4635 SYSCTL_UINT(_vm, OID_AUTO, vm_page_creation_throttled_hard,
4636 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
4637 &vm_page_creation_throttled_hard, 0, "");
4638
4639 SYSCTL_UINT(_vm, OID_AUTO, vm_page_creation_throttled_soft,
4640 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
4641 &vm_page_creation_throttled_soft, 0, "");
4642
4643 extern uint32_t vm_pageout_memorystatus_fb_factor_nr;
4644 extern uint32_t vm_pageout_memorystatus_fb_factor_dr;
4645 SYSCTL_INT(_vm, OID_AUTO, vm_pageout_memorystatus_fb_factor_nr, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_memorystatus_fb_factor_nr, 0, "");
4646 SYSCTL_INT(_vm, OID_AUTO, vm_pageout_memorystatus_fb_factor_dr, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_memorystatus_fb_factor_dr, 0, "");
4647
4648 extern uint32_t vm_grab_anon_nops;
4649
4650 SYSCTL_INT(_vm, OID_AUTO, vm_grab_anon_overrides, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_debug.vm_grab_anon_overrides, 0, "");
4651 SYSCTL_INT(_vm, OID_AUTO, vm_grab_anon_nops, CTLFLAG_RW | CTLFLAG_LOCKED, &vm_pageout_debug.vm_grab_anon_nops, 0, "");
4652 SYSCTL_INT(_vm, OID_AUTO, vm_pageout_yield_for_free_pages, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_pageout_debug.vm_pageout_yield_for_free_pages, 0, "");
4653
4654
4655 extern int vm_page_delayed_work_ctx_needed;
4656 SYSCTL_INT(_vm, OID_AUTO, vm_page_needed_delayed_work_ctx, CTLFLAG_RD | CTLFLAG_LOCKED, &vm_page_delayed_work_ctx_needed, 0, "");
4657
4658 /* log message counters for persistence mode */
4659 SCALABLE_COUNTER_DECLARE(oslog_p_total_msgcount);
4660 SCALABLE_COUNTER_DECLARE(oslog_p_metadata_saved_msgcount);
4661 SCALABLE_COUNTER_DECLARE(oslog_p_metadata_dropped_msgcount);
4662 SCALABLE_COUNTER_DECLARE(oslog_p_error_count);
4663 SCALABLE_COUNTER_DECLARE(oslog_p_saved_msgcount);
4664 SCALABLE_COUNTER_DECLARE(oslog_p_dropped_msgcount);
4665 SCALABLE_COUNTER_DECLARE(oslog_p_boot_dropped_msgcount);
4666 SCALABLE_COUNTER_DECLARE(oslog_p_coprocessor_total_msgcount);
4667 SCALABLE_COUNTER_DECLARE(oslog_p_coprocessor_dropped_msgcount);
4668 SCALABLE_COUNTER_DECLARE(oslog_p_unresolved_kc_msgcount);
4669 SCALABLE_COUNTER_DECLARE(oslog_p_fmt_invalid_msgcount);
4670 SCALABLE_COUNTER_DECLARE(oslog_p_fmt_max_args_msgcount);
4671 SCALABLE_COUNTER_DECLARE(oslog_p_truncated_msgcount);
4672
4673 SCALABLE_COUNTER_DECLARE(log_queue_cnt_received);
4674 SCALABLE_COUNTER_DECLARE(log_queue_cnt_rejected_fh);
4675 SCALABLE_COUNTER_DECLARE(log_queue_cnt_sent);
4676 SCALABLE_COUNTER_DECLARE(log_queue_cnt_dropped_nomem);
4677 SCALABLE_COUNTER_DECLARE(log_queue_cnt_queued);
4678 SCALABLE_COUNTER_DECLARE(log_queue_cnt_dropped_off);
4679 SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_active);
4680 SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_allocated);
4681 SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_released);
4682 SCALABLE_COUNTER_DECLARE(log_queue_cnt_mem_failed);
4683
4684 /* log message counters for streaming mode */
4685 SCALABLE_COUNTER_DECLARE(oslog_s_total_msgcount);
4686 SCALABLE_COUNTER_DECLARE(oslog_s_metadata_msgcount);
4687 SCALABLE_COUNTER_DECLARE(oslog_s_error_count);
4688 SCALABLE_COUNTER_DECLARE(oslog_s_streamed_msgcount);
4689 SCALABLE_COUNTER_DECLARE(oslog_s_dropped_msgcount);
4690
4691 /* log message counters for msgbuf logging */
4692 SCALABLE_COUNTER_DECLARE(oslog_msgbuf_msgcount);
4693 SCALABLE_COUNTER_DECLARE(oslog_msgbuf_dropped_msgcount);
4694 extern uint32_t oslog_msgbuf_dropped_charcount;
4695
4696 /* log message counters for vaddlog logging */
4697 extern uint32_t vaddlog_msgcount;
4698 extern uint32_t vaddlog_msgcount_dropped;
4699
4700 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_total_msgcount, oslog_p_total_msgcount, "");
4701 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_metadata_saved_msgcount, oslog_p_metadata_saved_msgcount, "");
4702 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_metadata_dropped_msgcount, oslog_p_metadata_dropped_msgcount, "");
4703 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_error_count, oslog_p_error_count, "");
4704 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_saved_msgcount, oslog_p_saved_msgcount, "");
4705 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_dropped_msgcount, oslog_p_dropped_msgcount, "");
4706 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_boot_dropped_msgcount, oslog_p_boot_dropped_msgcount, "");
4707 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_coprocessor_total_msgcount, oslog_p_coprocessor_total_msgcount, "");
4708 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_coprocessor_dropped_msgcount, oslog_p_coprocessor_dropped_msgcount, "");
4709 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_unresolved_kc_msgcount, oslog_p_unresolved_kc_msgcount, "");
4710
4711 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_fmt_invalid_msgcount, oslog_p_fmt_invalid_msgcount, "");
4712 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_fmt_max_args_msgcount, oslog_p_fmt_max_args_msgcount, "");
4713 SYSCTL_SCALABLE_COUNTER(_debug, oslog_p_truncated_msgcount, oslog_p_truncated_msgcount, "");
4714
4715 SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_total_msgcount, oslog_s_total_msgcount, "Number of logs sent to streaming");
4716 SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_metadata_msgcount, oslog_s_metadata_msgcount, "Number of metadata sent to streaming");
4717 SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_error_count, oslog_s_error_count, "Number of invalid stream logs");
4718 SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_streamed_msgcount, oslog_s_streamed_msgcount, "Number of streamed logs");
4719 SYSCTL_SCALABLE_COUNTER(_debug, oslog_s_dropped_msgcount, oslog_s_dropped_msgcount, "Number of logs dropped from stream");
4720
4721 SYSCTL_SCALABLE_COUNTER(_debug, oslog_msgbuf_msgcount, oslog_msgbuf_msgcount, "Number of dmesg log messages");
4722 SYSCTL_SCALABLE_COUNTER(_debug, oslog_msgbuf_dropped_msgcount, oslog_msgbuf_dropped_msgcount, "Number of dropped dmesg log messages");
4723 SYSCTL_UINT(_debug, OID_AUTO, oslog_msgbuf_dropped_charcount, CTLFLAG_ANYBODY | CTLFLAG_RD | CTLFLAG_LOCKED, &oslog_msgbuf_dropped_charcount, 0, "Number of dropped dmesg log chars");
4724
4725 SYSCTL_UINT(_debug, OID_AUTO, vaddlog_msgcount, CTLFLAG_ANYBODY | CTLFLAG_RD | CTLFLAG_LOCKED, &vaddlog_msgcount, 0, "");
4726 SYSCTL_UINT(_debug, OID_AUTO, vaddlog_msgcount_dropped, CTLFLAG_ANYBODY | CTLFLAG_RD | CTLFLAG_LOCKED, &vaddlog_msgcount_dropped, 0, "");
4727
4728 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_received, log_queue_cnt_received, "Number of received logs");
4729 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_rejected_fh, log_queue_cnt_rejected_fh, "Number of logs initially rejected by FH");
4730 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_sent, log_queue_cnt_sent, "Number of logs successfully saved in FH");
4731 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_dropped_nomem, log_queue_cnt_dropped_nomem, "Number of logs dropped due to lack of queue memory");
4732 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_queued, log_queue_cnt_queued, "Current number of logs stored in log queues");
4733 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_dropped_off, log_queue_cnt_dropped_off, "Number of logs dropped due to disabled log queues");
4734 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_mem_allocated, log_queue_cnt_mem_allocated, "Number of memory allocations");
4735 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_mem_released, log_queue_cnt_mem_released, "Number of memory releases");
4736 SYSCTL_SCALABLE_COUNTER(_debug, log_queue_cnt_mem_failed, log_queue_cnt_mem_failed, "Number of failed memory allocations");
4737
4738 #endif /* DEVELOPMENT || DEBUG */
4739
4740 /*
4741 * Enable tracing of voucher contents
4742 */
4743 extern uint32_t ipc_voucher_trace_contents;
4744
4745 SYSCTL_INT(_kern, OID_AUTO, ipc_voucher_trace_contents,
4746 CTLFLAG_RW | CTLFLAG_LOCKED, &ipc_voucher_trace_contents, 0, "Enable tracing voucher contents");
4747
4748 /*
4749 * Kernel stack size and depth
4750 */
4751 SYSCTL_INT(_kern, OID_AUTO, stack_size,
4752 CTLFLAG_RD | CTLFLAG_LOCKED, (int *) &kernel_stack_size, 0, "Kernel stack size");
4753 SYSCTL_INT(_kern, OID_AUTO, stack_depth_max,
4754 CTLFLAG_RD | CTLFLAG_LOCKED, (int *) &kernel_stack_depth_max, 0, "Max kernel stack depth at interrupt or context switch");
4755
4756 extern unsigned int kern_feature_overrides;
4757 SYSCTL_INT(_kern, OID_AUTO, kern_feature_overrides,
4758 CTLFLAG_RD | CTLFLAG_LOCKED, &kern_feature_overrides, 0, "Kernel feature override mask");
4759
4760 /*
4761 * enable back trace for port allocations
4762 */
4763 extern int ipc_portbt;
4764
4765 SYSCTL_INT(_kern, OID_AUTO, ipc_portbt,
4766 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
4767 &ipc_portbt, 0, "");
4768
4769 /*
4770 * Mach message signature validation control and outputs
4771 */
4772 extern unsigned int ikm_signature_failures;
4773 SYSCTL_INT(_kern, OID_AUTO, ikm_signature_failures,
4774 CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_failures, 0, "Message signature failure count");
4775 extern unsigned int ikm_signature_failure_id;
4776 SYSCTL_INT(_kern, OID_AUTO, ikm_signature_failure_id,
4777 CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_failure_id, 0, "Message signature failure count");
4778
4779 #if (DEVELOPMENT || DEBUG)
4780 extern unsigned int ikm_signature_panic_disable;
4781 SYSCTL_INT(_kern, OID_AUTO, ikm_signature_panic_disable,
4782 CTLFLAG_RW | CTLFLAG_LOCKED, &ikm_signature_panic_disable, 0, "Message signature failure mode");
4783 extern unsigned int ikm_signature_header_failures;
4784 SYSCTL_INT(_kern, OID_AUTO, ikm_signature_header_failures,
4785 CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_header_failures, 0, "Message header signature failure count");
4786 extern unsigned int ikm_signature_trailer_failures;
4787 SYSCTL_INT(_kern, OID_AUTO, ikm_signature_trailer_failures,
4788 CTLFLAG_RD | CTLFLAG_LOCKED, &ikm_signature_trailer_failures, 0, "Message trailer signature failure count");
4789 #endif
4790
4791 /*
4792 * Scheduler sysctls
4793 */
4794
4795 SYSCTL_STRING(_kern, OID_AUTO, sched,
4796 CTLFLAG_RD | CTLFLAG_KERN | CTLFLAG_LOCKED,
4797 sched_string, sizeof(sched_string),
4798 "Timeshare scheduler implementation");
4799
4800 #if CONFIG_QUIESCE_COUNTER
4801 static int
4802 sysctl_cpu_quiescent_counter_interval SYSCTL_HANDLER_ARGS
4803 {
4804 #pragma unused(arg1, arg2)
4805
4806 uint32_t local_min_interval_us = cpu_quiescent_counter_get_min_interval_us();
4807
4808 int error = sysctl_handle_int(oidp, &local_min_interval_us, 0, req);
4809 if (error || !req->newptr) {
4810 return error;
4811 }
4812
4813 cpu_quiescent_counter_set_min_interval_us(local_min_interval_us);
4814
4815 return 0;
4816 }
4817
4818 SYSCTL_PROC(_kern, OID_AUTO, cpu_checkin_interval,
4819 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
4820 0, 0,
4821 sysctl_cpu_quiescent_counter_interval, "I",
4822 "Quiescent CPU checkin interval (microseconds)");
4823 #endif /* CONFIG_QUIESCE_COUNTER */
4824
4825 /*
4826 * Allow the precise user/kernel time sysctl to be set, but don't allow it to
4827 * affect anything. Some tools expect to be able to set this, even though
4828 * runtime configuration is no longer supported.
4829 */
4830
4831 static int
4832 sysctl_precise_user_kernel_time SYSCTL_HANDLER_ARGS
4833 {
4834 #if PRECISE_USER_KERNEL_TIME
4835 int dummy_set = 1;
4836 #else /* PRECISE_USER_KERNEL_TIME */
4837 int dummy_set = 0;
4838 #endif /* !PRECISE_USER_KERNEL_TIME */
4839 return sysctl_handle_int(oidp, &dummy_set, 0, req);
4840 }
4841
4842 SYSCTL_PROC(_kern, OID_AUTO, precise_user_kernel_time,
4843 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
4844 0, 0, sysctl_precise_user_kernel_time, "I",
4845 "Precise accounting of kernel vs. user time (deprecated)");
4846
4847 #if CONFIG_PERVASIVE_ENERGY && HAS_CPU_DPE_COUNTER
4848 __security_const_late static int pervasive_energy = 1;
4849 #else /* CONFIG_PERVASIVE_ENERGY && HAS_CPU_DPE_COUNTER */
4850 __security_const_late static int pervasive_energy = 0;
4851 #endif /* !CONFIG_PERVASIVE_ENERGY || !HAS_CPU_DPE_COUNTER */
4852
4853 SYSCTL_INT(_kern, OID_AUTO, pervasive_energy,
4854 CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED, &pervasive_energy, 0, "");
4855
4856 /* Parameters related to timer coalescing tuning, to be replaced
4857 * with a dedicated systemcall in the future.
4858 */
4859 /* Enable processing pending timers in the context of any other interrupt
4860 * Coalescing tuning parameters for various thread/task attributes */
4861 STATIC int
4862 sysctl_timer_user_us_kernel_abstime SYSCTL_HANDLER_ARGS
4863 {
4864 #pragma unused(oidp)
4865 int size = arg2; /* subcommand*/
4866 int error;
4867 int changed = 0;
4868 uint64_t old_value_ns;
4869 uint64_t new_value_ns;
4870 uint64_t value_abstime;
4871 if (size == sizeof(uint32_t)) {
4872 value_abstime = *((uint32_t *)arg1);
4873 } else if (size == sizeof(uint64_t)) {
4874 value_abstime = *((uint64_t *)arg1);
4875 } else {
4876 return ENOTSUP;
4877 }
4878
4879 absolutetime_to_nanoseconds(value_abstime, &old_value_ns);
4880 error = sysctl_io_number(req, old_value_ns, sizeof(old_value_ns), &new_value_ns, &changed);
4881 if ((error) || (!changed)) {
4882 return error;
4883 }
4884
4885 nanoseconds_to_absolutetime(new_value_ns, &value_abstime);
4886 if (size == sizeof(uint32_t)) {
4887 *((uint32_t *)arg1) = (uint32_t)value_abstime;
4888 } else {
4889 *((uint64_t *)arg1) = value_abstime;
4890 }
4891 return error;
4892 }
4893
4894 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_bg_scale,
4895 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4896 &tcoal_prio_params.timer_coalesce_bg_shift, 0, "");
4897 SYSCTL_PROC(_kern, OID_AUTO, timer_resort_threshold_ns,
4898 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4899 &tcoal_prio_params.timer_resort_threshold_abstime,
4900 sizeof(tcoal_prio_params.timer_resort_threshold_abstime),
4901 sysctl_timer_user_us_kernel_abstime,
4902 "Q", "");
4903 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_bg_ns_max,
4904 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4905 &tcoal_prio_params.timer_coalesce_bg_abstime_max,
4906 sizeof(tcoal_prio_params.timer_coalesce_bg_abstime_max),
4907 sysctl_timer_user_us_kernel_abstime,
4908 "Q", "");
4909
4910 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_kt_scale,
4911 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4912 &tcoal_prio_params.timer_coalesce_kt_shift, 0, "");
4913
4914 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_kt_ns_max,
4915 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4916 &tcoal_prio_params.timer_coalesce_kt_abstime_max,
4917 sizeof(tcoal_prio_params.timer_coalesce_kt_abstime_max),
4918 sysctl_timer_user_us_kernel_abstime,
4919 "Q", "");
4920
4921 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_fp_scale,
4922 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4923 &tcoal_prio_params.timer_coalesce_fp_shift, 0, "");
4924
4925 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_fp_ns_max,
4926 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4927 &tcoal_prio_params.timer_coalesce_fp_abstime_max,
4928 sizeof(tcoal_prio_params.timer_coalesce_fp_abstime_max),
4929 sysctl_timer_user_us_kernel_abstime,
4930 "Q", "");
4931
4932 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_ts_scale,
4933 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4934 &tcoal_prio_params.timer_coalesce_ts_shift, 0, "");
4935
4936 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_ts_ns_max,
4937 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4938 &tcoal_prio_params.timer_coalesce_ts_abstime_max,
4939 sizeof(tcoal_prio_params.timer_coalesce_ts_abstime_max),
4940 sysctl_timer_user_us_kernel_abstime,
4941 "Q", "");
4942
4943 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier0_scale,
4944 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4945 &tcoal_prio_params.latency_qos_scale[0], 0, "");
4946
4947 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier0_ns_max,
4948 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4949 &tcoal_prio_params.latency_qos_abstime_max[0],
4950 sizeof(tcoal_prio_params.latency_qos_abstime_max[0]),
4951 sysctl_timer_user_us_kernel_abstime,
4952 "Q", "");
4953
4954 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier1_scale,
4955 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4956 &tcoal_prio_params.latency_qos_scale[1], 0, "");
4957
4958 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier1_ns_max,
4959 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4960 &tcoal_prio_params.latency_qos_abstime_max[1],
4961 sizeof(tcoal_prio_params.latency_qos_abstime_max[1]),
4962 sysctl_timer_user_us_kernel_abstime,
4963 "Q", "");
4964
4965 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier2_scale,
4966 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4967 &tcoal_prio_params.latency_qos_scale[2], 0, "");
4968
4969 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier2_ns_max,
4970 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4971 &tcoal_prio_params.latency_qos_abstime_max[2],
4972 sizeof(tcoal_prio_params.latency_qos_abstime_max[2]),
4973 sysctl_timer_user_us_kernel_abstime,
4974 "Q", "");
4975
4976 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier3_scale,
4977 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4978 &tcoal_prio_params.latency_qos_scale[3], 0, "");
4979
4980 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier3_ns_max,
4981 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4982 &tcoal_prio_params.latency_qos_abstime_max[3],
4983 sizeof(tcoal_prio_params.latency_qos_abstime_max[3]),
4984 sysctl_timer_user_us_kernel_abstime,
4985 "Q", "");
4986
4987 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier4_scale,
4988 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4989 &tcoal_prio_params.latency_qos_scale[4], 0, "");
4990
4991 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier4_ns_max,
4992 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
4993 &tcoal_prio_params.latency_qos_abstime_max[4],
4994 sizeof(tcoal_prio_params.latency_qos_abstime_max[4]),
4995 sysctl_timer_user_us_kernel_abstime,
4996 "Q", "");
4997
4998 SYSCTL_INT(_kern, OID_AUTO, timer_coalesce_tier5_scale,
4999 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
5000 &tcoal_prio_params.latency_qos_scale[5], 0, "");
5001
5002 SYSCTL_PROC(_kern, OID_AUTO, timer_coalesce_tier5_ns_max,
5003 CTLTYPE_QUAD | CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
5004 &tcoal_prio_params.latency_qos_abstime_max[5],
5005 sizeof(tcoal_prio_params.latency_qos_abstime_max[5]),
5006 sysctl_timer_user_us_kernel_abstime,
5007 "Q", "");
5008
5009 /* Communicate the "user idle level" heuristic to the timer layer, and
5010 * potentially other layers in the future.
5011 */
5012
5013 static int
timer_user_idle_level(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)5014 timer_user_idle_level(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
5015 {
5016 int new_value = 0, old_value = 0, changed = 0, error;
5017
5018 old_value = timer_get_user_idle_level();
5019
5020 error = sysctl_io_number(req, old_value, sizeof(int), &new_value, &changed);
5021
5022 if (error == 0 && changed) {
5023 if (timer_set_user_idle_level(new_value) != KERN_SUCCESS) {
5024 error = ERANGE;
5025 }
5026 }
5027
5028 return error;
5029 }
5030
5031 SYSCTL_PROC(_machdep, OID_AUTO, user_idle_level,
5032 CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED,
5033 0, 0,
5034 timer_user_idle_level, "I", "User idle level heuristic, 0-128");
5035
5036 #if HYPERVISOR
5037 SYSCTL_INT(_kern, OID_AUTO, hv_support,
5038 CTLFLAG_KERN | CTLFLAG_RD | CTLFLAG_LOCKED,
5039 &hv_support_available, 0, "");
5040
5041 SYSCTL_INT(_kern, OID_AUTO, hv_disable,
5042 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
5043 &hv_disable, 0, "");
5044
5045 #endif /* HYPERVISOR */
5046
5047 #if DEVELOPMENT || DEBUG
5048 extern uint64_t driverkit_checkin_timed_out;
5049 SYSCTL_QUAD(_kern, OID_AUTO, driverkit_checkin_timed_out,
5050 CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_LOCKED,
5051 &driverkit_checkin_timed_out, "timestamp of dext checkin timeout");
5052 #endif
5053
5054 #if CONFIG_DARKBOOT
5055 STATIC int
5056 sysctl_darkboot SYSCTL_HANDLER_ARGS
5057 {
5058 int err = 0, value = 0;
5059 #pragma unused(oidp, arg1, arg2, err, value, req)
5060
5061 /*
5062 * Handle the sysctl request.
5063 *
5064 * If this is a read, the function will set the value to the current darkboot value. Otherwise,
5065 * we'll get the request identifier into "value" and then we can honor it.
5066 */
5067 if ((err = sysctl_io_number(req, darkboot, sizeof(int), &value, NULL)) != 0) {
5068 goto exit;
5069 }
5070
5071 /* writing requested, let's process the request */
5072 if (req->newptr) {
5073 /* writing is protected by an entitlement */
5074 if (priv_check_cred(kauth_cred_get(), PRIV_DARKBOOT, 0) != 0) {
5075 err = EPERM;
5076 goto exit;
5077 }
5078
5079 switch (value) {
5080 case MEMORY_MAINTENANCE_DARK_BOOT_UNSET:
5081 /*
5082 * If the darkboot sysctl is unset, the NVRAM variable
5083 * must be unset too. If that's not the case, it means
5084 * someone is doing something crazy and not supported.
5085 */
5086 if (darkboot != 0) {
5087 int ret = PERemoveNVRAMProperty(MEMORY_MAINTENANCE_DARK_BOOT_NVRAM_NAME);
5088 if (ret) {
5089 darkboot = 0;
5090 } else {
5091 err = EINVAL;
5092 }
5093 }
5094 break;
5095 case MEMORY_MAINTENANCE_DARK_BOOT_SET:
5096 darkboot = 1;
5097 break;
5098 case MEMORY_MAINTENANCE_DARK_BOOT_SET_PERSISTENT: {
5099 /*
5100 * Set the NVRAM and update 'darkboot' in case
5101 * of success. Otherwise, do not update
5102 * 'darkboot' and report the failure.
5103 */
5104 if (PEWriteNVRAMBooleanProperty(MEMORY_MAINTENANCE_DARK_BOOT_NVRAM_NAME, TRUE)) {
5105 darkboot = 1;
5106 } else {
5107 err = EINVAL;
5108 }
5109
5110 break;
5111 }
5112 default:
5113 err = EINVAL;
5114 }
5115 }
5116
5117 exit:
5118 return err;
5119 }
5120
5121 SYSCTL_PROC(_kern, OID_AUTO, darkboot,
5122 CTLFLAG_KERN | CTLTYPE_INT | CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY,
5123 0, 0, sysctl_darkboot, "I", "");
5124 #endif /* CONFIG_DARKBOOT */
5125
5126 #if DEVELOPMENT || DEBUG
5127 #include <sys/sysent.h>
5128 /* This should result in a fatal exception, verifying that "sysent" is
5129 * write-protected.
5130 */
5131 static int
kern_sysent_write(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)5132 kern_sysent_write(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
5133 {
5134 uint64_t new_value = 0, old_value = 0;
5135 int changed = 0, error;
5136
5137 error = sysctl_io_number(req, old_value, sizeof(uint64_t), &new_value, &changed);
5138 if ((error == 0) && changed) {
5139 volatile uint32_t *wraddr = __DECONST(uint32_t *, &sysent[0]);
5140 *wraddr = 0;
5141 printf("sysent[0] write succeeded\n");
5142 }
5143 return error;
5144 }
5145
5146 SYSCTL_PROC(_kern, OID_AUTO, sysent_const_check,
5147 CTLTYPE_QUAD | CTLFLAG_RW | CTLFLAG_LOCKED,
5148 0, 0,
5149 kern_sysent_write, "I", "Attempt sysent[0] write");
5150
5151 #endif
5152
5153 #if DEVELOPMENT || DEBUG
5154 SYSCTL_COMPAT_INT(_kern, OID_AUTO, development, CTLFLAG_RD | CTLFLAG_MASKED | CTLFLAG_KERN, NULL, 1, "");
5155 #else
5156 SYSCTL_COMPAT_INT(_kern, OID_AUTO, development, CTLFLAG_RD | CTLFLAG_MASKED, NULL, 0, "");
5157 #endif
5158
5159
5160 #if DEVELOPMENT || DEBUG
5161
5162 decl_lck_spin_data(, spinlock_panic_test_lock);
5163
5164 __attribute__((noreturn))
5165 static void
spinlock_panic_test_acquire_spinlock(void * arg __unused,wait_result_t wres __unused)5166 spinlock_panic_test_acquire_spinlock(void * arg __unused, wait_result_t wres __unused)
5167 {
5168 lck_spin_lock(&spinlock_panic_test_lock);
5169 while (1) {
5170 ;
5171 }
5172 }
5173
5174 static int
5175 sysctl_spinlock_panic_test SYSCTL_HANDLER_ARGS
5176 {
5177 #pragma unused(oidp, arg1, arg2)
5178 if (req->newlen == 0) {
5179 return EINVAL;
5180 }
5181
5182 thread_t panic_spinlock_thread;
5183 /* Initialize panic spinlock */
5184 lck_grp_t * panic_spinlock_grp;
5185 lck_grp_attr_t * panic_spinlock_grp_attr;
5186 lck_attr_t * panic_spinlock_attr;
5187
5188 panic_spinlock_grp_attr = lck_grp_attr_alloc_init();
5189 panic_spinlock_grp = lck_grp_alloc_init("panic_spinlock", panic_spinlock_grp_attr);
5190 panic_spinlock_attr = lck_attr_alloc_init();
5191
5192 lck_spin_init(&spinlock_panic_test_lock, panic_spinlock_grp, panic_spinlock_attr);
5193
5194
5195 /* Create thread to acquire spinlock */
5196 if (kernel_thread_start(spinlock_panic_test_acquire_spinlock, NULL, &panic_spinlock_thread) != KERN_SUCCESS) {
5197 return EBUSY;
5198 }
5199
5200 /* Try to acquire spinlock -- should panic eventually */
5201 lck_spin_lock(&spinlock_panic_test_lock);
5202 while (1) {
5203 ;
5204 }
5205 }
5206
5207 __attribute__((noreturn))
5208 static void
simultaneous_panic_worker(void * arg,wait_result_t wres __unused)5209 simultaneous_panic_worker
5210 (void * arg, wait_result_t wres __unused)
5211 {
5212 atomic_int *start_panic = (atomic_int *)arg;
5213
5214 while (!atomic_load(start_panic)) {
5215 ;
5216 }
5217 panic("SIMULTANEOUS PANIC TEST: INITIATING PANIC FROM CPU %d", cpu_number());
5218 __builtin_unreachable();
5219 }
5220
5221 static int
5222 sysctl_simultaneous_panic_test SYSCTL_HANDLER_ARGS
5223 {
5224 #pragma unused(oidp, arg1, arg2)
5225 if (req->newlen == 0) {
5226 return EINVAL;
5227 }
5228
5229 int i = 0, threads_to_create = 2 * processor_count;
5230 atomic_int start_panic = 0;
5231 unsigned int threads_created = 0;
5232 thread_t new_panic_thread;
5233
5234 for (i = threads_to_create; i > 0; i--) {
5235 if (kernel_thread_start(simultaneous_panic_worker, (void *) &start_panic, &new_panic_thread) == KERN_SUCCESS) {
5236 threads_created++;
5237 }
5238 }
5239
5240 /* FAIL if we couldn't create at least processor_count threads */
5241 if (threads_created < processor_count) {
5242 panic("SIMULTANEOUS PANIC TEST: FAILED TO CREATE ENOUGH THREADS, ONLY CREATED %d (of %d)",
5243 threads_created, threads_to_create);
5244 }
5245
5246 atomic_exchange(&start_panic, 1);
5247 while (1) {
5248 ;
5249 }
5250 }
5251
5252 extern unsigned int panic_test_failure_mode;
5253 SYSCTL_INT(_debug, OID_AUTO, xnu_panic_failure_mode, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_KERN, &panic_test_failure_mode, 0, "panic/debugger test failure mode");
5254
5255 extern unsigned int panic_test_action_count;
5256 SYSCTL_INT(_debug, OID_AUTO, xnu_panic_action_count, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_KERN, &panic_test_action_count, 0, "panic/debugger test action count");
5257
5258 extern unsigned int panic_test_case;
5259 SYSCTL_INT(_debug, OID_AUTO, xnu_panic_test_case, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_KERN, &panic_test_case, 0, "panic/debugger testcase");
5260
5261 SYSCTL_PROC(_debug, OID_AUTO, xnu_spinlock_panic_test, CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_MASKED, 0, 0, sysctl_spinlock_panic_test, "A", "spinlock panic test");
5262 SYSCTL_PROC(_debug, OID_AUTO, xnu_simultaneous_panic_test, CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_KERN | CTLFLAG_MASKED, 0, 0, sysctl_simultaneous_panic_test, "A", "simultaneous panic test");
5263
5264 extern int exc_resource_threads_enabled;
5265
5266 SYSCTL_INT(_kern, OID_AUTO, exc_resource_threads_enabled, CTLFLAG_RD | CTLFLAG_LOCKED, &exc_resource_threads_enabled, 0, "exc_resource thread limit enabled");
5267
5268
5269 #endif /* DEVELOPMENT || DEBUG */
5270
5271 #if CONFIG_THREAD_GROUPS
5272 #if DEVELOPMENT || DEBUG
5273
5274 static int
5275 sysctl_get_thread_group_id SYSCTL_HANDLER_ARGS
5276 {
5277 #pragma unused(arg1, arg2, oidp)
5278 uint64_t thread_group_id = thread_group_get_id(thread_group_get(current_thread()));
5279 return SYSCTL_OUT(req, &thread_group_id, sizeof(thread_group_id));
5280 }
5281
5282 SYSCTL_PROC(_kern, OID_AUTO, thread_group_id, CTLFLAG_RD | CTLFLAG_LOCKED | CTLTYPE_QUAD,
5283 0, 0, &sysctl_get_thread_group_id, "I", "thread group id of the thread");
5284
5285 STATIC int
sysctl_thread_group_count(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)5286 sysctl_thread_group_count(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
5287 {
5288 int value = thread_group_count();
5289 return sysctl_io_number(req, value, sizeof(value), NULL, NULL);
5290 }
5291
5292 SYSCTL_PROC(_kern, OID_AUTO, thread_group_count, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
5293 0, 0, &sysctl_thread_group_count, "I", "count of thread groups");
5294
5295 #endif /* DEVELOPMENT || DEBUG */
5296 const uint32_t thread_groups_supported = 1;
5297 #else /* CONFIG_THREAD_GROUPS */
5298 const uint32_t thread_groups_supported = 0;
5299 #endif /* CONFIG_THREAD_GROUPS */
5300
5301 STATIC int
sysctl_thread_groups_supported(__unused struct sysctl_oid * oidp,__unused void * arg1,__unused int arg2,struct sysctl_req * req)5302 sysctl_thread_groups_supported(__unused struct sysctl_oid *oidp, __unused void *arg1, __unused int arg2, struct sysctl_req *req)
5303 {
5304 int value = thread_groups_supported;
5305 return sysctl_io_number(req, value, sizeof(value), NULL, NULL);
5306 }
5307
5308 SYSCTL_PROC(_kern, OID_AUTO, thread_groups_supported, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
5309 0, 0, &sysctl_thread_groups_supported, "I", "thread groups supported");
5310
5311 static int
5312 sysctl_grade_cputype SYSCTL_HANDLER_ARGS
5313 {
5314 #pragma unused(arg1, arg2, oidp)
5315 int error = 0;
5316 int type_tuple[2] = {};
5317 int return_value = 0;
5318
5319 error = SYSCTL_IN(req, &type_tuple, sizeof(type_tuple));
5320
5321 if (error) {
5322 return error;
5323 }
5324
5325 return_value = grade_binary(type_tuple[0], type_tuple[1] & ~CPU_SUBTYPE_MASK, type_tuple[1] & CPU_SUBTYPE_MASK, FALSE);
5326
5327 error = SYSCTL_OUT(req, &return_value, sizeof(return_value));
5328
5329 if (error) {
5330 return error;
5331 }
5332
5333 return error;
5334 }
5335
5336 SYSCTL_PROC(_kern, OID_AUTO, grade_cputype,
5337 CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_MASKED | CTLFLAG_LOCKED | CTLTYPE_OPAQUE,
5338 0, 0, &sysctl_grade_cputype, "S",
5339 "grade value of cpu_type_t+cpu_sub_type_t");
5340
5341 extern boolean_t allow_direct_handoff;
5342 SYSCTL_INT(_kern, OID_AUTO, direct_handoff,
5343 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
5344 &allow_direct_handoff, 0, "Enable direct handoff for realtime threads");
5345
5346 #if DEVELOPMENT || DEBUG
5347
5348 SYSCTL_LONG(_kern, OID_AUTO, phys_carveout_pa, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
5349 &phys_carveout_pa,
5350 "base physical address of the phys_carveout_mb boot-arg region");
5351 SYSCTL_LONG(_kern, OID_AUTO, phys_carveout_size, CTLFLAG_RD | CTLFLAG_LOCKED | CTLFLAG_KERN,
5352 &phys_carveout_size,
5353 "size in bytes of the phys_carveout_mb boot-arg region");
5354
5355
5356 extern void do_cseg_wedge_thread(void);
5357 extern void do_cseg_unwedge_thread(void);
5358
5359 static int
5360 cseg_wedge_thread SYSCTL_HANDLER_ARGS
5361 {
5362 #pragma unused(arg1, arg2)
5363
5364 int error, val = 0;
5365 error = sysctl_handle_int(oidp, &val, 0, req);
5366 if (error || val == 0) {
5367 return error;
5368 }
5369
5370 do_cseg_wedge_thread();
5371 return 0;
5372 }
5373 SYSCTL_PROC(_kern, OID_AUTO, cseg_wedge_thread, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_MASKED, 0, 0, cseg_wedge_thread, "I", "wedge c_seg thread");
5374
5375 static int
5376 cseg_unwedge_thread SYSCTL_HANDLER_ARGS
5377 {
5378 #pragma unused(arg1, arg2)
5379
5380 int error, val = 0;
5381 error = sysctl_handle_int(oidp, &val, 0, req);
5382 if (error || val == 0) {
5383 return error;
5384 }
5385
5386 do_cseg_unwedge_thread();
5387 return 0;
5388 }
5389 SYSCTL_PROC(_kern, OID_AUTO, cseg_unwedge_thread, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_MASKED, 0, 0, cseg_unwedge_thread, "I", "unstuck c_seg thread");
5390
5391 static atomic_int wedge_thread_should_wake = 0;
5392
5393 static int
5394 unwedge_thread SYSCTL_HANDLER_ARGS
5395 {
5396 #pragma unused(arg1, arg2)
5397 int error, val = 0;
5398 error = sysctl_handle_int(oidp, &val, 0, req);
5399 if (error || val == 0) {
5400 return error;
5401 }
5402
5403 atomic_store(&wedge_thread_should_wake, 1);
5404 return 0;
5405 }
5406
5407 SYSCTL_PROC(_kern, OID_AUTO, unwedge_thread, CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED, 0, 0, unwedge_thread, "I", "unwedge the thread wedged by kern.wedge_thread");
5408
5409 static int
5410 wedge_thread SYSCTL_HANDLER_ARGS
5411 {
5412 #pragma unused(arg1, arg2)
5413
5414 int error, val = 0;
5415 error = sysctl_handle_int(oidp, &val, 0, req);
5416 if (error || val == 0) {
5417 return error;
5418 }
5419
5420 uint64_t interval = 1;
5421 nanoseconds_to_absolutetime(1000 * 1000 * 50, &interval);
5422
5423 atomic_store(&wedge_thread_should_wake, 0);
5424 while (!atomic_load(&wedge_thread_should_wake)) {
5425 tsleep1(NULL, 0, "wedge_thread", mach_absolute_time() + interval, NULL);
5426 }
5427
5428 return 0;
5429 }
5430
5431 SYSCTL_PROC(_kern, OID_AUTO, wedge_thread,
5432 CTLFLAG_RW | CTLFLAG_ANYBODY | CTLFLAG_LOCKED, 0, 0, wedge_thread, "I",
5433 "wedge this thread so it cannot be cleaned up");
5434
5435 static int
5436 sysctl_total_corpses_count SYSCTL_HANDLER_ARGS
5437 {
5438 #pragma unused(oidp, arg1, arg2)
5439 extern unsigned long total_corpses_count(void);
5440
5441 unsigned long corpse_count_long = total_corpses_count();
5442 unsigned int corpse_count = (unsigned int)MIN(corpse_count_long, UINT_MAX);
5443 return sysctl_io_opaque(req, &corpse_count, sizeof(corpse_count), NULL);
5444 }
5445
5446 SYSCTL_PROC(_kern, OID_AUTO, total_corpses_count,
5447 CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_LOCKED, 0, 0,
5448 sysctl_total_corpses_count, "I", "total corpses on the system");
5449
5450 static int
5451 sysctl_turnstile_test_prim_lock SYSCTL_HANDLER_ARGS;
5452 static int
5453 sysctl_turnstile_test_prim_unlock SYSCTL_HANDLER_ARGS;
5454 int
5455 tstile_test_prim_lock(boolean_t use_hashtable);
5456 int
5457 tstile_test_prim_unlock(boolean_t use_hashtable);
5458
5459 static int
5460 sysctl_turnstile_test_prim_lock SYSCTL_HANDLER_ARGS
5461 {
5462 #pragma unused(arg1, arg2)
5463 int error, val = 0;
5464 error = sysctl_handle_int(oidp, &val, 0, req);
5465 if (error || val == 0) {
5466 return error;
5467 }
5468 switch (val) {
5469 case SYSCTL_TURNSTILE_TEST_USER_DEFAULT:
5470 case SYSCTL_TURNSTILE_TEST_USER_HASHTABLE:
5471 case SYSCTL_TURNSTILE_TEST_KERNEL_DEFAULT:
5472 case SYSCTL_TURNSTILE_TEST_KERNEL_HASHTABLE:
5473 return tstile_test_prim_lock(val);
5474 default:
5475 return error;
5476 }
5477 }
5478
5479 static int
5480 sysctl_turnstile_test_prim_unlock SYSCTL_HANDLER_ARGS
5481 {
5482 #pragma unused(arg1, arg2)
5483 int error, val = 0;
5484 error = sysctl_handle_int(oidp, &val, 0, req);
5485 if (error || val == 0) {
5486 return error;
5487 }
5488 switch (val) {
5489 case SYSCTL_TURNSTILE_TEST_USER_DEFAULT:
5490 case SYSCTL_TURNSTILE_TEST_USER_HASHTABLE:
5491 case SYSCTL_TURNSTILE_TEST_KERNEL_DEFAULT:
5492 case SYSCTL_TURNSTILE_TEST_KERNEL_HASHTABLE:
5493 return tstile_test_prim_unlock(val);
5494 default:
5495 return error;
5496 }
5497 }
5498
5499 SYSCTL_PROC(_kern, OID_AUTO, turnstiles_test_lock, CTLFLAG_WR | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
5500 0, 0, sysctl_turnstile_test_prim_lock, "I", "turnstiles test lock");
5501
5502 SYSCTL_PROC(_kern, OID_AUTO, turnstiles_test_unlock, CTLFLAG_WR | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
5503 0, 0, sysctl_turnstile_test_prim_unlock, "I", "turnstiles test unlock");
5504
5505 int
5506 turnstile_get_boost_stats_sysctl(void *req);
5507 int
5508 turnstile_get_unboost_stats_sysctl(void *req);
5509 static int
5510 sysctl_turnstile_boost_stats SYSCTL_HANDLER_ARGS;
5511 static int
5512 sysctl_turnstile_unboost_stats SYSCTL_HANDLER_ARGS;
5513 extern uint64_t thread_block_on_turnstile_count;
5514 extern uint64_t thread_block_on_regular_waitq_count;
5515
5516 static int
5517 sysctl_turnstile_boost_stats SYSCTL_HANDLER_ARGS
5518 {
5519 #pragma unused(arg1, arg2, oidp)
5520 return turnstile_get_boost_stats_sysctl(req);
5521 }
5522
5523 static int
5524 sysctl_turnstile_unboost_stats SYSCTL_HANDLER_ARGS
5525 {
5526 #pragma unused(arg1, arg2, oidp)
5527 return turnstile_get_unboost_stats_sysctl(req);
5528 }
5529
5530 SYSCTL_PROC(_kern, OID_AUTO, turnstile_boost_stats, CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLTYPE_STRUCT,
5531 0, 0, sysctl_turnstile_boost_stats, "S", "turnstiles boost stats");
5532 SYSCTL_PROC(_kern, OID_AUTO, turnstile_unboost_stats, CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLTYPE_STRUCT,
5533 0, 0, sysctl_turnstile_unboost_stats, "S", "turnstiles unboost stats");
5534 SYSCTL_QUAD(_kern, OID_AUTO, thread_block_count_on_turnstile,
5535 CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
5536 &thread_block_on_turnstile_count, "thread blocked on turnstile count");
5537 SYSCTL_QUAD(_kern, OID_AUTO, thread_block_count_on_reg_waitq,
5538 CTLFLAG_RD | CTLFLAG_ANYBODY | CTLFLAG_KERN | CTLFLAG_LOCKED,
5539 &thread_block_on_regular_waitq_count, "thread blocked on regular waitq count");
5540
5541 #if CONFIG_PV_TICKET
5542
5543 extern int ticket_lock_spins;
5544 SYSCTL_INT(_kern, OID_AUTO, ticket_lock_spins,
5545 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
5546 &ticket_lock_spins, 0, "loops before hypercall");
5547
5548 #if (DEBUG || DEVELOPMENT)
5549
5550 /* PV ticket lock stats */
5551
5552 SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_kicks, ticket_kick_count,
5553 "ticket lock kicks");
5554 SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_waits, ticket_wait_count,
5555 "ticket lock waits");
5556 SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_already, ticket_already_count,
5557 "ticket lock already unlocked");
5558 SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_just_unlock, ticket_just_unlock,
5559 "ticket unlock without kick");
5560 SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_wflag_cleared, ticket_wflag_cleared,
5561 "ticket lock wait flag cleared");
5562 SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_wflag_still, ticket_wflag_still,
5563 "ticket lock wait flag not cleared");
5564 SYSCTL_SCALABLE_COUNTER(_kern, ticket_lock_spin_count, ticket_spin_count,
5565 "ticket lock spin count");
5566
5567 /* sysctl kern.hcall_probe=n -- does hypercall #n exist? */
5568
5569 static int
5570 sysctl_hcall_probe SYSCTL_HANDLER_ARGS
5571 {
5572 char instr[20];
5573
5574 if (!req->newptr) {
5575 return 0;
5576 }
5577 if (req->newlen >= sizeof(instr)) {
5578 return EOVERFLOW;
5579 }
5580
5581 int error = SYSCTL_IN(req, instr, req->newlen);
5582 if (error) {
5583 return error;
5584 }
5585 instr[req->newlen] = '\0';
5586
5587 int hcall = 0;
5588 error = sscanf(instr, "%d", &hcall);
5589 if (error != 1 || hcall < 0) {
5590 return EINVAL;
5591 }
5592 uprintf("%savailable\n",
5593 hvg_is_hcall_available((hvg_hcall_code_t)hcall) ? "" : "not ");
5594 return 0;
5595 }
5596
5597 SYSCTL_PROC(_kern, OID_AUTO, hcall_probe,
5598 CTLTYPE_STRING | CTLFLAG_WR | CTLFLAG_LOCKED | CTLFLAG_MASKED,
5599 0, 0, sysctl_hcall_probe, "A", "probe hypercall by id");
5600
5601 #endif /* (DEBUG || DEVELOPMENT) */
5602 #endif /* CONFIG_PV_TICKET */
5603
5604 #if defined(__x86_64__)
5605 extern uint64_t MutexSpin;
5606
5607 SYSCTL_QUAD(_kern, OID_AUTO, mutex_spin_abs, CTLFLAG_RW, &MutexSpin,
5608 "Spin time in abs for acquiring a kernel mutex");
5609 #else
5610 extern machine_timeout_t MutexSpin;
5611
5612 SYSCTL_QUAD(_kern, OID_AUTO, mutex_spin_abs, CTLFLAG_RW, &MutexSpin,
5613 "Spin time in abs for acquiring a kernel mutex");
5614 #endif
5615
5616 extern uint64_t low_MutexSpin;
5617 extern int64_t high_MutexSpin;
5618 extern unsigned int real_ncpus;
5619
5620 SYSCTL_QUAD(_kern, OID_AUTO, low_mutex_spin_abs, CTLFLAG_RW, &low_MutexSpin,
5621 "Low spin threshold in abs for acquiring a kernel mutex");
5622
5623 static int
5624 sysctl_high_mutex_spin_ns SYSCTL_HANDLER_ARGS
5625 {
5626 #pragma unused(oidp, arg1, arg2)
5627 int error;
5628 int64_t val = 0;
5629 int64_t res;
5630
5631 /* Check if the user is writing to high_MutexSpin, or just reading it */
5632 if (req->newptr) {
5633 error = SYSCTL_IN(req, &val, sizeof(val));
5634 if (error || (val < 0 && val != -1)) {
5635 return error;
5636 }
5637 high_MutexSpin = val;
5638 }
5639
5640 if (high_MutexSpin >= 0) {
5641 res = high_MutexSpin;
5642 } else {
5643 res = low_MutexSpin * real_ncpus;
5644 }
5645 return SYSCTL_OUT(req, &res, sizeof(res));
5646 }
5647 SYSCTL_PROC(_kern, OID_AUTO, high_mutex_spin_abs, CTLFLAG_RW | CTLTYPE_QUAD, 0, 0, sysctl_high_mutex_spin_ns, "I",
5648 "High spin threshold in abs for acquiring a kernel mutex");
5649
5650 #if defined (__x86_64__)
5651
5652 semaphore_t sysctl_test_panic_with_thread_sem;
5653
5654 #pragma clang diagnostic push
5655 #pragma clang diagnostic ignored "-Winfinite-recursion" /* rdar://38801963 */
5656 __attribute__((noreturn))
5657 static void
panic_thread_test_child_spin(void * arg,wait_result_t wres)5658 panic_thread_test_child_spin(void * arg, wait_result_t wres)
5659 {
5660 static int panic_thread_recurse_count = 5;
5661
5662 if (panic_thread_recurse_count > 0) {
5663 panic_thread_recurse_count--;
5664 panic_thread_test_child_spin(arg, wres);
5665 }
5666
5667 semaphore_signal(sysctl_test_panic_with_thread_sem);
5668 while (1) {
5669 ;
5670 }
5671 }
5672 #pragma clang diagnostic pop
5673
5674 static void
panic_thread_test_child_park(void * arg __unused,wait_result_t wres __unused)5675 panic_thread_test_child_park(void * arg __unused, wait_result_t wres __unused)
5676 {
5677 int event;
5678
5679 assert_wait(&event, THREAD_UNINT);
5680 semaphore_signal(sysctl_test_panic_with_thread_sem);
5681 thread_block(panic_thread_test_child_park);
5682 }
5683
5684 static int
5685 sysctl_test_panic_with_thread SYSCTL_HANDLER_ARGS
5686 {
5687 #pragma unused(arg1, arg2)
5688 int rval = 0;
5689 char str[16] = { '\0' };
5690 thread_t child_thread = THREAD_NULL;
5691
5692 rval = sysctl_handle_string(oidp, str, sizeof(str), req);
5693 if (rval != 0 || !req->newptr) {
5694 return EINVAL;
5695 }
5696
5697 semaphore_create(kernel_task, &sysctl_test_panic_with_thread_sem, SYNC_POLICY_FIFO, 0);
5698
5699 /* Create thread to spin or park in continuation */
5700 if (strncmp("spin", str, strlen("spin")) == 0) {
5701 if (kernel_thread_start(panic_thread_test_child_spin, NULL, &child_thread) != KERN_SUCCESS) {
5702 semaphore_destroy(kernel_task, sysctl_test_panic_with_thread_sem);
5703 return EBUSY;
5704 }
5705 } else if (strncmp("continuation", str, strlen("continuation")) == 0) {
5706 if (kernel_thread_start(panic_thread_test_child_park, NULL, &child_thread) != KERN_SUCCESS) {
5707 semaphore_destroy(kernel_task, sysctl_test_panic_with_thread_sem);
5708 return EBUSY;
5709 }
5710 } else {
5711 semaphore_destroy(kernel_task, sysctl_test_panic_with_thread_sem);
5712 return EINVAL;
5713 }
5714
5715 semaphore_wait(sysctl_test_panic_with_thread_sem);
5716
5717 panic_with_thread_context(0, NULL, 0, child_thread, "testing panic_with_thread_context for thread %p", child_thread);
5718
5719 /* Not reached */
5720 return EINVAL;
5721 }
5722
5723 SYSCTL_PROC(_kern, OID_AUTO, test_panic_with_thread,
5724 CTLFLAG_MASKED | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLFLAG_WR | CTLTYPE_STRING,
5725 0, 0, sysctl_test_panic_with_thread, "A", "test panic flow for backtracing a different thread");
5726 #endif /* defined (__x86_64__) */
5727
5728 #endif /* DEVELOPMENT || DEBUG */
5729
5730 static int
5731 sysctl_get_owned_vmobjects SYSCTL_HANDLER_ARGS
5732 {
5733 #pragma unused(oidp, arg1, arg2)
5734
5735 /* validate */
5736 if (req->newlen != sizeof(mach_port_name_t) || req->newptr == USER_ADDR_NULL ||
5737 req->oldidx != 0 || req->newidx != 0 || req->p == NULL ||
5738 (req->oldlen == 0 && req->oldptr != USER_ADDR_NULL)) {
5739 return EINVAL;
5740 }
5741
5742 int error;
5743 mach_port_name_t task_port_name;
5744 task_t task;
5745 size_t buffer_size = (req->oldptr != USER_ADDR_NULL) ? req->oldlen : 0;
5746 vmobject_list_output_t buffer = NULL;
5747 size_t output_size;
5748 size_t entries;
5749
5750 /* we have a "newptr" (for write) we get a task port name from the caller. */
5751 error = SYSCTL_IN(req, &task_port_name, sizeof(mach_port_name_t));
5752
5753 if (error != 0) {
5754 goto sysctl_get_vmobject_list_exit;
5755 }
5756
5757 task = port_name_to_task_read(task_port_name);
5758 if (task == TASK_NULL) {
5759 error = ESRCH;
5760 goto sysctl_get_vmobject_list_exit;
5761 }
5762
5763 bool corpse = is_corpsetask(task);
5764
5765 /* get the current size */
5766 size_t max_size;
5767 task_get_owned_vmobjects(task, 0, NULL, &max_size, &entries);
5768
5769 if (buffer_size && (buffer_size < sizeof(*buffer) + sizeof(vm_object_query_data_t))) {
5770 error = ENOMEM;
5771 goto sysctl_get_vmobject_list_deallocate_and_exit;
5772 }
5773
5774 if (corpse == false) {
5775 /* copy the vmobjects and vmobject data out of the task */
5776 if (buffer_size == 0) {
5777 output_size = max_size;
5778 } else {
5779 buffer_size = (buffer_size > max_size) ? max_size : buffer_size;
5780 buffer = (struct _vmobject_list_output_ *)kalloc_data(buffer_size, Z_WAITOK);
5781
5782 if (!buffer) {
5783 error = ENOMEM;
5784 goto sysctl_get_vmobject_list_deallocate_and_exit;
5785 }
5786
5787 task_get_owned_vmobjects(task, buffer_size, buffer, &output_size, &entries);
5788 }
5789
5790 /* req->oldptr should be USER_ADDR_NULL if buffer == NULL and return the current size */
5791 /* otherwise copy buffer to oldptr and return the bytes copied */
5792 error = SYSCTL_OUT(req, (char *)buffer, output_size);
5793 } else {
5794 vmobject_list_output_t list;
5795
5796 task_get_corpse_vmobject_list(task, &list, &max_size);
5797 assert(buffer == NULL);
5798
5799 /* copy corpse_vmobject_list to output buffer to avoid double copy */
5800 if (buffer_size) {
5801 size_t temp_size;
5802
5803 temp_size = buffer_size > max_size ? max_size : buffer_size;
5804 output_size = temp_size - sizeof(*buffer);
5805 /* whole multiple of vm_object_query_data_t */
5806 output_size = (output_size / sizeof(vm_object_query_data_t)) * sizeof(vm_object_query_data_t) + sizeof(*buffer);
5807 buffer = list;
5808 } else {
5809 output_size = max_size;
5810 }
5811
5812 /* req->oldptr should be USER_ADDR_NULL if buffer == NULL and return the current size */
5813 /* otherwise copy buffer to oldptr and return the bytes copied */
5814 error = SYSCTL_OUT(req, (char*)buffer, output_size);
5815 buffer = NULL;
5816 }
5817
5818 sysctl_get_vmobject_list_deallocate_and_exit:
5819 task_deallocate(task);
5820
5821 sysctl_get_vmobject_list_exit:
5822 if (buffer) {
5823 kfree_data(buffer, buffer_size);
5824 }
5825
5826 return error;
5827 }
5828
5829 SYSCTL_PROC(_vm, OID_AUTO, get_owned_vmobjects,
5830 CTLTYPE_OPAQUE | CTLFLAG_RD | CTLFLAG_WR | CTLFLAG_MASKED | CTLFLAG_KERN | CTLFLAG_LOCKED | CTLFLAG_ANYBODY,
5831 0, 0, sysctl_get_owned_vmobjects, "A", "get owned vmobjects in task");
5832
5833 extern uint64_t num_static_scalable_counters;
5834 SYSCTL_QUAD(_kern, OID_AUTO, num_static_scalable_counters, CTLFLAG_RD | CTLFLAG_LOCKED, &num_static_scalable_counters, "");
5835
5836 #if SCHED_HYGIENE_DEBUG
5837 TUNABLE_DT(bool, sched_hygiene_nonspec_tb, "machine-timeouts", "nonspec-tb", "sched-hygiene-nonspec-tb", false, TUNABLE_DT_NONE);
5838 #endif /* SCHED_HYGIENE_DEBUG */
5839
5840 uuid_string_t trial_treatment_id;
5841 uuid_string_t trial_experiment_id;
5842 int trial_deployment_id = -1;
5843
5844 SYSCTL_STRING(_kern, OID_AUTO, trial_treatment_id, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY | CTLFLAG_EXPERIMENT, trial_treatment_id, sizeof(trial_treatment_id), "");
5845 SYSCTL_STRING(_kern, OID_AUTO, trial_experiment_id, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY | CTLFLAG_EXPERIMENT, trial_experiment_id, sizeof(trial_experiment_id), "");
5846 SYSCTL_INT(_kern, OID_AUTO, trial_deployment_id, CTLFLAG_RW | CTLFLAG_LOCKED | CTLFLAG_ANYBODY | CTLFLAG_EXPERIMENT, &trial_deployment_id, 0, "");
5847
5848 #if (DEVELOPMENT || DEBUG)
5849 /* For unit testing setting factors & limits. */
5850 unsigned int testing_experiment_factor;
5851 EXPERIMENT_FACTOR_UINT(_kern, testing_experiment_factor, &testing_experiment_factor, 5, 10, "");
5852
5853 extern int exception_log_max_pid;
5854 SYSCTL_INT(_debug, OID_AUTO, exception_log_max_pid, CTLFLAG_RW | CTLFLAG_LOCKED, &exception_log_max_pid, 0, "Log exceptions for all processes up to this pid");
5855 #endif /* (DEVELOPMENT || DEBUG) */
5856
5857 #if DEVELOPMENT || DEBUG
5858 static int
5859 unlink_kernelcore_sysctl SYSCTL_HANDLER_ARGS
5860 {
5861 if (!req->newptr) {
5862 return EINVAL;
5863 }
5864 void IOBSDLowSpaceUnlinkKernelCore(void);
5865 IOBSDLowSpaceUnlinkKernelCore();
5866 return 0;
5867 }
5868
5869 SYSCTL_PROC(_kern, OID_AUTO, unlink_kernelcore,
5870 CTLTYPE_INT | CTLFLAG_WR | CTLFLAG_LOCKED | CTLFLAG_MASKED, 0, 0,
5871 unlink_kernelcore_sysctl, "-", "unlink the kernelcore file");
5872 #endif /* DEVELOPMENT || DEBUG */
5873
5874 #if CONFIG_IOTRACE
5875 #pragma clang diagnostic push
5876 #pragma clang diagnostic ignored "-Wcast-qual"
5877 SYSCTL_INT(_debug, OID_AUTO, MMIOtrace,
5878 CTLFLAG_KERN | CTLFLAG_RW | CTLFLAG_LOCKED,
5879 (int *)&mmiotrace_enabled, 0, "");
5880 #pragma clang diagnostic pop
5881 #endif /* CONFIG_IOTRACE */
5882