1 /*
2 * Copyright (c) 2013-2020 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28
29 #include <mach/mach_types.h>
30 #include <mach/vm_param.h>
31 #include <mach/mach_vm.h>
32 #include <mach/clock_types.h>
33 #include <sys/errno.h>
34 #include <sys/stackshot.h>
35 #ifdef IMPORTANCE_INHERITANCE
36 #include <ipc/ipc_importance.h>
37 #endif
38 #include <sys/appleapiopts.h>
39 #include <kern/debug.h>
40 #include <kern/block_hint.h>
41 #include <uuid/uuid.h>
42
43 #include <kdp/kdp_dyld.h>
44 #include <kdp/kdp_en_debugger.h>
45 #include <kdp/processor_core.h>
46 #include <kdp/kdp_common.h>
47
48 #include <libsa/types.h>
49 #include <libkern/version.h>
50 #include <libkern/section_keywords.h>
51
52 #include <string.h> /* bcopy */
53
54 #include <kern/backtrace.h>
55 #include <kern/coalition.h>
56 #include <kern/processor.h>
57 #include <kern/host_statistics.h>
58 #include <kern/counter.h>
59 #include <kern/thread.h>
60 #include <kern/thread_group.h>
61 #include <kern/task.h>
62 #include <kern/telemetry.h>
63 #include <kern/clock.h>
64 #include <kern/policy_internal.h>
65 #include <kern/socd_client.h>
66 #include <vm/vm_map.h>
67 #include <vm/vm_kern.h>
68 #include <vm/vm_pageout.h>
69 #include <vm/vm_fault.h>
70 #include <vm/vm_shared_region.h>
71 #include <vm/vm_compressor.h>
72 #include <libkern/OSKextLibPrivate.h>
73 #include <os/log.h>
74
75 #if defined(__x86_64__)
76 #include <i386/mp.h>
77 #include <i386/cpu_threads.h>
78 #endif
79
80 #include <pexpert/pexpert.h>
81
82 #if CONFIG_PERVASIVE_CPI
83 #include <kern/monotonic.h>
84 #endif /* CONFIG_PERVASIVE_CPI */
85
86 #include <san/kasan.h>
87
88 #if DEBUG || DEVELOPMENT
89 # define STACKSHOT_COLLECTS_LATENCY_INFO 1
90 #else
91 # define STACKSHOT_COLLECTS_LATENCY_INFO 0
92 #endif /* DEBUG || DEVELOPMENT */
93
94 extern unsigned int not_in_kdp;
95
96 /* indicate to the compiler that some accesses are unaligned */
97 typedef uint64_t unaligned_u64 __attribute__((aligned(1)));
98
99 int kdp_snapshot = 0;
100 static kern_return_t stack_snapshot_ret = 0;
101 static uint32_t stack_snapshot_bytes_traced = 0;
102 static uint32_t stack_snapshot_bytes_uncompressed = 0;
103
104 #if STACKSHOT_COLLECTS_LATENCY_INFO
105 static bool collect_latency_info = true;
106 #endif
107 static kcdata_descriptor_t stackshot_kcdata_p = NULL;
108 static void *stack_snapshot_buf;
109 static uint32_t stack_snapshot_bufsize;
110 int stack_snapshot_pid;
111 static uint64_t stack_snapshot_flags;
112 static uint64_t stack_snapshot_delta_since_timestamp;
113 static uint32_t stack_snapshot_pagetable_mask;
114 static boolean_t panic_stackshot;
115
116 static boolean_t stack_enable_faulting = FALSE;
117 static struct stackshot_fault_stats fault_stats;
118
119 static uint64_t stackshot_last_abs_start; /* start time of last stackshot */
120 static uint64_t stackshot_last_abs_end; /* end time of last stackshot */
121 static uint64_t stackshots_taken; /* total stackshots taken since boot */
122 static uint64_t stackshots_duration; /* total abs time spent in stackshot_trap() since boot */
123
124 /*
125  * Experimentally, our current estimates are 20% short 96% of the time; adjusting
126  * up by 40% gets us into 99.9%+ territory. In the longer run, we need to make stackshot
127 * estimates use a better approach (rdar://78880038); this is intended to be a
128 * short-term fix.
129 */
130 uint32_t stackshot_estimate_adj = 40; /* experiment factor: 0-100, adjust our estimate up by this amount */
131
132 static uint32_t stackshot_initial_estimate;
133 static uint32_t stackshot_initial_estimate_adj;
134 static uint64_t stackshot_duration_prior_abs; /* prior attempts, abs */
135 static unaligned_u64 * stackshot_duration_outer;
136 static uint64_t stackshot_microsecs;
137
138 void * kernel_stackshot_buf = NULL; /* Pointer to buffer for stackshots triggered from the kernel and retrieved later */
139 int kernel_stackshot_buf_size = 0;
140
141 void * stackshot_snapbuf = NULL; /* Used by stack_snapshot2 (to be removed) */
142
143 __private_extern__ void stackshot_init( void );
144 static boolean_t memory_iszero(void *addr, size_t size);
145 uint32_t get_stackshot_estsize(uint32_t prev_size_hint, uint32_t adj);
146 kern_return_t kern_stack_snapshot_internal(int stackshot_config_version, void *stackshot_config,
147 size_t stackshot_config_size, boolean_t stackshot_from_user);
148 kern_return_t do_stackshot(void *);
149 void kdp_snapshot_preflight(int pid, void * tracebuf, uint32_t tracebuf_size, uint64_t flags, kcdata_descriptor_t data_p, uint64_t since_timestamp, uint32_t pagetable_mask);
150 boolean_t stackshot_thread_is_idle_worker_unsafe(thread_t thread);
151 static int kdp_stackshot_kcdata_format(int pid, uint64_t trace_flags, uint32_t *pBytesTraced, uint32_t *pBytesUncompressed);
152 uint32_t kdp_stack_snapshot_bytes_traced(void);
153 uint32_t kdp_stack_snapshot_bytes_uncompressed(void);
154 static void kdp_mem_and_io_snapshot(struct mem_and_io_snapshot *memio_snap);
155 static vm_offset_t stackshot_find_phys(vm_map_t map, vm_offset_t target_addr, kdp_fault_flags_t fault_flags, uint32_t *kdp_fault_result_flags);
156 static boolean_t stackshot_copyin(vm_map_t map, uint64_t uaddr, void *dest, size_t size, boolean_t try_fault, uint32_t *kdp_fault_result);
157 static int stackshot_copyin_string(task_t task, uint64_t addr, char *buf, int buf_sz, boolean_t try_fault, uint32_t *kdp_fault_results);
158 static boolean_t stackshot_copyin_word(task_t task, uint64_t addr, uint64_t *result, boolean_t try_fault, uint32_t *kdp_fault_results);
159 static uint64_t proc_was_throttled_from_task(task_t task);
160 static void stackshot_thread_wait_owner_info(thread_t thread, thread_waitinfo_v2_t * waitinfo);
161 static int stackshot_thread_has_valid_waitinfo(thread_t thread);
162 static void stackshot_thread_turnstileinfo(thread_t thread, thread_turnstileinfo_v2_t *tsinfo);
163 static int stackshot_thread_has_valid_turnstileinfo(thread_t thread);
164
165 #if CONFIG_COALITIONS
166 static void stackshot_coalition_jetsam_count(void *arg, int i, coalition_t coal);
167 static void stackshot_coalition_jetsam_snapshot(void *arg, int i, coalition_t coal);
168 #endif /* CONFIG_COALITIONS */
169
170 #if CONFIG_THREAD_GROUPS
171 static void stackshot_thread_group_count(void *arg, int i, struct thread_group *tg);
172 static void stackshot_thread_group_snapshot(void *arg, int i, struct thread_group *tg);
173 #endif /* CONFIG_THREAD_GROUPS */
174
175 extern uint32_t workqueue_get_pwq_state_kdp(void *proc);
176
177 struct proc;
178 extern int proc_pid(struct proc *p);
179 extern uint64_t proc_uniqueid(void *p);
180 extern uint64_t proc_was_throttled(void *p);
181 extern uint64_t proc_did_throttle(void *p);
182 extern int proc_exiting(void *p);
183 extern int proc_in_teardown(void *p);
184 static uint64_t proc_did_throttle_from_task(task_t task);
185 extern void proc_name_kdp(struct proc *p, char * buf, int size);
186 extern int proc_threadname_kdp(void * uth, char * buf, size_t size);
187 extern void proc_starttime_kdp(void * p, uint64_t * tv_sec, uint64_t * tv_usec, uint64_t * abstime);
188 extern void proc_archinfo_kdp(void* p, cpu_type_t* cputype, cpu_subtype_t* cpusubtype);
189 extern uint64_t proc_getcsflags_kdp(void * p);
190 extern boolean_t proc_binary_uuid_kdp(task_t task, uuid_t uuid);
191 extern int memorystatus_get_pressure_status_kdp(void);
192 extern void memorystatus_proc_flags_unsafe(void * v, boolean_t *is_dirty, boolean_t *is_dirty_tracked, boolean_t *allow_idle_exit);
193
194 extern int count_busy_buffers(void); /* must track with declaration in bsd/sys/buf_internal.h */
195
196 #if CONFIG_TELEMETRY
197 extern kern_return_t stack_microstackshot(user_addr_t tracebuf, uint32_t tracebuf_size, uint32_t flags, int32_t *retval);
198 #endif /* CONFIG_TELEMETRY */
199
200 extern kern_return_t kern_stack_snapshot_with_reason(char* reason);
201 extern kern_return_t kern_stack_snapshot_internal(int stackshot_config_version, void *stackshot_config, size_t stackshot_config_size, boolean_t stackshot_from_user);
202
203 static size_t stackshot_plh_est_size(void);
204
205 /*
206 * Validates that the given address for a word is both a valid page and has
207 * default caching attributes for the current map.
208 */
209 bool machine_trace_thread_validate_kva(vm_offset_t);
210 /*
211 * Validates a region that stackshot will potentially inspect.
212 */
213 static bool _stackshot_validate_kva(vm_offset_t, size_t);
214 /*
215 * Must be called whenever stackshot is re-driven.
216 */
217 static void _stackshot_validation_reset(void);
218 /*
219 * A kdp-safe strlen() call. Returns:
220 * -1 if we reach maxlen or a bad address before the end of the string, or
221 * strlen(s)
222 */
223 static long _stackshot_strlen(const char *s, size_t maxlen);
224
225 #define MAX_FRAMES 1000
226 #define MAX_LOADINFOS 500
227 #define MAX_DYLD_COMPACTINFO (20 * 1024) // max bytes of compactinfo to include per proc/shared region
228 #define TASK_IMP_WALK_LIMIT 20
229
230 typedef struct thread_snapshot *thread_snapshot_t;
231 typedef struct task_snapshot *task_snapshot_t;
232
233 #if CONFIG_KDP_INTERACTIVE_DEBUGGING
234 extern kdp_send_t kdp_en_send_pkt;
235 #endif
236
237 /*
238 * Stackshot locking and other defines.
239 */
240 static LCK_GRP_DECLARE(stackshot_subsys_lck_grp, "stackshot_subsys_lock");
241 static LCK_MTX_DECLARE(stackshot_subsys_mutex, &stackshot_subsys_lck_grp);
242
243 #define STACKSHOT_SUBSYS_LOCK() lck_mtx_lock(&stackshot_subsys_mutex)
244 #define STACKSHOT_SUBSYS_TRY_LOCK() lck_mtx_try_lock(&stackshot_subsys_mutex)
245 #define STACKSHOT_SUBSYS_UNLOCK() lck_mtx_unlock(&stackshot_subsys_mutex)
246
247 #define SANE_BOOTPROFILE_TRACEBUF_SIZE (64ULL * 1024ULL * 1024ULL)
248 #define SANE_TRACEBUF_SIZE (8ULL * 1024ULL * 1024ULL)
249
250 #define TRACEBUF_SIZE_PER_GB (1024ULL * 1024ULL)
251 #define GIGABYTES (1024ULL * 1024ULL * 1024ULL)
252
253 SECURITY_READ_ONLY_LATE(static uint32_t) max_tracebuf_size = SANE_TRACEBUF_SIZE;
254
255 /*
256 * We currently set a ceiling of 3 milliseconds spent in the kdp fault path
257 * for non-panic stackshots where faulting is requested.
258 */
259 #define KDP_FAULT_PATH_MAX_TIME_PER_STACKSHOT_NSECS (3 * NSEC_PER_MSEC)
260
261 #define STACKSHOT_SUPP_SIZE (16 * 1024) /* Minimum stackshot size */
262 #define TASK_UUID_AVG_SIZE (16 * sizeof(uuid_t)) /* Average space consumed by UUIDs/task */
263
264 #ifndef ROUNDUP
265 #define ROUNDUP(x, y) ((((x)+(y)-1)/(y))*(y))
266 #endif
267
268 #define STACKSHOT_QUEUE_LABEL_MAXSIZE 64
269
270 /*
271 * Initialize the mutex governing access to the stack snapshot subsystem
272 * and other stackshot related bits.
273 */
274 __private_extern__ void
275 stackshot_init( void )
276 {
277 mach_timebase_info_data_t timebase;
278
279 clock_timebase_info(&timebase);
280 fault_stats.sfs_system_max_fault_time = ((KDP_FAULT_PATH_MAX_TIME_PER_STACKSHOT_NSECS * timebase.denom) / timebase.numer);
281
282 max_tracebuf_size = MAX(max_tracebuf_size, ((ROUNDUP(max_mem, GIGABYTES) / GIGABYTES) * TRACEBUF_SIZE_PER_GB));
283
284 PE_parse_boot_argn("stackshot_maxsz", &max_tracebuf_size, sizeof(max_tracebuf_size));
285 }
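
/*
 * Worked example (illustrative; actual timebase values differ by platform):
 * with a hypothetical mach_timebase_info of numer = 125, denom = 3, the 3 ms
 * fault-path budget above converts to
 *     (3,000,000 ns * 3) / 125 = 72,000 absolute-time units,
 * which is the value stored in fault_stats.sfs_system_max_fault_time.
 */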
286
287 /*
288 * Called with interrupts disabled after stackshot context has been
289 * initialized. Updates stack_snapshot_ret.
290 */
291 static kern_return_t
292 stackshot_trap(void)
293 {
294 kern_return_t rv;
295
296 #if defined(__x86_64__)
297 /*
298 * Since mp_rendezvous and stackshot both attempt to capture CPUs and then
299 * perform an operation, each mechanism must be excluded while the other is
300 * in progress, lest there be a deadlock as the two mechanisms race to
301 * capture CPUs.
302 *
303 * Further, we assert that invoking stackshot from mp_rendezvous*() is not
304 * allowed, so we check to ensure there is no rendezvous in progress before
305 * trying to grab the lock (if there is, a deadlock will occur when we try to
306 * grab the lock). This is accomplished by setting cpu_rendezvous_in_progress to
307 * TRUE in the mp rendezvous action function. If stackshot_trap() is called
308 * from within the call chain of the mp rendezvous action, this flag will
309 * be set and can be used to detect the inevitable deadlock that would occur
310 * if this thread tried to grab the rendezvous lock.
311 */
312
313 if (current_cpu_datap()->cpu_rendezvous_in_progress == TRUE) {
314 panic("Calling stackshot from a rendezvous is not allowed!");
315 }
316
317 mp_rendezvous_lock();
318 #endif
319
320 stackshot_last_abs_start = mach_absolute_time();
321 stackshot_last_abs_end = 0;
322
323 rv = DebuggerTrapWithState(DBOP_STACKSHOT, NULL, NULL, NULL, 0, NULL, FALSE, 0);
324
325 stackshot_last_abs_end = mach_absolute_time();
326 stackshots_taken++;
327 stackshots_duration += (stackshot_last_abs_end - stackshot_last_abs_start);
328
329 #if defined(__x86_64__)
330 mp_rendezvous_unlock();
331 #endif
332 return rv;
333 }
334
335 extern void stackshot_get_timing(uint64_t *last_abs_start, uint64_t *last_abs_end, uint64_t *count, uint64_t *total_duration);
336 void
337 stackshot_get_timing(uint64_t *last_abs_start, uint64_t *last_abs_end, uint64_t *count, uint64_t *total_duration)
338 {
339 STACKSHOT_SUBSYS_LOCK();
340 *last_abs_start = stackshot_last_abs_start;
341 *last_abs_end = stackshot_last_abs_end;
342 *count = stackshots_taken;
343 *total_duration = stackshots_duration;
344 STACKSHOT_SUBSYS_UNLOCK();
345 }
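
/*
 * A minimal sketch (not part of this file's build) of a consumer of
 * stackshot_get_timing(): it converts the accumulated duration counter into an
 * average per-stackshot time in nanoseconds. absolutetime_to_nanoseconds() is
 * the standard kern/clock.h conversion; the helper name is hypothetical.
 */
#if 0
static uint64_t
example_avg_stackshot_ns(void)
{
	uint64_t start, end, count, total_abs, total_ns = 0;

	stackshot_get_timing(&start, &end, &count, &total_abs);
	if (count == 0) {
		return 0;
	}
	absolutetime_to_nanoseconds(total_abs, &total_ns);
	return total_ns / count;        /* mean time spent in stackshot_trap() */
}
#endif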
346
347 kern_return_t
348 stack_snapshot_from_kernel(int pid, void *buf, uint32_t size, uint64_t flags, uint64_t delta_since_timestamp, uint32_t pagetable_mask, unsigned *bytes_traced)
349 {
350 kern_return_t error = KERN_SUCCESS;
351 boolean_t istate;
352
353 #if DEVELOPMENT || DEBUG
354 if (kern_feature_override(KF_STACKSHOT_OVRD) == TRUE) {
355 return KERN_NOT_SUPPORTED;
356 }
357 #endif
358 if ((buf == NULL) || (size <= 0) || (bytes_traced == NULL)) {
359 return KERN_INVALID_ARGUMENT;
360 }
361
362 /* cap an individual stackshot to max_tracebuf_size */
363 if (size > max_tracebuf_size) {
364 size = max_tracebuf_size;
365 }
366
367 /* Serialize tracing */
368 if (flags & STACKSHOT_TRYLOCK) {
369 if (!STACKSHOT_SUBSYS_TRY_LOCK()) {
370 return KERN_LOCK_OWNED;
371 }
372 } else {
373 STACKSHOT_SUBSYS_LOCK();
374 }
375
376 struct kcdata_descriptor kcdata;
377 uint32_t hdr_tag = (flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) ?
378 KCDATA_BUFFER_BEGIN_DELTA_STACKSHOT : KCDATA_BUFFER_BEGIN_STACKSHOT;
379
380 error = kcdata_memory_static_init(&kcdata, (mach_vm_address_t)buf, hdr_tag, size,
381 KCFLAG_USE_MEMCOPY | KCFLAG_NO_AUTO_ENDBUFFER);
382 if (error) {
383 goto out;
384 }
385
386 stackshot_initial_estimate = 0;
387 stackshot_duration_prior_abs = 0;
388 stackshot_duration_outer = NULL;
389
390 KDBG_RELEASE(MACHDBG_CODE(DBG_MACH_STACKSHOT, STACKSHOT_KERN_RECORD) | DBG_FUNC_START,
391 flags, size, pid, delta_since_timestamp);
392
393 istate = ml_set_interrupts_enabled(FALSE);
394 uint64_t time_start = mach_absolute_time();
395
396 /* Emit a SOCD tracepoint that we are initiating a stackshot */
397 SOCD_TRACE_XNU_START(STACKSHOT);
398
399 /* Preload trace parameters */
400 kdp_snapshot_preflight(pid, buf, size, flags, &kcdata,
401 delta_since_timestamp, pagetable_mask);
402
403 /*
404 * Trap to the debugger to obtain a coherent stack snapshot; this populates
405 * the trace buffer
406 */
407 error = stackshot_trap();
408
409 uint64_t time_end = mach_absolute_time();
410
411 /* Emit a SOCD tracepoint that we have completed the stackshot */
412 SOCD_TRACE_XNU_END(STACKSHOT);
413
414 ml_set_interrupts_enabled(istate);
415
416 if (stackshot_duration_outer) {
417 *stackshot_duration_outer = time_end - time_start;
418 }
419 *bytes_traced = kdp_stack_snapshot_bytes_traced();
420
421 KDBG_RELEASE(MACHDBG_CODE(DBG_MACH_STACKSHOT, STACKSHOT_KERN_RECORD) | DBG_FUNC_END,
422 error, (time_end - time_start), size, *bytes_traced);
423 out:
424 stackshot_kcdata_p = NULL;
425 STACKSHOT_SUBSYS_UNLOCK();
426 return error;
427 }
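
/*
 * A minimal sketch (not part of this file's build) of how a kernel subsystem
 * might call stack_snapshot_from_kernel(). The flag combination, buffer size,
 * and helper name are illustrative; the allocation calls mirror the ones used
 * elsewhere in this file.
 */
#if 0
static kern_return_t
example_capture_stackshot(void)
{
	vm_offset_t buf = 0;
	uint32_t bufsize = 1024 * 1024;              /* 1 MiB scratch buffer */
	unsigned bytes_traced = 0;
	kern_return_t kr;

	kr = kmem_alloc(kernel_map, &buf, bufsize, KMA_ZERO | KMA_DATA,
	    VM_KERN_MEMORY_DIAG);
	if (kr != KERN_SUCCESS) {
		return kr;
	}

	/* pid -1 targets all processes; STACKSHOT_TRYLOCK avoids blocking on the subsys mutex */
	kr = stack_snapshot_from_kernel(-1, (void *)buf, bufsize,
	    STACKSHOT_KCDATA_FORMAT | STACKSHOT_SAVE_LOADINFO | STACKSHOT_TRYLOCK,
	    0, 0, &bytes_traced);
	if (kr == KERN_SUCCESS) {
		/* bytes_traced bytes of kcdata are now in buf */
	}

	kmem_free(kernel_map, buf, bufsize);
	return kr;
}
#endif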
428
429 #if CONFIG_TELEMETRY
430 kern_return_t
431 stack_microstackshot(user_addr_t tracebuf, uint32_t tracebuf_size, uint32_t flags, int32_t *retval)
432 {
433 int error = KERN_SUCCESS;
434 uint32_t bytes_traced = 0;
435
436 *retval = -1;
437
438 /*
439 * Control related operations
440 */
441 if (flags & STACKSHOT_GLOBAL_MICROSTACKSHOT_ENABLE) {
442 telemetry_global_ctl(1);
443 *retval = 0;
444 goto exit;
445 } else if (flags & STACKSHOT_GLOBAL_MICROSTACKSHOT_DISABLE) {
446 telemetry_global_ctl(0);
447 *retval = 0;
448 goto exit;
449 }
450
451 /*
452 * Data related operations
453 */
454 *retval = -1;
455
456 if ((((void*)tracebuf) == NULL) || (tracebuf_size == 0)) {
457 error = KERN_INVALID_ARGUMENT;
458 goto exit;
459 }
460
461 STACKSHOT_SUBSYS_LOCK();
462
463 if (flags & STACKSHOT_GET_MICROSTACKSHOT) {
464 if (tracebuf_size > max_tracebuf_size) {
465 error = KERN_INVALID_ARGUMENT;
466 goto unlock_exit;
467 }
468
469 bytes_traced = tracebuf_size;
470 error = telemetry_gather(tracebuf, &bytes_traced,
471 (flags & STACKSHOT_SET_MICROSTACKSHOT_MARK) ? true : false);
472 *retval = (int)bytes_traced;
473 goto unlock_exit;
474 }
475
476 unlock_exit:
477 STACKSHOT_SUBSYS_UNLOCK();
478 exit:
479 return error;
480 }
481 #endif /* CONFIG_TELEMETRY */
482
483 /*
484 * Return the estimated size of a stackshot based on the
485 * number of currently running threads and tasks.
486 *
487 * adj is an adjustment in units of percentage
488 *
489 * This function is mostly unhinged from reality; struct thread_snapshot and
490 * struct task_snapshot are legacy, much larger versions of the structures we
491 * actually use, and there's no accounting for how we actually generate
492 * task & thread information. rdar://78880038 intends to replace this all.
493 */
494 uint32_t
495 get_stackshot_estsize(uint32_t prev_size_hint, uint32_t adj)
496 {
497 vm_size_t thread_total;
498 vm_size_t task_total;
499 uint64_t size;
500 uint32_t estimated_size;
501 size_t est_thread_size = sizeof(struct thread_snapshot);
502 size_t est_task_size = sizeof(struct task_snapshot) + TASK_UUID_AVG_SIZE;
503
504 adj = MIN(adj, 100u); /* no more than double our estimate */
505
506 #if STACKSHOT_COLLECTS_LATENCY_INFO
507 if (collect_latency_info) {
508 est_thread_size += sizeof(struct stackshot_latency_thread);
509 est_task_size += sizeof(struct stackshot_latency_task);
510 }
511 #endif
512
513 thread_total = (threads_count * est_thread_size);
514 task_total = (tasks_count * est_task_size);
515
516 size = thread_total + task_total + STACKSHOT_SUPP_SIZE; /* estimate */
517 size += (size * adj) / 100; /* add adj */
518 size = MAX(size, prev_size_hint); /* allow hint to increase */
519 size += stackshot_plh_est_size(); /* add space for the port label hash */
520 size = MIN(size, VM_MAP_TRUNC_PAGE(UINT32_MAX, PAGE_MASK)); /* avoid overflow */
521 estimated_size = (uint32_t) VM_MAP_ROUND_PAGE(size, PAGE_MASK); /* round to pagesize */
522
523 return estimated_size;
524 }
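
/*
 * Worked example (symbolic, since the struct sizes are platform-dependent):
 * with T threads, K tasks, and adj = 40, the estimate is roughly
 *     T * sizeof(struct thread_snapshot)
 *   + K * (sizeof(struct task_snapshot) + TASK_UUID_AVG_SIZE)
 *   + STACKSHOT_SUPP_SIZE,
 * increased by 40%, raised to at least prev_size_hint, padded for the port
 * label hash, and rounded up to a page boundary.
 */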
525
526 /*
527 * stackshot_remap_buffer: Utility function to remap bytes_traced bytes starting at stackshotbuf
528 * into the current task's user space and subsequently copy out the address
529 * at which the buffer has been mapped in user space to out_buffer_addr.
530 *
531 * Inputs: stackshotbuf - pointer to the original buffer in the kernel's address space
532 * bytes_traced - length of the buffer to remap starting from stackshotbuf
533 * out_buffer_addr - user address to be filled in with the address of the newly mapped buffer
534 * out_size_addr - pointer to be filled in with the size of the buffer
535 *
536 * Outputs: ENOSPC if there is not enough free space in the task's address space to remap the buffer
537 * EINVAL for all other errors returned by task_remap_buffer/mach_vm_remap
538 * an error from copyout
539 */
540 static kern_return_t
541 stackshot_remap_buffer(void *stackshotbuf, uint32_t bytes_traced, uint64_t out_buffer_addr, uint64_t out_size_addr)
542 {
543 int error = 0;
544 mach_vm_offset_t stackshotbuf_user_addr = (mach_vm_offset_t)NULL;
545 vm_prot_t cur_prot, max_prot;
546
547 error = mach_vm_remap_kernel(get_task_map(current_task()), &stackshotbuf_user_addr, bytes_traced, 0,
548 VM_FLAGS_ANYWHERE, VM_KERN_MEMORY_NONE, kernel_map, (mach_vm_offset_t)stackshotbuf, FALSE, &cur_prot, &max_prot, VM_INHERIT_DEFAULT);
549 /*
550 * If the call to mach_vm_remap fails, we return the appropriate converted error
551 */
552 if (error == KERN_SUCCESS) {
553 /*
554 * If we fail to copy out the address or size of the new buffer, we remove the buffer mapping that
555 * we just made in the task's user space.
556 */
557 error = copyout(CAST_DOWN(void *, &stackshotbuf_user_addr), (user_addr_t)out_buffer_addr, sizeof(stackshotbuf_user_addr));
558 if (error != KERN_SUCCESS) {
559 mach_vm_deallocate(get_task_map(current_task()), stackshotbuf_user_addr, (mach_vm_size_t)bytes_traced);
560 return error;
561 }
562 error = copyout(&bytes_traced, (user_addr_t)out_size_addr, sizeof(bytes_traced));
563 if (error != KERN_SUCCESS) {
564 mach_vm_deallocate(get_task_map(current_task()), stackshotbuf_user_addr, (mach_vm_size_t)bytes_traced);
565 return error;
566 }
567 }
568 return error;
569 }
570
571 kern_return_t
572 kern_stack_snapshot_internal(int stackshot_config_version, void *stackshot_config, size_t stackshot_config_size, boolean_t stackshot_from_user)
573 {
574 int error = 0;
575 boolean_t prev_interrupt_state;
576 uint32_t bytes_traced = 0;
577 uint32_t stackshot_estimate = 0;
578 uint32_t stackshotbuf_size = 0;
579 void * stackshotbuf = NULL;
580 kcdata_descriptor_t kcdata_p = NULL;
581
582 void * buf_to_free = NULL;
583 int size_to_free = 0;
584 bool is_traced = false; /* has FUNC_START tracepoint fired? */
585 uint64_t tot_interrupts_off_abs = 0; /* sum(time with interrupts off) */
586
587 /* Parsed arguments */
588 uint64_t out_buffer_addr;
589 uint64_t out_size_addr;
590 int pid = -1;
591 uint64_t flags;
592 uint64_t since_timestamp;
593 uint32_t size_hint = 0;
594 uint32_t pagetable_mask = STACKSHOT_PAGETABLES_MASK_ALL;
595
596 if (stackshot_config == NULL) {
597 return KERN_INVALID_ARGUMENT;
598 }
599 #if DEVELOPMENT || DEBUG
600 /* TBD: ask stackshot clients to avoid issuing stackshots in this
601 * configuration in lieu of the kernel feature override.
602 */
603 if (kern_feature_override(KF_STACKSHOT_OVRD) == TRUE) {
604 return KERN_NOT_SUPPORTED;
605 }
606 #endif
607
608 switch (stackshot_config_version) {
609 case STACKSHOT_CONFIG_TYPE:
610 if (stackshot_config_size != sizeof(stackshot_config_t)) {
611 return KERN_INVALID_ARGUMENT;
612 }
613 stackshot_config_t *config = (stackshot_config_t *) stackshot_config;
614 out_buffer_addr = config->sc_out_buffer_addr;
615 out_size_addr = config->sc_out_size_addr;
616 pid = config->sc_pid;
617 flags = config->sc_flags;
618 since_timestamp = config->sc_delta_timestamp;
619 if (config->sc_size <= max_tracebuf_size) {
620 size_hint = config->sc_size;
621 }
622 /*
623 * Retain the pre-sc_pagetable_mask behavior of STACKSHOT_PAGE_TABLES,
624 * dump every level if the pagetable_mask is not set
625 */
626 if (flags & STACKSHOT_PAGE_TABLES && config->sc_pagetable_mask) {
627 pagetable_mask = config->sc_pagetable_mask;
628 }
629 break;
630 default:
631 return KERN_NOT_SUPPORTED;
632 }
633
634 /*
635 * Currently saving a kernel buffer and trylock are only supported from the
636 * internal/KEXT API.
637 */
638 if (stackshot_from_user) {
639 if (flags & (STACKSHOT_TRYLOCK | STACKSHOT_SAVE_IN_KERNEL_BUFFER | STACKSHOT_FROM_PANIC)) {
640 return KERN_NO_ACCESS;
641 }
642 #if !DEVELOPMENT && !DEBUG
643 if (flags & (STACKSHOT_DO_COMPRESS)) {
644 return KERN_NO_ACCESS;
645 }
646 #endif
647 } else {
648 if (!(flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER)) {
649 return KERN_NOT_SUPPORTED;
650 }
651 }
652
653 if (!((flags & STACKSHOT_KCDATA_FORMAT) || (flags & STACKSHOT_RETRIEVE_EXISTING_BUFFER))) {
654 return KERN_NOT_SUPPORTED;
655 }
656
657 /* Compressed delta stackshots or page dumps are not yet supported */
658 if (((flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) || (flags & STACKSHOT_PAGE_TABLES))
659 && (flags & STACKSHOT_DO_COMPRESS)) {
660 return KERN_NOT_SUPPORTED;
661 }
662
663 /*
664 * If we're not saving the buffer in the kernel pointer, we need a place to copy into.
665 */
666 if ((!out_buffer_addr || !out_size_addr) && !(flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER)) {
667 return KERN_INVALID_ARGUMENT;
668 }
669
670 if (since_timestamp != 0 && ((flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) == 0)) {
671 return KERN_INVALID_ARGUMENT;
672 }
673
674 #if CONFIG_PERVASIVE_CPI && MONOTONIC
675 if (!mt_core_supported) {
676 flags &= ~STACKSHOT_INSTRS_CYCLES;
677 }
678 #else /* CONFIG_PERVASIVE_CPI && MONOTONIC */
679 flags &= ~STACKSHOT_INSTRS_CYCLES;
680 #endif /* !CONFIG_PERVASIVE_CPI || !MONOTONIC */
681
682 STACKSHOT_SUBSYS_LOCK();
683
684 if (flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER) {
685 /*
686 * Don't overwrite an existing stackshot
687 */
688 if (kernel_stackshot_buf != NULL) {
689 error = KERN_MEMORY_PRESENT;
690 goto error_exit;
691 }
692 } else if (flags & STACKSHOT_RETRIEVE_EXISTING_BUFFER) {
693 if ((kernel_stackshot_buf == NULL) || (kernel_stackshot_buf_size <= 0)) {
694 error = KERN_NOT_IN_SET;
695 goto error_exit;
696 }
697 error = stackshot_remap_buffer(kernel_stackshot_buf, kernel_stackshot_buf_size,
698 out_buffer_addr, out_size_addr);
699 /*
700 * If we successfully remapped the buffer into the user's address space, we
701 * set buf_to_free and size_to_free so the prior kernel mapping will be removed
702 * and then clear the kernel stackshot pointer and associated size.
703 */
704 if (error == KERN_SUCCESS) {
705 buf_to_free = kernel_stackshot_buf;
706 size_to_free = (int) VM_MAP_ROUND_PAGE(kernel_stackshot_buf_size, PAGE_MASK);
707 kernel_stackshot_buf = NULL;
708 kernel_stackshot_buf_size = 0;
709 }
710
711 goto error_exit;
712 }
713
714 if (flags & STACKSHOT_GET_BOOT_PROFILE) {
715 void *bootprofile = NULL;
716 uint32_t len = 0;
717 #if CONFIG_TELEMETRY
718 bootprofile_get(&bootprofile, &len);
719 #endif
720 if (!bootprofile || !len) {
721 error = KERN_NOT_IN_SET;
722 goto error_exit;
723 }
724 error = stackshot_remap_buffer(bootprofile, len, out_buffer_addr, out_size_addr);
725 goto error_exit;
726 }
727
728 stackshot_duration_prior_abs = 0;
729 stackshot_initial_estimate_adj = os_atomic_load(&stackshot_estimate_adj, relaxed);
730 stackshotbuf_size = stackshot_estimate =
731 get_stackshot_estsize(size_hint, stackshot_initial_estimate_adj);
732 stackshot_initial_estimate = stackshot_estimate;
733
734 KDBG_RELEASE(MACHDBG_CODE(DBG_MACH_STACKSHOT, STACKSHOT_RECORD) | DBG_FUNC_START,
735 flags, stackshotbuf_size, pid, since_timestamp);
736 is_traced = true;
737
738 for (; stackshotbuf_size <= max_tracebuf_size; stackshotbuf_size <<= 1) {
739 if (kmem_alloc(kernel_map, (vm_offset_t *)&stackshotbuf, stackshotbuf_size,
740 KMA_ZERO | KMA_DATA, VM_KERN_MEMORY_DIAG) != KERN_SUCCESS) {
741 error = KERN_RESOURCE_SHORTAGE;
742 goto error_exit;
743 }
744
745
746 uint32_t hdr_tag = (flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) ? KCDATA_BUFFER_BEGIN_DELTA_STACKSHOT
747 : (flags & STACKSHOT_DO_COMPRESS) ? KCDATA_BUFFER_BEGIN_COMPRESSED
748 : KCDATA_BUFFER_BEGIN_STACKSHOT;
749 kcdata_p = kcdata_memory_alloc_init((mach_vm_address_t)stackshotbuf, hdr_tag, stackshotbuf_size,
750 KCFLAG_USE_MEMCOPY | KCFLAG_NO_AUTO_ENDBUFFER);
751
752 stackshot_duration_outer = NULL;
753
754 /* if compression was requested, allocate the extra zlib scratch area */
755 if (flags & STACKSHOT_DO_COMPRESS) {
756 hdr_tag = (flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) ? KCDATA_BUFFER_BEGIN_DELTA_STACKSHOT
757 : KCDATA_BUFFER_BEGIN_STACKSHOT;
758 error = kcdata_init_compress(kcdata_p, hdr_tag, kdp_memcpy, KCDCT_ZLIB);
759 if (error != KERN_SUCCESS) {
760 os_log(OS_LOG_DEFAULT, "failed to initialize compression: %d!\n",
761 (int) error);
762 goto error_exit;
763 }
764 }
765
766 /*
767 * Disable interrupts and save the current interrupt state.
768 */
769 prev_interrupt_state = ml_set_interrupts_enabled(FALSE);
770 uint64_t time_start = mach_absolute_time();
771
772 /* Emit a SOCD tracepoint that we are initiating a stackshot */
773 SOCD_TRACE_XNU_START(STACKSHOT);
774
775 /*
776 * Load stackshot parameters.
777 */
778 kdp_snapshot_preflight(pid, stackshotbuf, stackshotbuf_size, flags, kcdata_p, since_timestamp,
779 pagetable_mask);
780
781 error = stackshot_trap();
782
783 /* record the duration that interrupts were disabled */
784 uint64_t time_end = mach_absolute_time();
785
786 /* Emit a SOCD tracepoint that we have completed the stackshot */
787 SOCD_TRACE_XNU_END(STACKSHOT);
788 ml_set_interrupts_enabled(prev_interrupt_state);
789
790 if (stackshot_duration_outer) {
791 *stackshot_duration_outer = time_end - time_start;
792 }
793 tot_interrupts_off_abs += time_end - time_start;
794
795 if (error != KERN_SUCCESS) {
796 if (kcdata_p != NULL) {
797 kcdata_memory_destroy(kcdata_p);
798 kcdata_p = NULL;
799 stackshot_kcdata_p = NULL;
800 }
801 kmem_free(kernel_map, (vm_offset_t)stackshotbuf, stackshotbuf_size);
802 stackshotbuf = NULL;
803 if (error == KERN_INSUFFICIENT_BUFFER_SIZE) {
804 /*
805 * If we didn't allocate a big enough buffer, deallocate and try again.
806 */
807 KDBG_RELEASE(MACHDBG_CODE(DBG_MACH_STACKSHOT, STACKSHOT_RECORD_SHORT) | DBG_FUNC_NONE,
808 time_end - time_start, stackshot_estimate, stackshotbuf_size);
809 stackshot_duration_prior_abs += (time_end - time_start);
810 continue;
811 } else {
812 goto error_exit;
813 }
814 }
815
816 bytes_traced = kdp_stack_snapshot_bytes_traced();
817 if (bytes_traced <= 0) {
818 error = KERN_ABORTED;
819 goto error_exit;
820 }
821
822 assert(bytes_traced <= stackshotbuf_size);
823 if (!(flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER)) {
824 error = stackshot_remap_buffer(stackshotbuf, bytes_traced, out_buffer_addr, out_size_addr);
825 goto error_exit;
826 }
827
828 /*
829 * Save the stackshot in the kernel buffer.
830 */
831 kernel_stackshot_buf = stackshotbuf;
832 kernel_stackshot_buf_size = bytes_traced;
833 /*
834 * If we didn't use all the pages in the buffer, set buf_to_free to the start of
835 * the first unused page after the end of the stackshot so kmem_free can clip the
836 * buffer, and update size_to_free for kmem_free accordingly.
837 */
838 size_to_free = stackshotbuf_size - (int) VM_MAP_ROUND_PAGE(bytes_traced, PAGE_MASK);
839
840 assert(size_to_free >= 0);
841
842 if (size_to_free != 0) {
843 buf_to_free = (void *)((uint64_t)stackshotbuf + stackshotbuf_size - size_to_free);
844 }
845
846 stackshotbuf = NULL;
847 stackshotbuf_size = 0;
848 goto error_exit;
849 }
850
851 if (stackshotbuf_size > max_tracebuf_size) {
852 error = KERN_RESOURCE_SHORTAGE;
853 }
854
855 error_exit:
856 if (is_traced) {
857 KDBG_RELEASE(MACHDBG_CODE(DBG_MACH_STACKSHOT, STACKSHOT_RECORD) | DBG_FUNC_END,
858 error, tot_interrupts_off_abs, stackshotbuf_size, bytes_traced);
859 }
860 if (kcdata_p != NULL) {
861 kcdata_memory_destroy(kcdata_p);
862 kcdata_p = NULL;
863 stackshot_kcdata_p = NULL;
864 }
865
866 if (stackshotbuf != NULL) {
867 kmem_free(kernel_map, (vm_offset_t)stackshotbuf, stackshotbuf_size);
868 }
869 if (buf_to_free != NULL) {
870 kmem_free(kernel_map, (vm_offset_t)buf_to_free, size_to_free);
871 }
872 STACKSHOT_SUBSYS_UNLOCK();
873 return error;
874 }
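
/*
 * A sketch (not part of this file's build) of how a caller fills in a
 * stackshot_config_t before handing it to this function. Field names match
 * the parsing above; the flag choice is only an example, and in the normal
 * flow the out_buf/out_size addresses live in the calling process, not in
 * the kernel.
 */
#if 0
static void
example_fill_config(stackshot_config_t *config, uint64_t out_buf_uaddr, uint64_t out_size_uaddr)
{
	config->sc_pid = -1;                         /* all processes */
	config->sc_flags = STACKSHOT_KCDATA_FORMAT | STACKSHOT_SAVE_LOADINFO;
	config->sc_delta_timestamp = 0;              /* not a delta stackshot */
	config->sc_size = 0;                         /* no size hint */
	config->sc_pagetable_mask = 0;               /* ignored without STACKSHOT_PAGE_TABLES */
	config->sc_out_buffer_addr = out_buf_uaddr;  /* receives the remapped buffer address */
	config->sc_out_size_addr = out_size_uaddr;   /* receives the number of bytes traced */
}
#endif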
875
876 /*
877 * Cache stack snapshot parameters in preparation for a trace.
878 */
879 void
880 kdp_snapshot_preflight(int pid, void * tracebuf, uint32_t tracebuf_size, uint64_t flags,
881 kcdata_descriptor_t data_p, uint64_t since_timestamp, uint32_t pagetable_mask)
882 {
883 uint64_t microsecs = 0, secs = 0;
884 clock_get_calendar_microtime((clock_sec_t *)&secs, (clock_usec_t *)&microsecs);
885
886 stackshot_microsecs = microsecs + (secs * USEC_PER_SEC);
887 stack_snapshot_pid = pid;
888 stack_snapshot_buf = tracebuf;
889 stack_snapshot_bufsize = tracebuf_size;
890 stack_snapshot_flags = flags;
891 stack_snapshot_delta_since_timestamp = since_timestamp;
892 stack_snapshot_pagetable_mask = pagetable_mask;
893
894 panic_stackshot = ((flags & STACKSHOT_FROM_PANIC) != 0);
895
896 assert(data_p != NULL);
897 assert(stackshot_kcdata_p == NULL);
898 stackshot_kcdata_p = data_p;
899
900 stack_snapshot_bytes_traced = 0;
901 stack_snapshot_bytes_uncompressed = 0;
902 }
903
904 void
905 panic_stackshot_reset_state(void)
906 {
907 stackshot_kcdata_p = NULL;
908 }
909
910 boolean_t
911 stackshot_active(void)
912 {
913 return stackshot_kcdata_p != NULL;
914 }
915
916 uint32_t
917 kdp_stack_snapshot_bytes_traced(void)
918 {
919 return stack_snapshot_bytes_traced;
920 }
921
922 uint32_t
923 kdp_stack_snapshot_bytes_uncompressed(void)
924 {
925 return stack_snapshot_bytes_uncompressed;
926 }
927
928 static boolean_t
929 memory_iszero(void *addr, size_t size)
930 {
931 char *data = (char *)addr;
932 for (size_t i = 0; i < size; i++) {
933 if (data[i] != 0) {
934 return FALSE;
935 }
936 }
937 return TRUE;
938 }
939
940 /*
941 * Keep a simple cache of the most recent validation done at a page granularity
942 * to avoid the expensive software KVA-to-phys translation in the VM.
943 */
944
945 struct _stackshot_validation_state {
946 vm_offset_t last_valid_page_kva;
947 size_t last_valid_size;
948 } g_validation_state;
949
950 static void
951 _stackshot_validation_reset(void)
952 {
953 g_validation_state.last_valid_page_kva = -1;
954 g_validation_state.last_valid_size = 0;
955 }
956
957 static bool
958 _stackshot_validate_kva(vm_offset_t addr, size_t size)
959 {
960 vm_offset_t page_addr = atop_kernel(addr);
961 if (g_validation_state.last_valid_page_kva == page_addr &&
962 g_validation_state.last_valid_size <= size) {
963 return true;
964 }
965
966 if (ml_validate_nofault(addr, size)) {
967 g_validation_state.last_valid_page_kva = page_addr;
968 g_validation_state.last_valid_size = size;
969 return true;
970 }
971 return false;
972 }
973
974 static long
975 _stackshot_strlen(const char *s, size_t maxlen)
976 {
977 size_t len = 0;
978 for (len = 0; _stackshot_validate_kva((vm_offset_t)s, 1); len++, s++) {
979 if (*s == 0) {
980 return len;
981 }
982 if (len >= maxlen) {
983 return -1;
984 }
985 }
986 return -1; /* failed before end of string */
987 }
988
989 #define kcd_end_address(kcd) ((void *)((uint64_t)((kcd)->kcd_addr_begin) + kcdata_memory_get_used_bytes((kcd))))
990 #define kcd_max_address(kcd) ((void *)((kcd)->kcd_addr_begin + (kcd)->kcd_length))
991 /*
992 * Use of the kcd_exit_on_error(action) macro requires a local
993 * 'kern_return_t error' variable and 'error_exit' label.
994 */
995 #define kcd_exit_on_error(action) \
996 do { \
997 if (KERN_SUCCESS != (error = (action))) { \
998 if (error == KERN_RESOURCE_SHORTAGE) { \
999 error = KERN_INSUFFICIENT_BUFFER_SIZE; \
1000 } \
1001 goto error_exit; \
1002 } \
1003 } while (0); /* end kcd_exit_on_error */
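
/*
 * A minimal sketch (not part of this file's build) of the usage pattern the
 * macro expects: a local 'kern_return_t error' and an 'error_exit' label in
 * the enclosing function. The value and description string are arbitrary.
 */
#if 0
static kern_return_t
example_kcd_usage(kcdata_descriptor_t kcd, uint32_t value)
{
	kern_return_t error = KERN_SUCCESS;

	kcd_exit_on_error(kcdata_add_uint32_with_description(kcd, value, "example_value"));

error_exit:
	return error;
}
#endif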
1004
1005
1006 /*
1007 * For port labels, we have a small hash table we use to track the
1008 * struct ipc_service_port_label pointers we see along the way.
1009 * This structure encapsulates the global state.
1010 *
1011 * The hash table is insert-only, similar to "intern"ing strings. It's
1012 * only used and manipulated during the stackshot collection. We use
1013 * separate chaining, with the hash elements and chains being int16_t
1014 * indexes into the parallel arrays, with -1 ending the chain. Array indices are
1015 * allocated using a bump allocator.
1016 *
1017 * The parallel arrays contain:
1018 * - plh_array[idx] the pointer entered
1019 * - plh_chains[idx] the hash chain
1020 * - plh_gen[idx] the last 'generation #' seen
1021 *
1022 * Generation IDs are used to track entries looked up in the current
1023 * task; 0 is never used, and the plh_gen array is cleared to 0 on
1024 * rollover.
1025 *
1026 * The portlabel_ids we report externally are just the index in the array,
1027 * plus 1 to avoid 0 as a value. 0 is NONE, -1 is UNKNOWN (e.g. there is
1028 * one, but we ran out of space)
1029 */
1030 struct port_label_hash {
1031 uint16_t plh_size; /* size of allocations; 0 disables tracking */
1032 uint16_t plh_count; /* count of used entries in plh_array */
1033 struct ipc_service_port_label **plh_array; /* _size allocated, _count used */
1034 int16_t *plh_chains; /* _size allocated */
1035 uint8_t *plh_gen; /* last 'gen #' each entry was seen in */
1036 int16_t *plh_hash; /* (1 << STACKSHOT_PLH_SHIFT) entry hash table: hash(ptr) -> array index */
1037 int16_t plh_curgen_min; /* min idx seen for this gen */
1038 int16_t plh_curgen_max; /* max idx seen for this gen */
1039 uint8_t plh_curgen; /* current gen */
1040 #if DEVELOPMENT || DEBUG
1041 /* statistics */
1042 uint32_t plh_lookups; /* # lookups or inserts */
1043 uint32_t plh_found;
1044 uint32_t plh_found_depth;
1045 uint32_t plh_insert;
1046 uint32_t plh_insert_depth;
1047 uint32_t plh_bad;
1048 uint32_t plh_bad_depth;
1049 uint32_t plh_lookup_send;
1050 uint32_t plh_lookup_receive;
1051 #define PLH_STAT_OP(...) (void)(__VA_ARGS__)
1052 #else /* DEVELOPMENT || DEBUG */
1053 #define PLH_STAT_OP(...) (void)(0)
1054 #endif /* DEVELOPMENT || DEBUG */
1055 } port_label_hash;
1056
1057 #define STACKSHOT_PLH_SHIFT 7
1058 #define STACKSHOT_PLH_SIZE_MAX ((kdp_ipc_have_splabel)? 1024 : 0)
1059 size_t stackshot_port_label_size = (2 * (1u << STACKSHOT_PLH_SHIFT));
1060 #define STASKSHOT_PLH_SIZE(x) MIN((x), STACKSHOT_PLH_SIZE_MAX)
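
/*
 * With the values above: the hash table has (1 << 7) = 128 buckets, the
 * default entry capacity is 2 * 128 = 256 port labels, and the hard cap is
 * 1024 entries (or 0, disabling tracking, when the kernel has no service
 * port label support).
 */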
1061
1062 static size_t
1063 stackshot_plh_est_size(void)
1064 {
1065 struct port_label_hash *plh = &port_label_hash;
1066 size_t size = STASKSHOT_PLH_SIZE(stackshot_port_label_size);
1067
1068 if (size == 0) {
1069 return 0;
1070 }
1071 #define SIZE_EST(x) ROUNDUP((x), sizeof (uintptr_t))
1072 return SIZE_EST(size * sizeof(*plh->plh_array)) +
1073 SIZE_EST(size * sizeof(*plh->plh_chains)) +
1074 SIZE_EST(size * sizeof(*plh->plh_gen)) +
1075 SIZE_EST((1ul << STACKSHOT_PLH_SHIFT) * sizeof(*plh->plh_hash));
1076 #undef SIZE_EST
1077 }
1078
1079 static void
1080 stackshot_plh_reset(void)
1081 {
1082 port_label_hash = (struct port_label_hash){.plh_size = 0}; /* structure assignment */
1083 }
1084
1085 static void
1086 stackshot_plh_setup(kcdata_descriptor_t data)
1087 {
1088 struct port_label_hash plh = {
1089 .plh_size = STASKSHOT_PLH_SIZE(stackshot_port_label_size),
1090 .plh_count = 0,
1091 .plh_curgen = 1,
1092 .plh_curgen_min = STACKSHOT_PLH_SIZE_MAX,
1093 .plh_curgen_max = 0,
1094 };
1095 stackshot_plh_reset();
1096 size_t size = plh.plh_size;
1097 if (size == 0) {
1098 return;
1099 }
1100 plh.plh_array = kcdata_endalloc(data, size * sizeof(*plh.plh_array));
1101 plh.plh_chains = kcdata_endalloc(data, size * sizeof(*plh.plh_chains));
1102 plh.plh_gen = kcdata_endalloc(data, size * sizeof(*plh.plh_gen));
1103 plh.plh_hash = kcdata_endalloc(data, (1ul << STACKSHOT_PLH_SHIFT) * sizeof(*plh.plh_hash));
1104 if (plh.plh_array == NULL || plh.plh_chains == NULL || plh.plh_gen == NULL || plh.plh_hash == NULL) {
1105 PLH_STAT_OP(port_label_hash.plh_bad++);
1106 return;
1107 }
1108 for (int x = 0; x < size; x++) {
1109 plh.plh_array[x] = NULL;
1110 plh.plh_chains[x] = -1;
1111 plh.plh_gen[x] = 0;
1112 }
1113 for (int x = 0; x < (1ul << STACKSHOT_PLH_SHIFT); x++) {
1114 plh.plh_hash[x] = -1;
1115 }
1116 port_label_hash = plh; /* structure assignment */
1117 }
1118
1119 static int16_t
1120 stackshot_plh_hash(struct ipc_service_port_label *ispl)
1121 {
1122 uintptr_t ptr = (uintptr_t)ispl;
1123 static_assert(STACKSHOT_PLH_SHIFT < 16, "plh_hash must fit in 15 bits");
1124 #define PLH_HASH_STEP(ptr, x) \
1125 ((((x) * STACKSHOT_PLH_SHIFT) < (sizeof(ispl) * CHAR_BIT)) ? ((ptr) >> ((x) * STACKSHOT_PLH_SHIFT)) : 0)
1126 ptr ^= PLH_HASH_STEP(ptr, 16);
1127 ptr ^= PLH_HASH_STEP(ptr, 8);
1128 ptr ^= PLH_HASH_STEP(ptr, 4);
1129 ptr ^= PLH_HASH_STEP(ptr, 2);
1130 ptr ^= PLH_HASH_STEP(ptr, 1);
1131 #undef PLH_HASH_STEP
1132 return (int16_t)(ptr & ((1ul << STACKSHOT_PLH_SHIFT) - 1));
1133 }
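
/*
 * For a 64-bit pointer and STACKSHOT_PLH_SHIFT == 7, the fold above XORs the
 * running value with itself shifted right by 56, then 28, 14, and 7 bits (the
 * 112-bit step compiles away), and keeps the low 7 bits as the bucket index.
 */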
1134
1135 enum stackshot_plh_lookup_type {
1136 STACKSHOT_PLH_LOOKUP_UNKNOWN,
1137 STACKSHOT_PLH_LOOKUP_SEND,
1138 STACKSHOT_PLH_LOOKUP_RECEIVE,
1139 };
1140
1141 static void
1142 stackshot_plh_resetgen(void)
1143 {
1144 struct port_label_hash *plh = &port_label_hash;
1145 if (plh->plh_curgen_min == STACKSHOT_PLH_SIZE_MAX && plh->plh_curgen_max == 0) {
1146 return; // no lookups, nothing using the current generation
1147 }
1148 plh->plh_curgen++;
1149 plh->plh_curgen_min = STACKSHOT_PLH_SIZE_MAX;
1150 plh->plh_curgen_max = 0;
1151 if (plh->plh_curgen == 0) { // wrapped, zero the array and increment the generation
1152 for (int x = 0; x < plh->plh_size; x++) {
1153 plh->plh_gen[x] = 0;
1154 }
1155 plh->plh_curgen = 1;
1156 }
1157 }
1158
1159 static int16_t
1160 stackshot_plh_lookup(struct ipc_service_port_label *ispl, enum stackshot_plh_lookup_type type)
1161 {
1162 struct port_label_hash *plh = &port_label_hash;
1163 int depth;
1164 int16_t cur;
1165 if (ispl == NULL) {
1166 return STACKSHOT_PORTLABELID_NONE;
1167 }
1168 switch (type) {
1169 case STACKSHOT_PLH_LOOKUP_SEND:
1170 PLH_STAT_OP(plh->plh_lookup_send++);
1171 break;
1172 case STACKSHOT_PLH_LOOKUP_RECEIVE:
1173 PLH_STAT_OP(plh->plh_lookup_receive++);
1174 break;
1175 default:
1176 break;
1177 }
1178 PLH_STAT_OP(plh->plh_lookups++);
1179 if (plh->plh_size == 0) {
1180 return STACKSHOT_PORTLABELID_MISSING;
1181 }
1182 int16_t hash = stackshot_plh_hash(ispl);
1183 assert(hash >= 0 && hash < (1ul << STACKSHOT_PLH_SHIFT));
1184 depth = 0;
1185 for (cur = plh->plh_hash[hash]; cur >= 0; cur = plh->plh_chains[cur]) {
1186 /* cur must be in-range, and chain depth can never be above our # allocated */
1187 if (cur >= plh->plh_count || depth > plh->plh_count || depth > plh->plh_size) {
1188 PLH_STAT_OP((plh->plh_bad++), (plh->plh_bad_depth += depth));
1189 return STACKSHOT_PORTLABELID_MISSING;
1190 }
1191 assert(cur < plh->plh_count);
1192 if (plh->plh_array[cur] == ispl) {
1193 PLH_STAT_OP((plh->plh_found++), (plh->plh_found_depth += depth));
1194 goto found;
1195 }
1196 depth++;
1197 }
1198 /* not found in hash table, so alloc and insert it */
1199 if (cur != -1) {
1200 PLH_STAT_OP((plh->plh_bad++), (plh->plh_bad_depth += depth));
1201 return STACKSHOT_PORTLABELID_MISSING; /* bad end of chain */
1202 }
1203 PLH_STAT_OP((plh->plh_insert++), (plh->plh_insert_depth += depth));
1204 if (plh->plh_count >= plh->plh_size) {
1205 return STACKSHOT_PORTLABELID_MISSING; /* no space */
1206 }
1207 cur = plh->plh_count;
1208 plh->plh_count++;
1209 plh->plh_array[cur] = ispl;
1210 plh->plh_chains[cur] = plh->plh_hash[hash];
1211 plh->plh_hash[hash] = cur;
1212 found:
1213 plh->plh_gen[cur] = plh->plh_curgen;
1214 if (plh->plh_curgen_min > cur) {
1215 plh->plh_curgen_min = cur;
1216 }
1217 if (plh->plh_curgen_max < cur) {
1218 plh->plh_curgen_max = cur;
1219 }
1220 return cur + 1; /* offset to avoid 0 */
1221 }
1222
1223 // record any PLH referenced since the last stackshot_plh_resetgen() call
1224 static kern_return_t
1225 kdp_stackshot_plh_record(void)
1226 {
1227 kern_return_t error = KERN_SUCCESS;
1228 struct port_label_hash *plh = &port_label_hash;
1229 uint16_t count = plh->plh_count;
1230 uint8_t curgen = plh->plh_curgen;
1231 int16_t curgen_min = plh->plh_curgen_min;
1232 int16_t curgen_max = plh->plh_curgen_max;
1233 if (curgen_min <= curgen_max && curgen_max < count &&
1234 count <= plh->plh_size && plh->plh_size <= STACKSHOT_PLH_SIZE_MAX) {
1235 struct ipc_service_port_label **arr = plh->plh_array;
1236 size_t ispl_size, max_namelen;
1237 kdp_ipc_splabel_size(&ispl_size, &max_namelen);
1238 for (int idx = curgen_min; idx <= curgen_max; idx++) {
1239 struct ipc_service_port_label *ispl = arr[idx];
1240 struct portlabel_info spl = {
1241 .portlabel_id = (idx + 1),
1242 };
1243 const char *name = NULL;
1244 long name_sz = 0;
1245 if (plh->plh_gen[idx] != curgen) {
1246 continue;
1247 }
1248 if (_stackshot_validate_kva((vm_offset_t)ispl, ispl_size)) {
1249 kdp_ipc_fill_splabel(ispl, &spl, &name);
1250 }
1251 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_BEGIN,
1252 STACKSHOT_KCCONTAINER_PORTLABEL, idx + 1));
1253 if (name != NULL && (name_sz = _stackshot_strlen(name, max_namelen)) > 0) { /* validates the kva */
1254 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_PORTLABEL_NAME, name_sz + 1, name));
1255 } else {
1256 spl.portlabel_flags |= STACKSHOT_PORTLABEL_READFAILED;
1257 }
1258 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_PORTLABEL, sizeof(spl), &spl));
1259 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_END,
1260 STACKSHOT_KCCONTAINER_PORTLABEL, idx + 1));
1261 }
1262 }
1263
1264 error_exit:
1265 return error;
1266 }
1267
1268 #if DEVELOPMENT || DEBUG
1269 static kern_return_t
1270 kdp_stackshot_plh_stats(void)
1271 {
1272 kern_return_t error = KERN_SUCCESS;
1273 struct port_label_hash *plh = &port_label_hash;
1274
1275 #define PLH_STAT(x) do { if (plh->x != 0) { \
1276 kcd_exit_on_error(kcdata_add_uint32_with_description(stackshot_kcdata_p, plh->x, "stackshot_" #x)); \
1277 } } while (0)
1278 PLH_STAT(plh_size);
1279 PLH_STAT(plh_lookups);
1280 PLH_STAT(plh_found);
1281 PLH_STAT(plh_found_depth);
1282 PLH_STAT(plh_insert);
1283 PLH_STAT(plh_insert_depth);
1284 PLH_STAT(plh_bad);
1285 PLH_STAT(plh_bad_depth);
1286 PLH_STAT(plh_lookup_send);
1287 PLH_STAT(plh_lookup_receive);
1288 #undef PLH_STAT
1289
1290 error_exit:
1291 return error;
1292 }
1293 #endif /* DEVELOPMENT || DEBUG */
1294
1295 static uint64_t
1296 kcdata_get_task_ss_flags(task_t task)
1297 {
1298 uint64_t ss_flags = 0;
1299 boolean_t task_64bit_addr = task_has_64Bit_addr(task);
1300 void *bsd_info = get_bsdtask_info(task);
1301
1302 if (task_64bit_addr) {
1303 ss_flags |= kUser64_p;
1304 }
1305 if (!task->active || task_is_a_corpse(task) || proc_exiting(bsd_info)) {
1306 ss_flags |= kTerminatedSnapshot;
1307 }
1308 if (task->pidsuspended) {
1309 ss_flags |= kPidSuspended;
1310 }
1311 if (task->frozen) {
1312 ss_flags |= kFrozen;
1313 }
1314 if (task->effective_policy.tep_darwinbg == 1) {
1315 ss_flags |= kTaskDarwinBG;
1316 }
1317 if (task->requested_policy.trp_role == TASK_FOREGROUND_APPLICATION) {
1318 ss_flags |= kTaskIsForeground;
1319 }
1320 if (task->requested_policy.trp_boosted == 1) {
1321 ss_flags |= kTaskIsBoosted;
1322 }
1323 if (task->effective_policy.tep_sup_active == 1) {
1324 ss_flags |= kTaskIsSuppressed;
1325 }
1326 #if CONFIG_MEMORYSTATUS
1327
1328 boolean_t dirty = FALSE, dirty_tracked = FALSE, allow_idle_exit = FALSE;
1329 memorystatus_proc_flags_unsafe(bsd_info, &dirty, &dirty_tracked, &allow_idle_exit);
1330 if (dirty) {
1331 ss_flags |= kTaskIsDirty;
1332 }
1333 if (dirty_tracked) {
1334 ss_flags |= kTaskIsDirtyTracked;
1335 }
1336 if (allow_idle_exit) {
1337 ss_flags |= kTaskAllowIdleExit;
1338 }
1339
1340 #endif
1341 if (task->effective_policy.tep_tal_engaged) {
1342 ss_flags |= kTaskTALEngaged;
1343 }
1344
1345 ss_flags |= (0x7 & workqueue_get_pwq_state_kdp(bsd_info)) << 17;
1346
1347 #if IMPORTANCE_INHERITANCE
1348 if (task->task_imp_base) {
1349 if (task->task_imp_base->iit_donor) {
1350 ss_flags |= kTaskIsImpDonor;
1351 }
1352 if (task->task_imp_base->iit_live_donor) {
1353 ss_flags |= kTaskIsLiveImpDonor;
1354 }
1355 }
1356 #endif
1357 return ss_flags;
1358 }
1359
1360 static kern_return_t
1361 kcdata_record_shared_cache_info(kcdata_descriptor_t kcd, task_t task, unaligned_u64 *task_snap_ss_flags)
1362 {
1363 kern_return_t error = KERN_SUCCESS;
1364
1365 uint64_t shared_cache_slide = 0;
1366 uint64_t shared_cache_first_mapping = 0;
1367 uint32_t kdp_fault_results = 0;
1368 uint32_t shared_cache_id = 0;
1369 struct dyld_shared_cache_loadinfo shared_cache_data = {0};
1370
1371
1372 assert(task_snap_ss_flags != NULL);
1373
1374 /* Get basic info about the shared region pointer, regardless of any failures */
1375 if (task->shared_region == NULL) {
1376 *task_snap_ss_flags |= kTaskSharedRegionNone;
1377 } else if (task->shared_region == primary_system_shared_region) {
1378 *task_snap_ss_flags |= kTaskSharedRegionSystem;
1379 } else {
1380 *task_snap_ss_flags |= kTaskSharedRegionOther;
1381 }
1382
1383 if (task->shared_region && _stackshot_validate_kva((vm_offset_t)task->shared_region, sizeof(struct vm_shared_region))) {
1384 struct vm_shared_region *sr = task->shared_region;
1385 shared_cache_first_mapping = sr->sr_base_address + sr->sr_first_mapping;
1386
1387 shared_cache_id = sr->sr_id;
1388 } else {
1389 *task_snap_ss_flags |= kTaskSharedRegionInfoUnavailable;
1390 goto error_exit;
1391 }
1392
1393 /* We haven't copied in the shared region UUID yet as part of setup */
1394 if (!shared_cache_first_mapping || !task->shared_region->sr_uuid_copied) {
1395 goto error_exit;
1396 }
1397
1398
1399 /*
1400 * No refcounting here, but we are in debugger context, so that should be safe.
1401 */
1402 shared_cache_slide = task->shared_region->sr_slide;
1403
1404 if (task->shared_region == primary_system_shared_region) {
1405 /* skip adding shared cache info -- it's the same as the system level one */
1406 goto error_exit;
1407 }
1408 /*
1409 * New-style shared cache reference: for non-primary shared regions,
1410 * just include the ID of the shared cache we're attached to. Consumers
1411 * should use the following info from the task's ts_ss_flags as well:
1412 *
1413 * kTaskSharedRegionNone - task is not attached to a shared region
1414 * kTaskSharedRegionSystem - task is attached to the shared region
1415 * with kSharedCacheSystemPrimary set in sharedCacheFlags.
1416 * kTaskSharedRegionOther - task is attached to the shared region with
1417 * sharedCacheID matching the STACKSHOT_KCTYPE_SHAREDCACHE_ID entry.
1418 */
1419 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_SHAREDCACHE_ID, sizeof(shared_cache_id), &shared_cache_id));
1420
1421 /*
1422 * For backwards compatibility; this should eventually be removed.
1423 *
1424 * Historically, this data was in a dyld_uuid_info_64 structure, but the
1425 * naming of both the structure and fields for this use wasn't great. The
1426 * dyld_shared_cache_loadinfo structure has better names, but the same
1427 * layout and content as the original.
1428 *
1429 * The imageSlidBaseAddress/sharedCacheUnreliableSlidBaseAddress field
1430 * has been used inconsistently for STACKSHOT_COLLECT_SHAREDCACHE_LAYOUT
1431 * entries; here, it's the slid first mapping, and we leave it that way
1432 * for backwards compatibility.
1433 */
1434 shared_cache_data.sharedCacheSlide = shared_cache_slide;
1435 kdp_memcpy(&shared_cache_data.sharedCacheUUID, task->shared_region->sr_uuid, sizeof(task->shared_region->sr_uuid));
1436 shared_cache_data.sharedCacheUnreliableSlidBaseAddress = shared_cache_first_mapping;
1437 shared_cache_data.sharedCacheSlidFirstMapping = shared_cache_first_mapping;
1438 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_SHAREDCACHE_LOADINFO, sizeof(shared_cache_data), &shared_cache_data));
1439
1440 error_exit:
1441 if (kdp_fault_results & KDP_FAULT_RESULT_PAGED_OUT) {
1442 *task_snap_ss_flags |= kTaskUUIDInfoMissing;
1443 }
1444
1445 if (kdp_fault_results & KDP_FAULT_RESULT_TRIED_FAULT) {
1446 *task_snap_ss_flags |= kTaskUUIDInfoTriedFault;
1447 }
1448
1449 if (kdp_fault_results & KDP_FAULT_RESULT_FAULTED_IN) {
1450 *task_snap_ss_flags |= kTaskUUIDInfoFaultedIn;
1451 }
1452
1453 return error;
1454 }
1455
1456 static kern_return_t
1457 kcdata_record_uuid_info(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 *task_snap_ss_flags)
1458 {
1459 bool save_loadinfo_p = ((trace_flags & STACKSHOT_SAVE_LOADINFO) != 0);
1460 bool save_kextloadinfo_p = ((trace_flags & STACKSHOT_SAVE_KEXT_LOADINFO) != 0);
1461 bool save_compactinfo_p = ((trace_flags & STACKSHOT_SAVE_DYLD_COMPACTINFO) != 0);
1462 bool should_fault = (trace_flags & STACKSHOT_ENABLE_UUID_FAULTING);
1463
1464 kern_return_t error = KERN_SUCCESS;
1465 mach_vm_address_t out_addr = 0;
1466
1467 mach_vm_address_t dyld_compactinfo_addr = 0;
1468 uint32_t dyld_compactinfo_size = 0;
1469
1470 uint32_t uuid_info_count = 0;
1471 mach_vm_address_t uuid_info_addr = 0;
1472 uint64_t uuid_info_timestamp = 0;
1473 kdp_fault_result_flags_t kdp_fault_results = 0;
1474
1475
1476 assert(task_snap_ss_flags != NULL);
1477
1478 int task_pid = pid_from_task(task);
1479 boolean_t task_64bit_addr = task_has_64Bit_addr(task);
1480
1481 if ((save_loadinfo_p || save_compactinfo_p) && have_pmap && task->active && task_pid > 0) {
1482 /* Read the dyld_all_image_infos struct from the task memory to get UUID array count and location */
1483 if (task_64bit_addr) {
1484 struct user64_dyld_all_image_infos task_image_infos;
1485 if (stackshot_copyin(task->map, task->all_image_info_addr, &task_image_infos,
1486 sizeof(struct user64_dyld_all_image_infos), should_fault, &kdp_fault_results)) {
1487 uuid_info_count = (uint32_t)task_image_infos.uuidArrayCount;
1488 uuid_info_addr = task_image_infos.uuidArray;
1489 if (task_image_infos.version >= DYLD_ALL_IMAGE_INFOS_TIMESTAMP_MINIMUM_VERSION) {
1490 uuid_info_timestamp = task_image_infos.timestamp;
1491 }
1492 if (task_image_infos.version >= DYLD_ALL_IMAGE_INFOS_COMPACTINFO_MINIMUM_VERSION) {
1493 dyld_compactinfo_addr = task_image_infos.compact_dyld_image_info_addr;
1494 dyld_compactinfo_size = task_image_infos.compact_dyld_image_info_size;
1495 }
1496
1497 }
1498 } else {
1499 struct user32_dyld_all_image_infos task_image_infos;
1500 if (stackshot_copyin(task->map, task->all_image_info_addr, &task_image_infos,
1501 sizeof(struct user32_dyld_all_image_infos), should_fault, &kdp_fault_results)) {
1502 uuid_info_count = task_image_infos.uuidArrayCount;
1503 uuid_info_addr = task_image_infos.uuidArray;
1504 if (task_image_infos.version >= DYLD_ALL_IMAGE_INFOS_TIMESTAMP_MINIMUM_VERSION) {
1505 uuid_info_timestamp = task_image_infos.timestamp;
1506 }
1507 if (task_image_infos.version >= DYLD_ALL_IMAGE_INFOS_COMPACTINFO_MINIMUM_VERSION) {
1508 dyld_compactinfo_addr = task_image_infos.compact_dyld_image_info_addr;
1509 dyld_compactinfo_size = task_image_infos.compact_dyld_image_info_size;
1510 }
1511 }
1512 }
1513
1514 /*
1515 * If we get a NULL uuid_info_addr (which can happen when we catch dyld in the middle of updating
1516 * this data structure), we zero the uuid_info_count so that we won't even try to save load info
1517 * for this task.
1518 */
1519 if (!uuid_info_addr) {
1520 uuid_info_count = 0;
1521 }
1522
1523 if (!dyld_compactinfo_addr) {
1524 dyld_compactinfo_size = 0;
1525 }
1526
1527 }
1528
1529 if (have_pmap && task_pid == 0) {
1530 if (save_kextloadinfo_p && _stackshot_validate_kva((vm_offset_t)(gLoadedKextSummaries), sizeof(OSKextLoadedKextSummaryHeader))) {
1531 uuid_info_count = gLoadedKextSummaries->numSummaries + 1; /* include main kernel UUID */
1532 } else {
1533 uuid_info_count = 1; /* include kernelcache UUID (embedded) or kernel UUID (desktop) */
1534 }
1535 }
1536
1537 if (save_compactinfo_p && task_pid > 0) {
1538 if (dyld_compactinfo_size == 0) {
1539 *task_snap_ss_flags |= kTaskDyldCompactInfoNone;
1540 } else if (dyld_compactinfo_size > MAX_DYLD_COMPACTINFO) {
1541 *task_snap_ss_flags |= kTaskDyldCompactInfoTooBig;
1542 } else {
1543 kdp_fault_result_flags_t ci_kdp_fault_results = 0;
1544
1545 /* Open a compression window to avoid overflowing the stack */
1546 kcdata_compression_window_open(kcd);
1547 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_DYLD_COMPACTINFO,
1548 dyld_compactinfo_size, &out_addr));
1549
1550 if (!stackshot_copyin(task->map, dyld_compactinfo_addr, (void *)out_addr,
1551 dyld_compactinfo_size, should_fault, &ci_kdp_fault_results)) {
1552 bzero((void *)out_addr, dyld_compactinfo_size);
1553 }
1554 if (ci_kdp_fault_results & KDP_FAULT_RESULT_PAGED_OUT) {
1555 *task_snap_ss_flags |= kTaskDyldCompactInfoMissing;
1556 }
1557
1558 if (ci_kdp_fault_results & KDP_FAULT_RESULT_TRIED_FAULT) {
1559 *task_snap_ss_flags |= kTaskDyldCompactInfoTriedFault;
1560 }
1561
1562 if (ci_kdp_fault_results & KDP_FAULT_RESULT_FAULTED_IN) {
1563 *task_snap_ss_flags |= kTaskDyldCompactInfoFaultedIn;
1564 }
1565
1566 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1567 }
1568 }
1569 if (save_loadinfo_p && task_pid > 0 && (uuid_info_count < MAX_LOADINFOS)) {
1570 uint32_t copied_uuid_count = 0;
1571 uint32_t uuid_info_size = (uint32_t)(task_64bit_addr ? sizeof(struct user64_dyld_uuid_info) : sizeof(struct user32_dyld_uuid_info));
1572 uint32_t uuid_info_array_size = 0;
1573
1574 /* Open a compression window to avoid overflowing the stack */
1575 kcdata_compression_window_open(kcd);
1576
1577 /* If we found some UUID information, first try to copy it in -- this will only be non-zero if we had a pmap above */
1578 if (uuid_info_count > 0) {
1579 uuid_info_array_size = uuid_info_count * uuid_info_size;
1580
1581 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, (task_64bit_addr ? KCDATA_TYPE_LIBRARY_LOADINFO64 : KCDATA_TYPE_LIBRARY_LOADINFO),
1582 uuid_info_size, uuid_info_count, &out_addr));
1583
1584 if (!stackshot_copyin(task->map, uuid_info_addr, (void *)out_addr, uuid_info_array_size, should_fault, &kdp_fault_results)) {
1585 bzero((void *)out_addr, uuid_info_array_size);
1586 } else {
1587 copied_uuid_count = uuid_info_count;
1588 }
1589 }
1590
1591 uuid_t binary_uuid;
1592 if (!copied_uuid_count && proc_binary_uuid_kdp(task, binary_uuid)) {
1593 /* We failed to copyin the UUID information, try to store the UUID of the main binary we have in the proc */
1594 if (uuid_info_array_size == 0) {
1595 /* We just need to store one UUID */
1596 uuid_info_array_size = uuid_info_size;
1597 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, (task_64bit_addr ? KCDATA_TYPE_LIBRARY_LOADINFO64 : KCDATA_TYPE_LIBRARY_LOADINFO),
1598 uuid_info_size, 1, &out_addr));
1599 }
1600
1601 if (task_64bit_addr) {
1602 struct user64_dyld_uuid_info *uuid_info = (struct user64_dyld_uuid_info *)out_addr;
1603 uint64_t image_load_address = task->mach_header_vm_address;
1604
1605 kdp_memcpy(&uuid_info->imageUUID, binary_uuid, sizeof(uuid_t));
1606 kdp_memcpy(&uuid_info->imageLoadAddress, &image_load_address, sizeof(image_load_address));
1607 } else {
1608 struct user32_dyld_uuid_info *uuid_info = (struct user32_dyld_uuid_info *)out_addr;
1609 uint32_t image_load_address = (uint32_t) task->mach_header_vm_address;
1610
1611 kdp_memcpy(&uuid_info->imageUUID, binary_uuid, sizeof(uuid_t));
1612 kdp_memcpy(&uuid_info->imageLoadAddress, &image_load_address, sizeof(image_load_address));
1613 }
1614 }
1615
1616 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1617 } else if (task_pid == 0 && uuid_info_count > 0 && uuid_info_count < MAX_LOADINFOS) {
1618 uintptr_t image_load_address;
1619
1620 do {
1621 #if defined(__arm64__)
1622 if (kernelcache_uuid_valid && !save_kextloadinfo_p) {
1623 struct dyld_uuid_info_64 kc_uuid = {0};
1624 kc_uuid.imageLoadAddress = VM_MIN_KERNEL_AND_KEXT_ADDRESS;
1625 kdp_memcpy(&kc_uuid.imageUUID, &kernelcache_uuid, sizeof(uuid_t));
1626 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_KERNELCACHE_LOADINFO, sizeof(struct dyld_uuid_info_64), &kc_uuid));
1627 break;
1628 }
1629 #endif /* defined(__arm64__) */
1630
1631 if (!kernel_uuid || !_stackshot_validate_kva((vm_offset_t)kernel_uuid, sizeof(uuid_t))) {
1632 /* Kernel UUID not found or inaccessible */
1633 break;
1634 }
1635
1636 uint32_t uuid_type = KCDATA_TYPE_LIBRARY_LOADINFO;
1637 if ((sizeof(kernel_uuid_info) == sizeof(struct user64_dyld_uuid_info))) {
1638 uuid_type = KCDATA_TYPE_LIBRARY_LOADINFO64;
1639 #if defined(__arm64__)
1640 kc_format_t primary_kc_type = KCFormatUnknown;
1641 if (PE_get_primary_kc_format(&primary_kc_type) && (primary_kc_type == KCFormatFileset)) {
1642 /* return TEXT_EXEC based load information on arm devices running with fileset kernelcaches */
1643 uuid_type = STACKSHOT_KCTYPE_LOADINFO64_TEXT_EXEC;
1644 }
1645 #endif
1646 }
1647
1648 /*
1649 * The element count of the array can vary - avoid overflowing the
1650 * stack by opening a window.
1651 */
1652 kcdata_compression_window_open(kcd);
1653 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, uuid_type,
1654 sizeof(kernel_uuid_info), uuid_info_count, &out_addr));
1655 kernel_uuid_info *uuid_info_array = (kernel_uuid_info *)out_addr;
1656
1657 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(vm_kernel_stext);
1658 #if defined(__arm64__)
1659 if (uuid_type == STACKSHOT_KCTYPE_LOADINFO64_TEXT_EXEC) {
1660 /* If we're reporting TEXT_EXEC load info, populate the TEXT_EXEC base instead */
1661 extern vm_offset_t segTEXTEXECB;
1662 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(segTEXTEXECB);
1663 }
1664 #endif
1665 uuid_info_array[0].imageLoadAddress = image_load_address;
1666 kdp_memcpy(&uuid_info_array[0].imageUUID, kernel_uuid, sizeof(uuid_t));
1667
1668 if (save_kextloadinfo_p &&
1669 _stackshot_validate_kva((vm_offset_t)(gLoadedKextSummaries), sizeof(OSKextLoadedKextSummaryHeader)) &&
1670 _stackshot_validate_kva((vm_offset_t)(&gLoadedKextSummaries->summaries[0]),
1671 gLoadedKextSummaries->entry_size * gLoadedKextSummaries->numSummaries)) {
1672 uint32_t kexti;
1673 for (kexti = 0; kexti < gLoadedKextSummaries->numSummaries; kexti++) {
1674 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(gLoadedKextSummaries->summaries[kexti].address);
1675 #if defined(__arm64__)
1676 if (uuid_type == STACKSHOT_KCTYPE_LOADINFO64_TEXT_EXEC) {
1677 /* If we're reporting TEXT_EXEC load info, populate the TEXT_EXEC base instead */
1678 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(gLoadedKextSummaries->summaries[kexti].text_exec_address);
1679 }
1680 #endif
1681 uuid_info_array[kexti + 1].imageLoadAddress = image_load_address;
1682 kdp_memcpy(&uuid_info_array[kexti + 1].imageUUID, &gLoadedKextSummaries->summaries[kexti].uuid, sizeof(uuid_t));
1683 }
1684 }
1685 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1686 } while (0);
1687 }
1688
1689 error_exit:
1690 if (kdp_fault_results & KDP_FAULT_RESULT_PAGED_OUT) {
1691 *task_snap_ss_flags |= kTaskUUIDInfoMissing;
1692 }
1693
1694 if (kdp_fault_results & KDP_FAULT_RESULT_TRIED_FAULT) {
1695 *task_snap_ss_flags |= kTaskUUIDInfoTriedFault;
1696 }
1697
1698 if (kdp_fault_results & KDP_FAULT_RESULT_FAULTED_IN) {
1699 *task_snap_ss_flags |= kTaskUUIDInfoFaultedIn;
1700 }
1701
1702 return error;
1703 }
1704
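/*
 * Record per-task I/O statistics (STACKSHOT_KCTYPE_IOSTATS) when any counter
 * is non-zero. Write, non-paging and data figures are derived by subtracting
 * the read, paging and metadata counters from the totals.
 */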
1705 static kern_return_t
1706 kcdata_record_task_iostats(kcdata_descriptor_t kcd, task_t task)
1707 {
1708 kern_return_t error = KERN_SUCCESS;
1709 mach_vm_address_t out_addr = 0;
1710
1711 /* I/O Statistics if any counters are non-zero */
1712 assert(IO_NUM_PRIORITIES == STACKSHOT_IO_NUM_PRIORITIES);
1713 if (task->task_io_stats && !memory_iszero(task->task_io_stats, sizeof(struct io_stat_info))) {
1714 /* struct io_stats_snapshot is quite large - avoid overflowing the stack. */
1715 kcdata_compression_window_open(kcd);
1716 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_IOSTATS, sizeof(struct io_stats_snapshot), &out_addr));
1717 struct io_stats_snapshot *_iostat = (struct io_stats_snapshot *)out_addr;
1718 _iostat->ss_disk_reads_count = task->task_io_stats->disk_reads.count;
1719 _iostat->ss_disk_reads_size = task->task_io_stats->disk_reads.size;
1720 _iostat->ss_disk_writes_count = (task->task_io_stats->total_io.count - task->task_io_stats->disk_reads.count);
1721 _iostat->ss_disk_writes_size = (task->task_io_stats->total_io.size - task->task_io_stats->disk_reads.size);
1722 _iostat->ss_paging_count = task->task_io_stats->paging.count;
1723 _iostat->ss_paging_size = task->task_io_stats->paging.size;
1724 _iostat->ss_non_paging_count = (task->task_io_stats->total_io.count - task->task_io_stats->paging.count);
1725 _iostat->ss_non_paging_size = (task->task_io_stats->total_io.size - task->task_io_stats->paging.size);
1726 _iostat->ss_metadata_count = task->task_io_stats->metadata.count;
1727 _iostat->ss_metadata_size = task->task_io_stats->metadata.size;
1728 _iostat->ss_data_count = (task->task_io_stats->total_io.count - task->task_io_stats->metadata.count);
1729 _iostat->ss_data_size = (task->task_io_stats->total_io.size - task->task_io_stats->metadata.size);
1730 for (int i = 0; i < IO_NUM_PRIORITIES; i++) {
1731 _iostat->ss_io_priority_count[i] = task->task_io_stats->io_priority[i].count;
1732 _iostat->ss_io_priority_size[i] = task->task_io_stats->io_priority[i].size;
1733 }
1734 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1735 }
1736
1737
1738 error_exit:
1739 return error;
1740 }
1741
1742 #if CONFIG_PERVASIVE_CPI
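/*
 * Record the task's instruction and cycle counts (overall and
 * performance-core-only), as reported by
 * recount_task_terminated_usage_perf_only().
 */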
1743 static kern_return_t
1744 kcdata_record_task_instrs_cycles(kcdata_descriptor_t kcd, task_t task)
1745 {
1746 struct instrs_cycles_snapshot_v2 instrs_cycles = { 0 };
1747 struct recount_usage usage = { 0 };
1748 struct recount_usage perf_only = { 0 };
1749 recount_task_terminated_usage_perf_only(task, &usage, &perf_only);
1750 instrs_cycles.ics_instructions = usage.ru_instructions;
1751 instrs_cycles.ics_cycles = usage.ru_cycles;
1752 instrs_cycles.ics_p_instructions = perf_only.ru_instructions;
1753 instrs_cycles.ics_p_cycles = perf_only.ru_cycles;
1754
1755 return kcdata_push_data(kcd, STACKSHOT_KCTYPE_INSTRS_CYCLES, sizeof(instrs_cycles), &instrs_cycles);
1756 }
1757 #endif /* CONFIG_PERVASIVE_CPI */
1758
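/*
 * Record the task's CPU type and subtype as reported by proc_archinfo_kdp().
 */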
1759 static kern_return_t
1760 kcdata_record_task_cpu_architecture(kcdata_descriptor_t kcd, task_t task)
1761 {
1762 struct stackshot_cpu_architecture cpu_architecture = {0};
1763 int32_t cputype;
1764 int32_t cpusubtype;
1765
1766 proc_archinfo_kdp(get_bsdtask_info(task), &cputype, &cpusubtype);
1767 cpu_architecture.cputype = cputype;
1768 cpu_architecture.cpusubtype = cpusubtype;
1769
1770 return kcdata_push_data(kcd, STACKSHOT_KCTYPE_TASK_CPU_ARCHITECTURE, sizeof(struct stackshot_cpu_architecture), &cpu_architecture);
1771 }
1772
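/*
 * Record code-signing flags for user tasks; the kernel task is skipped.
 * (The trust level is not yet populated.)
 */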
1773 static kern_return_t
1774 kcdata_record_task_codesigning_info(kcdata_descriptor_t kcd, task_t task)
1775 {
1776 struct stackshot_task_codesigning_info codesigning_info = {};
1777 void * bsdtask_info = NULL;
1778 if (task != kernel_task) {
1779 bsdtask_info = get_bsdtask_info(task);
1780 codesigning_info.csflags = proc_getcsflags_kdp(bsdtask_info);
1781 codesigning_info.cs_trust_level = 0; //TODO in rdar://102261763
1782 } else {
1783 return KERN_SUCCESS;
1784 }
1785 return kcdata_push_data(kcd, STACKSHOT_KCTYPE_CODESIGNING_INFO, sizeof(struct stackshot_task_codesigning_info), &codesigning_info);
1786 }
1787
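/*
 * Record a minimal snapshot for a task in transition (e.g. one being torn
 * down during exit): unique pid, snapshot flags, transition type, pid and
 * process name only.
 */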
1788 static kern_return_t
1789 kcdata_record_transitioning_task_snapshot(kcdata_descriptor_t kcd, task_t task, unaligned_u64 task_snap_ss_flags, uint64_t transition_type)
1790 {
1791 kern_return_t error = KERN_SUCCESS;
1792 mach_vm_address_t out_addr = 0;
1793 struct transitioning_task_snapshot * cur_tsnap = NULL;
1794
1795 int task_pid = pid_from_task(task);
1796 /* Is returning -1 ok for a terminating task? */
1797 uint64_t task_uniqueid = get_task_uniqueid(task);
1798
1799 if (task_pid && (task_did_exec_internal(task) || task_is_exec_copy_internal(task))) {
1800 /*
1801 * If this task is in transition from another task (e.g. an exec copy),
1802 * report the pid as negative.
1803 */
1804 task_pid = 0 - task_pid;
1805 }
1806
1807 /* the task_snapshot_v2 struct is large - avoid overflowing the stack */
1808 kcdata_compression_window_open(kcd);
1809 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_TRANSITIONING_TASK_SNAPSHOT, sizeof(struct transitioning_task_snapshot), &out_addr));
1810 cur_tsnap = (struct transitioning_task_snapshot *)out_addr;
1811 bzero(cur_tsnap, sizeof(*cur_tsnap));
1812
1813 cur_tsnap->tts_unique_pid = task_uniqueid;
1814 cur_tsnap->tts_ss_flags = kcdata_get_task_ss_flags(task);
1815 cur_tsnap->tts_ss_flags |= task_snap_ss_flags;
1816 cur_tsnap->tts_transition_type = transition_type;
1817 cur_tsnap->tts_pid = task_pid;
1818
1819 /* Add the BSD process identifiers */
1820 if (task_pid != -1 && get_bsdtask_info(task) != NULL) {
1821 proc_name_kdp(get_bsdtask_info(task), cur_tsnap->tts_p_comm, sizeof(cur_tsnap->tts_p_comm));
1822 } else {
1823 cur_tsnap->tts_p_comm[0] = '\0';
1824 }
1825
1826 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1827
1828 error_exit:
1829 return error;
1830 }
1831
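/*
 * Record a full task snapshot (task_snapshot_v2) along with related per-task
 * entries: jetsam coalition ID, CPU architecture and code-signing info, and,
 * depending on trace_flags, the ASID, page tables, I/O statistics and
 * instruction/cycle counts.
 */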
1832 static kern_return_t
1833 #if STACKSHOT_COLLECTS_LATENCY_INFO
1834 kcdata_record_task_snapshot(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 task_snap_ss_flags, struct stackshot_latency_task *latency_info)
1835 #else
1836 kcdata_record_task_snapshot(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 task_snap_ss_flags)
1837 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1838 {
1839 boolean_t collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
1840 boolean_t collect_iostats = !collect_delta_stackshot && !(trace_flags & STACKSHOT_NO_IO_STATS);
1841 #if CONFIG_PERVASIVE_CPI
1842 boolean_t collect_instrs_cycles = ((trace_flags & STACKSHOT_INSTRS_CYCLES) != 0);
1843 #endif /* CONFIG_PERVASIVE_CPI */
1844 #if __arm64__
1845 boolean_t collect_asid = ((trace_flags & STACKSHOT_ASID) != 0);
1846 #endif
1847 boolean_t collect_pagetables = ((trace_flags & STACKSHOT_PAGE_TABLES) != 0);
1848
1849
1850 kern_return_t error = KERN_SUCCESS;
1851 mach_vm_address_t out_addr = 0;
1852 struct task_snapshot_v2 * cur_tsnap = NULL;
1853 #if STACKSHOT_COLLECTS_LATENCY_INFO
1854 latency_info->cur_tsnap_latency = mach_absolute_time();
1855 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1856
1857 int task_pid = pid_from_task(task);
1858 uint64_t task_uniqueid = get_task_uniqueid(task);
1859 void *bsd_info = get_bsdtask_info(task);
1860 uint64_t proc_starttime_secs = 0;
1861
1862 if (task_pid && (task_did_exec_internal(task) || task_is_exec_copy_internal(task))) {
1863 /*
1864 * If this task is in transition from another task (e.g. an exec copy),
1865 * report the pid as negative.
1866 */
1867 task_pid = 0 - task_pid;
1868 }
1869
1870 /* the task_snapshot_v2 struct is large - avoid overflowing the stack */
1871 kcdata_compression_window_open(kcd);
1872 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_TASK_SNAPSHOT, sizeof(struct task_snapshot_v2), &out_addr));
1873 cur_tsnap = (struct task_snapshot_v2 *)out_addr;
1874 bzero(cur_tsnap, sizeof(*cur_tsnap));
1875
1876 cur_tsnap->ts_unique_pid = task_uniqueid;
1877 cur_tsnap->ts_ss_flags = kcdata_get_task_ss_flags(task);
1878 cur_tsnap->ts_ss_flags |= task_snap_ss_flags;
1879
1880 struct recount_usage term_usage = { 0 };
1881 recount_task_terminated_usage(task, &term_usage);
1882 cur_tsnap->ts_user_time_in_terminated_threads =
1883 term_usage.ru_user_time_mach;
1884 cur_tsnap->ts_system_time_in_terminated_threads =
1885 term_usage.ru_system_time_mach;
1886
1887 proc_starttime_kdp(bsd_info, &proc_starttime_secs, NULL, NULL);
1888 cur_tsnap->ts_p_start_sec = proc_starttime_secs;
1889 cur_tsnap->ts_task_size = have_pmap ? get_task_phys_footprint(task) : 0;
1890 cur_tsnap->ts_max_resident_size = get_task_resident_max(task);
1891 cur_tsnap->ts_was_throttled = (uint32_t) proc_was_throttled_from_task(task);
1892 cur_tsnap->ts_did_throttle = (uint32_t) proc_did_throttle_from_task(task);
1893
1894 cur_tsnap->ts_suspend_count = task->suspend_count;
1895 cur_tsnap->ts_faults = counter_load(&task->faults);
1896 cur_tsnap->ts_pageins = counter_load(&task->pageins);
1897 cur_tsnap->ts_cow_faults = counter_load(&task->cow_faults);
1898 cur_tsnap->ts_latency_qos = (task->effective_policy.tep_latency_qos == LATENCY_QOS_TIER_UNSPECIFIED) ?
1899 LATENCY_QOS_TIER_UNSPECIFIED : ((0xFF << 16) | task->effective_policy.tep_latency_qos);
1900 cur_tsnap->ts_pid = task_pid;
1901
1902 /* Add the BSD process identifiers */
1903 if (task_pid != -1 && bsd_info != NULL) {
1904 proc_name_kdp(bsd_info, cur_tsnap->ts_p_comm, sizeof(cur_tsnap->ts_p_comm));
1905 } else {
1906 cur_tsnap->ts_p_comm[0] = '\0';
1907 #if IMPORTANCE_INHERITANCE && (DEVELOPMENT || DEBUG)
1908 if (task->task_imp_base != NULL) {
1909 kdp_strlcpy(cur_tsnap->ts_p_comm, &task->task_imp_base->iit_procname[0],
1910 MIN((int)sizeof(task->task_imp_base->iit_procname), (int)sizeof(cur_tsnap->ts_p_comm)));
1911 }
1912 #endif /* IMPORTANCE_INHERITANCE && (DEVELOPMENT || DEBUG) */
1913 }
1914
1915 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1916
1917 #if CONFIG_COALITIONS
1918 if (task_pid != -1 && bsd_info != NULL &&
1919 (task->coalition[COALITION_TYPE_JETSAM] != NULL)) {
1920 /*
1921 * The jetsam coalition ID is always saved, even if
1922 * STACKSHOT_SAVE_JETSAM_COALITIONS is not set.
1923 */
1924 uint64_t jetsam_coal_id = coalition_id(task->coalition[COALITION_TYPE_JETSAM]);
1925 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_JETSAM_COALITION, sizeof(jetsam_coal_id), &jetsam_coal_id));
1926 }
1927 #endif /* CONFIG_COALITIONS */
1928
1929 #if __arm64__
1930 if (collect_asid && have_pmap) {
1931 uint32_t asid = PMAP_VASID(task->map->pmap);
1932 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_ASID, sizeof(asid), &asid));
1933 }
1934 #endif
1935
1936 #if STACKSHOT_COLLECTS_LATENCY_INFO
1937 latency_info->cur_tsnap_latency = mach_absolute_time() - latency_info->cur_tsnap_latency;
1938 latency_info->pmap_latency = mach_absolute_time();
1939 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1940
1941 if (collect_pagetables && have_pmap) {
1942 #if SCHED_HYGIENE_DEBUG
1943 // pagetable dumps can be large; reset the interrupt timeout to avoid a panic
1944 ml_spin_debug_clear_self();
1945 #endif
1946 size_t bytes_dumped = 0;
1947 error = pmap_dump_page_tables(task->map->pmap, kcd_end_address(kcd), kcd_max_address(kcd), stack_snapshot_pagetable_mask, &bytes_dumped);
1948 if (error != KERN_SUCCESS) {
1949 goto error_exit;
1950 } else {
1951 /* Variable size array - better not have it on the stack. */
1952 kcdata_compression_window_open(kcd);
1953 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, STACKSHOT_KCTYPE_PAGE_TABLES,
1954 sizeof(uint64_t), (uint32_t)(bytes_dumped / sizeof(uint64_t)), &out_addr));
1955 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1956 }
1957 }
1958
1959 #if STACKSHOT_COLLECTS_LATENCY_INFO
1960 latency_info->pmap_latency = mach_absolute_time() - latency_info->pmap_latency;
1961 latency_info->bsd_proc_ids_latency = mach_absolute_time();
1962 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1963
1964 #if STACKSHOT_COLLECTS_LATENCY_INFO
1965 latency_info->bsd_proc_ids_latency = mach_absolute_time() - latency_info->bsd_proc_ids_latency;
1966 latency_info->end_latency = mach_absolute_time();
1967 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1968
1969 if (collect_iostats) {
1970 kcd_exit_on_error(kcdata_record_task_iostats(kcd, task));
1971 }
1972
1973 #if CONFIG_PERVASIVE_CPI
1974 if (collect_instrs_cycles) {
1975 kcd_exit_on_error(kcdata_record_task_instrs_cycles(kcd, task));
1976 }
1977 #endif /* CONFIG_PERVASIVE_CPI */
1978
1979 kcd_exit_on_error(kcdata_record_task_cpu_architecture(kcd, task));
1980 kcd_exit_on_error(kcdata_record_task_codesigning_info(kcd, task));
1981
1982 #if STACKSHOT_COLLECTS_LATENCY_INFO
1983 latency_info->end_latency = mach_absolute_time() - latency_info->end_latency;
1984 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1985
1986 error_exit:
1987 return error;
1988 }
1989
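/*
 * Record a delta task snapshot (task_delta_snapshot_v2) for a task that has
 * not changed since the previous full stackshot; only the inexpensive,
 * frequently-updated counters are captured, plus the optional ASID and
 * instruction/cycle data.
 */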
1990 static kern_return_t
1991 kcdata_record_task_delta_snapshot(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 task_snap_ss_flags)
1992 {
1993 #if !CONFIG_PERVASIVE_CPI
1994 #pragma unused(trace_flags)
1995 #endif /* !CONFIG_PERVASIVE_CPI */
1996 kern_return_t error = KERN_SUCCESS;
1997 struct task_delta_snapshot_v2 * cur_tsnap = NULL;
1998 mach_vm_address_t out_addr = 0;
1999 (void) trace_flags;
2000 #if __arm64__
2001 boolean_t collect_asid = ((trace_flags & STACKSHOT_ASID) != 0);
2002 #endif
2003 #if CONFIG_PERVASIVE_CPI
2004 boolean_t collect_instrs_cycles = ((trace_flags & STACKSHOT_INSTRS_CYCLES) != 0);
2005 #endif /* CONFIG_PERVASIVE_CPI */
2006
2007 uint64_t task_uniqueid = get_task_uniqueid(task);
2008
2009 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_TASK_DELTA_SNAPSHOT, sizeof(struct task_delta_snapshot_v2), &out_addr));
2010
2011 cur_tsnap = (struct task_delta_snapshot_v2 *)out_addr;
2012
2013 cur_tsnap->tds_unique_pid = task_uniqueid;
2014 cur_tsnap->tds_ss_flags = kcdata_get_task_ss_flags(task);
2015 cur_tsnap->tds_ss_flags |= task_snap_ss_flags;
2016
2017 struct recount_usage usage = { 0 };
2018 recount_task_terminated_usage(task, &usage);
2019
2020 cur_tsnap->tds_user_time_in_terminated_threads = usage.ru_user_time_mach;
2021 cur_tsnap->tds_system_time_in_terminated_threads =
2022 usage.ru_system_time_mach;
2023
2024 cur_tsnap->tds_task_size = have_pmap ? get_task_phys_footprint(task) : 0;
2025
2026 cur_tsnap->tds_max_resident_size = get_task_resident_max(task);
2027 cur_tsnap->tds_suspend_count = task->suspend_count;
2028 cur_tsnap->tds_faults = counter_load(&task->faults);
2029 cur_tsnap->tds_pageins = counter_load(&task->pageins);
2030 cur_tsnap->tds_cow_faults = counter_load(&task->cow_faults);
2031 cur_tsnap->tds_was_throttled = (uint32_t)proc_was_throttled_from_task(task);
2032 cur_tsnap->tds_did_throttle = (uint32_t)proc_did_throttle_from_task(task);
2033 cur_tsnap->tds_latency_qos = (task->effective_policy.tep_latency_qos == LATENCY_QOS_TIER_UNSPECIFIED)
2034 ? LATENCY_QOS_TIER_UNSPECIFIED
2035 : ((0xFF << 16) | task->effective_policy.tep_latency_qos);
2036
2037 #if __arm64__
2038 if (collect_asid && have_pmap) {
2039 uint32_t asid = PMAP_VASID(task->map->pmap);
2040 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_ASID, sizeof(uint32_t), &out_addr));
2041 kdp_memcpy((void*)out_addr, &asid, sizeof(asid));
2042 }
2043 #endif
2044
2045 #if CONFIG_PERVASIVE_CPI
2046 if (collect_instrs_cycles) {
2047 kcd_exit_on_error(kcdata_record_task_instrs_cycles(kcd, task));
2048 }
2049 #endif /* CONFIG_PERVASIVE_CPI */
2050
2051 error_exit:
2052 return error;
2053 }
2054
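/*
 * Record per-thread I/O statistics, mirroring kcdata_record_task_iostats()
 * above but sourced from the thread's counters.
 */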
2055 static kern_return_t
2056 kcdata_record_thread_iostats(kcdata_descriptor_t kcd, thread_t thread)
2057 {
2058 kern_return_t error = KERN_SUCCESS;
2059 mach_vm_address_t out_addr = 0;
2060
2061 /* I/O Statistics */
2062 assert(IO_NUM_PRIORITIES == STACKSHOT_IO_NUM_PRIORITIES);
2063 if (thread->thread_io_stats && !memory_iszero(thread->thread_io_stats, sizeof(struct io_stat_info))) {
2064 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_IOSTATS, sizeof(struct io_stats_snapshot), &out_addr));
2065 struct io_stats_snapshot *_iostat = (struct io_stats_snapshot *)out_addr;
2066 _iostat->ss_disk_reads_count = thread->thread_io_stats->disk_reads.count;
2067 _iostat->ss_disk_reads_size = thread->thread_io_stats->disk_reads.size;
2068 _iostat->ss_disk_writes_count = (thread->thread_io_stats->total_io.count - thread->thread_io_stats->disk_reads.count);
2069 _iostat->ss_disk_writes_size = (thread->thread_io_stats->total_io.size - thread->thread_io_stats->disk_reads.size);
2070 _iostat->ss_paging_count = thread->thread_io_stats->paging.count;
2071 _iostat->ss_paging_size = thread->thread_io_stats->paging.size;
2072 _iostat->ss_non_paging_count = (thread->thread_io_stats->total_io.count - thread->thread_io_stats->paging.count);
2073 _iostat->ss_non_paging_size = (thread->thread_io_stats->total_io.size - thread->thread_io_stats->paging.size);
2074 _iostat->ss_metadata_count = thread->thread_io_stats->metadata.count;
2075 _iostat->ss_metadata_size = thread->thread_io_stats->metadata.size;
2076 _iostat->ss_data_count = (thread->thread_io_stats->total_io.count - thread->thread_io_stats->metadata.count);
2077 _iostat->ss_data_size = (thread->thread_io_stats->total_io.size - thread->thread_io_stats->metadata.size);
2078 for (int i = 0; i < IO_NUM_PRIORITIES; i++) {
2079 _iostat->ss_io_priority_count[i] = thread->thread_io_stats->io_priority[i].count;
2080 _iostat->ss_io_priority_size[i] = thread->thread_io_stats->io_priority[i].size;
2081 }
2082 }
2083
2084 error_exit:
2085 return error;
2086 }
2087
2088 bool
2089 machine_trace_thread_validate_kva(vm_offset_t addr)
2090 {
2091 return _stackshot_validate_kva(addr, sizeof(uintptr_t));
2092 }
2093
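/*
 * Per-walk context for user stack backtraces: remembers the last user page
 * translated (and its kernel virtual address) so consecutive frame reads on
 * the same page skip the physical lookup, and accumulates truncation/fault
 * flags to merge into the thread snapshot.
 */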
2094 struct _stackshot_backtrace_context {
2095 vm_map_t sbc_map;
2096 vm_offset_t sbc_prev_page;
2097 vm_offset_t sbc_prev_kva;
2098 uint32_t sbc_flags;
2099 bool sbc_allow_faulting;
2100 };
2101
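/*
 * User-memory copy callback used by backtrace_user(): translates the source
 * address with stackshot_find_phys() (faulting only if allowed), reuses the
 * cached translation when the read stays on the previously-touched page, and
 * folds any fault results into the per-thread backtrace flags.
 */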
2102 static errno_t
2103 _stackshot_backtrace_copy(void *vctx, void *dst, user_addr_t src, size_t size)
2104 {
2105 struct _stackshot_backtrace_context *ctx = vctx;
2106 size_t map_page_mask = 0;
2107 size_t __assert_only map_page_size = kdp_vm_map_get_page_size(ctx->sbc_map,
2108 &map_page_mask);
2109 assert(size < map_page_size);
2110 if (src & (size - 1)) {
2111 // The source should be aligned to the size passed in, like a stack
2112 // frame or word.
2113 return EINVAL;
2114 }
2115
2116 vm_offset_t src_page = src & ~map_page_mask;
2117 vm_offset_t src_kva = 0;
2118
2119 if (src_page != ctx->sbc_prev_page) {
2120 uint32_t res = 0;
2121 uint32_t flags = 0;
2122 vm_offset_t src_pa = stackshot_find_phys(ctx->sbc_map, src,
2123 ctx->sbc_allow_faulting, &res);
2124
2125 flags |= (res & KDP_FAULT_RESULT_PAGED_OUT) ? kThreadTruncatedBT : 0;
2126 flags |= (res & KDP_FAULT_RESULT_TRIED_FAULT) ? kThreadTriedFaultBT : 0;
2127 flags |= (res & KDP_FAULT_RESULT_FAULTED_IN) ? kThreadFaultedBT : 0;
2128 ctx->sbc_flags |= flags;
2129 if (src_pa == 0) {
2130 return EFAULT;
2131 }
2132
2133 src_kva = phystokv(src_pa);
2134 ctx->sbc_prev_page = src_page;
2135 ctx->sbc_prev_kva = (src_kva & ~map_page_mask);
2136 } else {
2137 src_kva = ctx->sbc_prev_kva + (src & map_page_mask);
2138 }
2139
2140 #if KASAN
2141 /*
2142 * KASan does not monitor accesses to userspace pages. Therefore, it is
2143 * pointless to maintain a shadow map for them. Instead, they are all
2144 * mapped to a single, always valid shadow map page. This approach saves
2145 * a considerable amount of shadow map pages which are limited and
2146 * precious.
2147 */
2148 kasan_notify_address_nopoison(src_kva, size);
2149 #endif
2150 memcpy(dst, (const void *)src_kva, size);
2151
2152 return 0;
2153 }
2154
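/*
 * Record a full thread snapshot: scheduling state and policies, dispatch
 * queue serial number and label (if requested), CPU times, the user stack
 * backtrace (plus the async stack on 64-bit), the kernel stack backtrace,
 * and optional thread group, I/O statistics and instruction/cycle data.
 */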
2155 static kern_return_t
2156 kcdata_record_thread_snapshot(
2157 kcdata_descriptor_t kcd, thread_t thread, task_t task, uint64_t trace_flags, boolean_t have_pmap, boolean_t thread_on_core)
2158 {
2159 boolean_t dispatch_p = ((trace_flags & STACKSHOT_GET_DQ) != 0);
2160 boolean_t active_kthreads_only_p = ((trace_flags & STACKSHOT_ACTIVE_KERNEL_THREADS_ONLY) != 0);
2161 boolean_t collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
2162 boolean_t collect_iostats = !collect_delta_stackshot && !(trace_flags & STACKSHOT_NO_IO_STATS);
2163 #if CONFIG_PERVASIVE_CPI
2164 boolean_t collect_instrs_cycles = ((trace_flags & STACKSHOT_INSTRS_CYCLES) != 0);
2165 #endif /* CONFIG_PERVASIVE_CPI */
2166 kern_return_t error = KERN_SUCCESS;
2167
2168 #if STACKSHOT_COLLECTS_LATENCY_INFO
2169 struct stackshot_latency_thread latency_info;
2170 latency_info.cur_thsnap1_latency = mach_absolute_time();
2171 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2172
2173 mach_vm_address_t out_addr = 0;
2174 int saved_count = 0;
2175
2176 struct thread_snapshot_v4 * cur_thread_snap = NULL;
2177 char cur_thread_name[STACKSHOT_MAX_THREAD_NAME_SIZE];
2178
2179 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_SNAPSHOT, sizeof(struct thread_snapshot_v4), &out_addr));
2180 cur_thread_snap = (struct thread_snapshot_v4 *)out_addr;
2181
2182 /* Populate the thread snapshot header */
2183 cur_thread_snap->ths_ss_flags = 0;
2184 cur_thread_snap->ths_thread_id = thread_tid(thread);
2185 cur_thread_snap->ths_wait_event = VM_KERNEL_UNSLIDE_OR_PERM(thread->wait_event);
2186 cur_thread_snap->ths_continuation = VM_KERNEL_UNSLIDE(thread->continuation);
2187 cur_thread_snap->ths_total_syscalls = thread->syscalls_mach + thread->syscalls_unix;
2188
2189 if (IPC_VOUCHER_NULL != thread->ith_voucher) {
2190 cur_thread_snap->ths_voucher_identifier = VM_KERNEL_ADDRPERM(thread->ith_voucher);
2191 } else {
2192 cur_thread_snap->ths_voucher_identifier = 0;
2193 }
2194
2195 #if STACKSHOT_COLLECTS_LATENCY_INFO
2196 latency_info.cur_thsnap1_latency = mach_absolute_time() - latency_info.cur_thsnap1_latency;
2197 latency_info.dispatch_serial_latency = mach_absolute_time();
2198 latency_info.dispatch_label_latency = 0;
2199 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2200
2201 cur_thread_snap->ths_dqserialnum = 0;
2202 if (dispatch_p && (task != kernel_task) && (task->active) && have_pmap) {
2203 uint64_t dqkeyaddr = thread_dispatchqaddr(thread);
2204 if (dqkeyaddr != 0) {
2205 uint64_t dqaddr = 0;
2206 boolean_t copyin_ok = stackshot_copyin_word(task, dqkeyaddr, &dqaddr, FALSE, NULL);
2207 if (copyin_ok && dqaddr != 0) {
2208 uint64_t dqserialnumaddr = dqaddr + get_task_dispatchqueue_serialno_offset(task);
2209 uint64_t dqserialnum = 0;
2210 copyin_ok = stackshot_copyin_word(task, dqserialnumaddr, &dqserialnum, FALSE, NULL);
2211 if (copyin_ok) {
2212 cur_thread_snap->ths_ss_flags |= kHasDispatchSerial;
2213 cur_thread_snap->ths_dqserialnum = dqserialnum;
2214 }
2215
2216 #if STACKSHOT_COLLECTS_LATENCY_INFO
2217 latency_info.dispatch_serial_latency = mach_absolute_time() - latency_info.dispatch_serial_latency;
2218 latency_info.dispatch_label_latency = mach_absolute_time();
2219 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2220
2221 /* try copying in the queue label */
2222 uint64_t label_offs = get_task_dispatchqueue_label_offset(task);
2223 if (label_offs) {
2224 uint64_t dqlabeladdr = dqaddr + label_offs;
2225 uint64_t actual_dqlabeladdr = 0;
2226
2227 copyin_ok = stackshot_copyin_word(task, dqlabeladdr, &actual_dqlabeladdr, FALSE, NULL);
2228 if (copyin_ok && actual_dqlabeladdr != 0) {
2229 char label_buf[STACKSHOT_QUEUE_LABEL_MAXSIZE];
2230 int len;
2231
2232 bzero(label_buf, STACKSHOT_QUEUE_LABEL_MAXSIZE * sizeof(char));
2233 len = stackshot_copyin_string(task, actual_dqlabeladdr, label_buf, STACKSHOT_QUEUE_LABEL_MAXSIZE, FALSE, NULL);
2234 if (len > 0) {
2235 mach_vm_address_t label_addr = 0;
2236 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_DISPATCH_QUEUE_LABEL, len, &label_addr));
2237 kdp_strlcpy((char*)label_addr, &label_buf[0], len);
2238 }
2239 }
2240 }
2241 #if STACKSHOT_COLLECTS_LATENCY_INFO
2242 latency_info.dispatch_label_latency = mach_absolute_time() - latency_info.dispatch_label_latency;
2243 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2244 }
2245 }
2246 }
2247
2248 #if STACKSHOT_COLLECTS_LATENCY_INFO
2249 if ((cur_thread_snap->ths_ss_flags & kHasDispatchSerial) == 0) {
2250 latency_info.dispatch_serial_latency = 0;
2251 }
2252 latency_info.cur_thsnap2_latency = mach_absolute_time();
2253 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2254
2255 struct recount_times_mach times = recount_thread_times(thread);
2256 cur_thread_snap->ths_user_time = times.rtm_user;
2257 cur_thread_snap->ths_sys_time = times.rtm_system;
2258
2259 if (thread->thread_tag & THREAD_TAG_MAINTHREAD) {
2260 cur_thread_snap->ths_ss_flags |= kThreadMain;
2261 }
2262 if (thread->effective_policy.thep_darwinbg) {
2263 cur_thread_snap->ths_ss_flags |= kThreadDarwinBG;
2264 }
2265 if (proc_get_effective_thread_policy(thread, TASK_POLICY_PASSIVE_IO)) {
2266 cur_thread_snap->ths_ss_flags |= kThreadIOPassive;
2267 }
2268 if (thread->suspend_count > 0) {
2269 cur_thread_snap->ths_ss_flags |= kThreadSuspended;
2270 }
2271 if (thread->options & TH_OPT_GLOBAL_FORCED_IDLE) {
2272 cur_thread_snap->ths_ss_flags |= kGlobalForcedIdle;
2273 }
2274 if (thread_on_core) {
2275 cur_thread_snap->ths_ss_flags |= kThreadOnCore;
2276 }
2277 if (stackshot_thread_is_idle_worker_unsafe(thread)) {
2278 cur_thread_snap->ths_ss_flags |= kThreadIdleWorker;
2279 }
2280
2281 /* make sure state flags defined in kcdata.h still match internal flags */
2282 static_assert(SS_TH_WAIT == TH_WAIT);
2283 static_assert(SS_TH_SUSP == TH_SUSP);
2284 static_assert(SS_TH_RUN == TH_RUN);
2285 static_assert(SS_TH_UNINT == TH_UNINT);
2286 static_assert(SS_TH_TERMINATE == TH_TERMINATE);
2287 static_assert(SS_TH_TERMINATE2 == TH_TERMINATE2);
2288 static_assert(SS_TH_IDLE == TH_IDLE);
2289
2290 cur_thread_snap->ths_last_run_time = thread->last_run_time;
2291 cur_thread_snap->ths_last_made_runnable_time = thread->last_made_runnable_time;
2292 cur_thread_snap->ths_state = thread->state;
2293 cur_thread_snap->ths_sched_flags = thread->sched_flags;
2294 cur_thread_snap->ths_base_priority = thread->base_pri;
2295 cur_thread_snap->ths_sched_priority = thread->sched_pri;
2296 cur_thread_snap->ths_eqos = thread->effective_policy.thep_qos;
2297 cur_thread_snap->ths_rqos = thread->requested_policy.thrp_qos;
2298 cur_thread_snap->ths_rqos_override = MAX(thread->requested_policy.thrp_qos_override,
2299 thread->requested_policy.thrp_qos_workq_override);
2300 cur_thread_snap->ths_io_tier = (uint8_t) proc_get_effective_thread_policy(thread, TASK_POLICY_IO);
2301 cur_thread_snap->ths_thread_t = VM_KERNEL_UNSLIDE_OR_PERM(thread);
2302
2303 static_assert(sizeof(thread->effective_policy) == sizeof(uint64_t));
2304 static_assert(sizeof(thread->requested_policy) == sizeof(uint64_t));
2305 cur_thread_snap->ths_requested_policy = *(unaligned_u64 *) &thread->requested_policy;
2306 cur_thread_snap->ths_effective_policy = *(unaligned_u64 *) &thread->effective_policy;
2307
2308 #if STACKSHOT_COLLECTS_LATENCY_INFO
2309 latency_info.cur_thsnap2_latency = mach_absolute_time() - latency_info.cur_thsnap2_latency;
2310 latency_info.thread_name_latency = mach_absolute_time();
2311 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2312
2313 /* if there is thread name then add to buffer */
2314 cur_thread_name[0] = '\0';
2315 proc_threadname_kdp(get_bsdthread_info(thread), cur_thread_name, STACKSHOT_MAX_THREAD_NAME_SIZE);
2316 if (strnlen(cur_thread_name, STACKSHOT_MAX_THREAD_NAME_SIZE) > 0) {
2317 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_NAME, sizeof(cur_thread_name), &out_addr));
2318 kdp_memcpy((void *)out_addr, (void *)cur_thread_name, sizeof(cur_thread_name));
2319 }
2320
2321 #if STACKSHOT_COLLECTS_LATENCY_INFO
2322 latency_info.thread_name_latency = mach_absolute_time() - latency_info.thread_name_latency;
2323 latency_info.sur_times_latency = mach_absolute_time();
2324 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2325
2326 /* record system, user, and runnable times */
2327 time_value_t runnable_time;
2328 thread_read_times(thread, NULL, NULL, &runnable_time);
2329 clock_sec_t user_sec = 0, system_sec = 0;
2330 clock_usec_t user_usec = 0, system_usec = 0;
2331 absolutetime_to_microtime(times.rtm_user, &user_sec, &user_usec);
2332 absolutetime_to_microtime(times.rtm_system, &system_sec, &system_usec);
2333
2334 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_CPU_TIMES, sizeof(struct stackshot_cpu_times_v2), &out_addr));
2335 struct stackshot_cpu_times_v2 *stackshot_cpu_times = (struct stackshot_cpu_times_v2 *)out_addr;
2336 *stackshot_cpu_times = (struct stackshot_cpu_times_v2){
2337 .user_usec = user_sec * USEC_PER_SEC + user_usec,
2338 .system_usec = system_sec * USEC_PER_SEC + system_usec,
2339 .runnable_usec = (uint64_t)runnable_time.seconds * USEC_PER_SEC + runnable_time.microseconds,
2340 };
2341
2342 #if STACKSHOT_COLLECTS_LATENCY_INFO
2343 latency_info.sur_times_latency = mach_absolute_time() - latency_info.sur_times_latency;
2344 latency_info.user_stack_latency = mach_absolute_time();
2345 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2346
2347 /* Trace user stack, if any */
2348 if (!active_kthreads_only_p && task->active && task->map != kernel_map) {
2349 uint32_t user_ths_ss_flags = 0;
2350
2351 /*
2352 * This relies on knowing that the "end" address points to the start of the
2353 * next element's data and, in the case of arrays, the elements themselves.
2354 */
2355 out_addr = (mach_vm_address_t)kcd_end_address(kcd);
2356 mach_vm_address_t max_addr = (mach_vm_address_t)kcd_max_address(kcd);
2357 assert(out_addr <= max_addr);
2358 size_t avail_frames = (max_addr - out_addr) / sizeof(uintptr_t);
2359 size_t max_frames = MIN(avail_frames, MAX_FRAMES);
2360 if (max_frames == 0) {
2361 error = KERN_RESOURCE_SHORTAGE;
2362 goto error_exit;
2363 }
2364 struct _stackshot_backtrace_context ctx = {
2365 .sbc_map = task->map,
2366 .sbc_allow_faulting = stack_enable_faulting,
2367 .sbc_prev_page = -1,
2368 .sbc_prev_kva = -1,
2369 };
2370 struct backtrace_control ctl = {
2371 .btc_user_thread = thread,
2372 .btc_user_copy = _stackshot_backtrace_copy,
2373 .btc_user_copy_context = &ctx,
2374 };
2375 struct backtrace_user_info info = BTUINFO_INIT;
2376
2377 saved_count = backtrace_user((uintptr_t *)out_addr, max_frames, &ctl,
2378 &info);
2379 if (saved_count > 0) {
2380 #if __LP64__
2381 #define STACKLR_WORDS STACKSHOT_KCTYPE_USER_STACKLR64
2382 #else // __LP64__
2383 #define STACKLR_WORDS STACKSHOT_KCTYPE_USER_STACKLR
2384 #endif // !__LP64__
2385 mach_vm_address_t out_addr_array;
2386 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd,
2387 STACKLR_WORDS, sizeof(uintptr_t), saved_count,
2388 &out_addr_array));
2389 /*
2390 * Ensure the kcd_end_address (above) trick worked.
2391 */
2392 assert(out_addr == out_addr_array);
2393 if (info.btui_info & BTI_64_BIT) {
2394 user_ths_ss_flags |= kUser64_p;
2395 }
2396 if ((info.btui_info & BTI_TRUNCATED) ||
2397 (ctx.sbc_flags & kThreadTruncatedBT)) {
2398 user_ths_ss_flags |= kThreadTruncatedBT;
2399 user_ths_ss_flags |= kThreadTruncUserBT;
2400 }
2401 user_ths_ss_flags |= ctx.sbc_flags;
2402 ctx.sbc_flags = 0;
2403 #if __LP64__
2404 /* We only support async stacks on 64-bit kernels */
2405 if (info.btui_async_frame_addr != 0) {
2406 uint32_t async_start_offset = info.btui_async_start_index;
2407 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_USER_ASYNC_START_INDEX,
2408 sizeof(async_start_offset), &async_start_offset));
2409 out_addr = (mach_vm_address_t)kcd_end_address(kcd);
2410 assert(out_addr <= max_addr);
2411
2412 avail_frames = (max_addr - out_addr) / sizeof(uintptr_t);
2413 max_frames = MIN(avail_frames, MAX_FRAMES);
2414 if (max_frames == 0) {
2415 error = KERN_RESOURCE_SHORTAGE;
2416 goto error_exit;
2417 }
2418 ctl.btc_frame_addr = info.btui_async_frame_addr;
2419 ctl.btc_addr_offset = BTCTL_ASYNC_ADDR_OFFSET;
2420 info = BTUINFO_INIT;
2421 unsigned int async_count = backtrace_user((uintptr_t *)out_addr, max_frames, &ctl,
2422 &info);
2423 if (async_count > 0) {
2424 mach_vm_address_t async_out_addr;
2425 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd,
2426 STACKSHOT_KCTYPE_USER_ASYNC_STACKLR64, sizeof(uintptr_t), async_count,
2427 &async_out_addr));
2428 /*
2429 * Ensure the kcd_end_address (above) trick worked.
2430 */
2431 assert(out_addr == async_out_addr);
2432 if ((info.btui_info & BTI_TRUNCATED) ||
2433 (ctx.sbc_flags & kThreadTruncatedBT)) {
2434 user_ths_ss_flags |= kThreadTruncatedBT;
2435 user_ths_ss_flags |= kThreadTruncUserAsyncBT;
2436 }
2437 user_ths_ss_flags |= ctx.sbc_flags;
2438 }
2439 }
2440 #endif /* __LP64__ */
2441 }
2442 if (user_ths_ss_flags != 0) {
2443 cur_thread_snap->ths_ss_flags |= user_ths_ss_flags;
2444 }
2445 }
2446
2447 #if STACKSHOT_COLLECTS_LATENCY_INFO
2448 latency_info.user_stack_latency = mach_absolute_time() - latency_info.user_stack_latency;
2449 latency_info.kernel_stack_latency = mach_absolute_time();
2450 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2451
2452 /* Call through to the machine specific trace routines
2453 * Frames are added past the snapshot header.
2454 */
2455 if (thread->kernel_stack != 0) {
2456 uint32_t kern_ths_ss_flags = 0;
2457 out_addr = (mach_vm_address_t)kcd_end_address(kcd);
2458 #if defined(__LP64__)
2459 uint32_t stack_kcdata_type = STACKSHOT_KCTYPE_KERN_STACKLR64;
2460 extern int machine_trace_thread64(thread_t thread, char *tracepos,
2461 char *tracebound, int nframes, uint32_t *thread_trace_flags);
2462 saved_count = machine_trace_thread64(
2463 #else
2464 uint32_t stack_kcdata_type = STACKSHOT_KCTYPE_KERN_STACKLR;
2465 extern int machine_trace_thread(thread_t thread, char *tracepos,
2466 char *tracebound, int nframes, uint32_t *thread_trace_flags);
2467 saved_count = machine_trace_thread(
2468 #endif
2469 thread, (char *)out_addr, (char *)kcd_max_address(kcd), MAX_FRAMES,
2470 &kern_ths_ss_flags);
2471 if (saved_count > 0) {
2472 int frame_size = sizeof(uintptr_t);
2473 #if defined(__LP64__)
2474 cur_thread_snap->ths_ss_flags |= kKernel64_p;
2475 #endif
2476 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, stack_kcdata_type,
2477 frame_size, saved_count / frame_size, &out_addr));
2478 }
2479 if (kern_ths_ss_flags & kThreadTruncatedBT) {
2480 kern_ths_ss_flags |= kThreadTruncKernBT;
2481 }
2482 if (kern_ths_ss_flags != 0) {
2483 cur_thread_snap->ths_ss_flags |= kern_ths_ss_flags;
2484 }
2485 }
2486
2487 #if STACKSHOT_COLLECTS_LATENCY_INFO
2488 latency_info.kernel_stack_latency = mach_absolute_time() - latency_info.kernel_stack_latency;
2489 latency_info.misc_latency = mach_absolute_time();
2490 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2491
2492 #if CONFIG_THREAD_GROUPS
2493 if (trace_flags & STACKSHOT_THREAD_GROUP) {
2494 uint64_t thread_group_id = thread->thread_group ? thread_group_get_id(thread->thread_group) : 0;
2495 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_GROUP, sizeof(thread_group_id), &out_addr));
2496 kdp_memcpy((void*)out_addr, &thread_group_id, sizeof(uint64_t));
2497 }
2498 #endif /* CONFIG_THREAD_GROUPS */
2499
2500 if (collect_iostats) {
2501 kcd_exit_on_error(kcdata_record_thread_iostats(kcd, thread));
2502 }
2503
2504 #if CONFIG_PERVASIVE_CPI
2505 if (collect_instrs_cycles) {
2506 struct recount_usage usage = { 0 };
2507 recount_sum_unsafe(&recount_thread_plan, thread->th_recount.rth_lifetime,
2508 &usage);
2509
2510 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_INSTRS_CYCLES, sizeof(struct instrs_cycles_snapshot), &out_addr));
2511 struct instrs_cycles_snapshot *instrs_cycles = (struct instrs_cycles_snapshot *)out_addr;
2512 instrs_cycles->ics_instructions = usage.ru_instructions;
2513 instrs_cycles->ics_cycles = usage.ru_cycles;
2514 }
2515 #endif /* CONFIG_PERVASIVE_CPI */
2516
2517 #if STACKSHOT_COLLECTS_LATENCY_INFO
2518 latency_info.misc_latency = mach_absolute_time() - latency_info.misc_latency;
2519 if (collect_latency_info) {
2520 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_LATENCY_INFO_THREAD, sizeof(latency_info), &latency_info));
2521 }
2522 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2523
2524 error_exit:
2525 return error;
2526 }
2527
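/*
 * Fill in a delta thread snapshot in place. Unlike the full snapshot, this
 * records only identifiers, flags, scheduling state and policies; stacks,
 * names, CPU times and dispatch queue information are not recorded.
 */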
2528 static int
2529 kcdata_record_thread_delta_snapshot(struct thread_delta_snapshot_v3 * cur_thread_snap, thread_t thread, boolean_t thread_on_core)
2530 {
2531 cur_thread_snap->tds_thread_id = thread_tid(thread);
2532 if (IPC_VOUCHER_NULL != thread->ith_voucher) {
2533 cur_thread_snap->tds_voucher_identifier = VM_KERNEL_ADDRPERM(thread->ith_voucher);
2534 } else {
2535 cur_thread_snap->tds_voucher_identifier = 0;
2536 }
2537
2538 cur_thread_snap->tds_ss_flags = 0;
2539 if (thread->effective_policy.thep_darwinbg) {
2540 cur_thread_snap->tds_ss_flags |= kThreadDarwinBG;
2541 }
2542 if (proc_get_effective_thread_policy(thread, TASK_POLICY_PASSIVE_IO)) {
2543 cur_thread_snap->tds_ss_flags |= kThreadIOPassive;
2544 }
2545 if (thread->suspend_count > 0) {
2546 cur_thread_snap->tds_ss_flags |= kThreadSuspended;
2547 }
2548 if (thread->options & TH_OPT_GLOBAL_FORCED_IDLE) {
2549 cur_thread_snap->tds_ss_flags |= kGlobalForcedIdle;
2550 }
2551 if (thread_on_core) {
2552 cur_thread_snap->tds_ss_flags |= kThreadOnCore;
2553 }
2554 if (stackshot_thread_is_idle_worker_unsafe(thread)) {
2555 cur_thread_snap->tds_ss_flags |= kThreadIdleWorker;
2556 }
2557
2558 cur_thread_snap->tds_last_made_runnable_time = thread->last_made_runnable_time;
2559 cur_thread_snap->tds_state = thread->state;
2560 cur_thread_snap->tds_sched_flags = thread->sched_flags;
2561 cur_thread_snap->tds_base_priority = thread->base_pri;
2562 cur_thread_snap->tds_sched_priority = thread->sched_pri;
2563 cur_thread_snap->tds_eqos = thread->effective_policy.thep_qos;
2564 cur_thread_snap->tds_rqos = thread->requested_policy.thrp_qos;
2565 cur_thread_snap->tds_rqos_override = MAX(thread->requested_policy.thrp_qos_override,
2566 thread->requested_policy.thrp_qos_workq_override);
2567 cur_thread_snap->tds_io_tier = (uint8_t) proc_get_effective_thread_policy(thread, TASK_POLICY_IO);
2568
2569 static_assert(sizeof(thread->effective_policy) == sizeof(uint64_t));
2570 static_assert(sizeof(thread->requested_policy) == sizeof(uint64_t));
2571 cur_thread_snap->tds_requested_policy = *(unaligned_u64 *) &thread->requested_policy;
2572 cur_thread_snap->tds_effective_policy = *(unaligned_u64 *) &thread->effective_policy;
2573
2574 return 0;
2575 }
2576
2577 /*
2578 * Why 12? 12 strikes a decent balance between allocating a large array on
2579 * the stack and having large kcdata item overheads for recording nonrunnable
2580 * tasks.
2581 */
2582 #define UNIQUEIDSPERFLUSH 12
2583
2584 struct saved_uniqueids {
2585 uint64_t ids[UNIQUEIDSPERFLUSH];
2586 unsigned count;
2587 };
2588
2589 enum thread_classification {
2590 tc_full_snapshot, /* take a full snapshot */
2591 tc_delta_snapshot, /* take a delta snapshot */
2592 };
2593
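/*
 * Decide whether a thread needs a full or a delta snapshot. For delta
 * stackshots, only threads that are on-core (idle threads are always treated
 * as on-core) or that have run since the previous full stackshot get a full
 * snapshot; everything else gets a delta snapshot.
 */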
2594 static enum thread_classification
2595 classify_thread(thread_t thread, boolean_t * thread_on_core_p, boolean_t collect_delta_stackshot)
2596 {
2597 processor_t last_processor = thread->last_processor;
2598
2599 boolean_t thread_on_core = FALSE;
2600 if (last_processor != PROCESSOR_NULL) {
2601 /* Idle threads are always treated as on-core, since the processor state can change while they are running. */
2602 thread_on_core = (thread == last_processor->idle_thread) ||
2603 ((last_processor->state == PROCESSOR_SHUTDOWN || last_processor->state == PROCESSOR_RUNNING) &&
2604 last_processor->active_thread == thread);
2605 }
2606
2607 *thread_on_core_p = thread_on_core;
2608
2609 /* Capture the full thread snapshot if this is not a delta stackshot or if the thread has run subsequent to the
2610 * previous full stackshot */
2611 if (!collect_delta_stackshot || thread_on_core || (thread->last_run_time > stack_snapshot_delta_since_timestamp)) {
2612 return tc_full_snapshot;
2613 } else {
2614 return tc_delta_snapshot;
2615 }
2616 }
2617
2618 struct stackshot_context {
2619 int pid;
2620 uint64_t trace_flags;
2621 bool include_drivers;
2622 };
2623
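/*
 * Record a single task's portion of the stackshot: shared cache and UUID load
 * info and a full task snapshot (or a transitioning-task / delta snapshot as
 * appropriate), followed by a full or delta snapshot for each of its threads
 * and wait/turnstile ownership information for threads that have it.
 */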
2624 static kern_return_t
2625 kdp_stackshot_record_task(struct stackshot_context *ctx, task_t task)
2626 {
2627 boolean_t active_kthreads_only_p = ((ctx->trace_flags & STACKSHOT_ACTIVE_KERNEL_THREADS_ONLY) != 0);
2628 boolean_t save_donating_pids_p = ((ctx->trace_flags & STACKSHOT_SAVE_IMP_DONATION_PIDS) != 0);
2629 boolean_t collect_delta_stackshot = ((ctx->trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
2630 boolean_t save_owner_info = ((ctx->trace_flags & STACKSHOT_THREAD_WAITINFO) != 0);
2631
2632 kern_return_t error = KERN_SUCCESS;
2633 mach_vm_address_t out_addr = 0;
2634 int saved_count = 0;
2635
2636 int task_pid = 0;
2637 uint64_t task_uniqueid = 0;
2638 int num_delta_thread_snapshots = 0;
2639 int num_waitinfo_threads = 0;
2640 int num_turnstileinfo_threads = 0;
2641
2642 uint64_t task_start_abstime = 0;
2643 boolean_t have_map = FALSE, have_pmap = FALSE;
2644 boolean_t some_thread_ran = FALSE;
2645 unaligned_u64 task_snap_ss_flags = 0;
2646 #if STACKSHOT_COLLECTS_LATENCY_INFO
2647 struct stackshot_latency_task latency_info;
2648 latency_info.setup_latency = mach_absolute_time();
2649 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2650
2651 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
2652 uint64_t task_begin_cpu_cycle_count = 0;
2653 if (!panic_stackshot) {
2654 task_begin_cpu_cycle_count = mt_cur_cpu_cycles();
2655 }
2656 #endif
2657
2658 if ((task == NULL) || !_stackshot_validate_kva((vm_offset_t)task, sizeof(struct task))) {
2659 error = KERN_FAILURE;
2660 goto error_exit;
2661 }
2662
2663 void *bsd_info = get_bsdtask_info(task);
2664 boolean_t task_in_teardown = (bsd_info == NULL) || proc_in_teardown(bsd_info); /* has P_LPEXIT set during proc_exit() */
2665 boolean_t task_in_transition = task_in_teardown; // here we can add other types of transition.
2666 uint32_t container_type = (task_in_transition) ? STACKSHOT_KCCONTAINER_TRANSITIONING_TASK : STACKSHOT_KCCONTAINER_TASK;
2667 uint32_t transition_type = (task_in_teardown) ? kTaskIsTerminated : 0;
2668
2669 if (task_in_transition) {
2670 collect_delta_stackshot = FALSE;
2671 }
2672
2673 have_map = (task->map != NULL) && (_stackshot_validate_kva((vm_offset_t)(task->map), sizeof(struct _vm_map)));
2674 have_pmap = have_map && (task->map->pmap != NULL) && (_stackshot_validate_kva((vm_offset_t)(task->map->pmap), sizeof(struct pmap)));
2675
2676 task_pid = pid_from_task(task);
2677 /* Is returning -1 ok for a terminating task? */
2678 task_uniqueid = get_task_uniqueid(task);
2679
2680 if (!task->active || task_is_a_corpse(task) || task_is_a_corpse_fork(task)) {
2681 /*
2682 * Not interested in terminated tasks without threads.
2683 */
2684 if (queue_empty(&task->threads) || task_pid == -1) {
2685 return KERN_SUCCESS;
2686 }
2687 }
2688
2689 /* All PIDs should have the MSB unset */
2690 assert((task_pid & (1ULL << 31)) == 0);
2691
2692 #if STACKSHOT_COLLECTS_LATENCY_INFO
2693 latency_info.setup_latency = mach_absolute_time() - latency_info.setup_latency;
2694 latency_info.task_uniqueid = task_uniqueid;
2695 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2696
2697 /* Trace everything, unless a process was specified. Add in driver tasks if requested. */
2698 if ((ctx->pid == -1) || (ctx->pid == task_pid) || (ctx->include_drivers && task_is_driver(task))) {
2699 /* add task snapshot marker */
2700 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_BEGIN,
2701 container_type, task_uniqueid));
2702
2703 if (collect_delta_stackshot) {
2704 /*
2705 * For delta stackshots we need to know if a thread from this task has run since the
2706 * previous timestamp to decide whether we're going to record a full snapshot and UUID info.
2707 */
2708 thread_t thread = THREAD_NULL;
2709 queue_iterate(&task->threads, thread, thread_t, task_threads)
2710 {
2711 if ((thread == NULL) || !_stackshot_validate_kva((vm_offset_t)thread, sizeof(struct thread))) {
2712 error = KERN_FAILURE;
2713 goto error_exit;
2714 }
2715
2716 if (active_kthreads_only_p && thread->kernel_stack == 0) {
2717 continue;
2718 }
2719
2720 boolean_t thread_on_core;
2721 enum thread_classification thread_classification = classify_thread(thread, &thread_on_core, collect_delta_stackshot);
2722
2723 switch (thread_classification) {
2724 case tc_full_snapshot:
2725 some_thread_ran = TRUE;
2726 break;
2727 case tc_delta_snapshot:
2728 num_delta_thread_snapshots++;
2729 break;
2730 }
2731 }
2732 }
2733
2734 if (collect_delta_stackshot) {
2735 proc_starttime_kdp(get_bsdtask_info(task), NULL, NULL, &task_start_abstime);
2736 }
2737
2738 /* Next record any relevant UUID info and store the task snapshot */
2739 if (task_in_transition ||
2740 !collect_delta_stackshot ||
2741 (task_start_abstime == 0) ||
2742 (task_start_abstime > stack_snapshot_delta_since_timestamp) ||
2743 some_thread_ran) {
2744 /*
2745 * Collect full task information in these scenarios:
2746 *
2747 * 1) a full stackshot or the task is in transition
2748 * 2) a delta stackshot where the task started after the previous full stackshot
2749 * 3) a delta stackshot where any thread from the task has run since the previous full stackshot
2750 *
2751 * because the task may have exec'ed, changing its name, architecture, load info, etc
2752 */
2753
2754 kcd_exit_on_error(kcdata_record_shared_cache_info(stackshot_kcdata_p, task, &task_snap_ss_flags));
2755 kcd_exit_on_error(kcdata_record_uuid_info(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, &task_snap_ss_flags));
2756 #if STACKSHOT_COLLECTS_LATENCY_INFO
2757 if (!task_in_transition) {
2758 kcd_exit_on_error(kcdata_record_task_snapshot(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, task_snap_ss_flags, &latency_info));
2759 } else {
2760 kcd_exit_on_error(kcdata_record_transitioning_task_snapshot(stackshot_kcdata_p, task, task_snap_ss_flags, transition_type));
2761 }
2762 #else
2763 if (!task_in_transition) {
2764 kcd_exit_on_error(kcdata_record_task_snapshot(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, task_snap_ss_flags));
2765 } else {
2766 kcd_exit_on_error(kcdata_record_transitioning_task_snapshot(stackshot_kcdata_p, task, task_snap_ss_flags, transition_type));
2767 }
2768 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2769 } else {
2770 kcd_exit_on_error(kcdata_record_task_delta_snapshot(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, task_snap_ss_flags));
2771 }
2772
2773 #if STACKSHOT_COLLECTS_LATENCY_INFO
2774 latency_info.misc_latency = mach_absolute_time();
2775 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2776
2777 struct thread_delta_snapshot_v3 * delta_snapshots = NULL;
2778 int current_delta_snapshot_index = 0;
2779 if (num_delta_thread_snapshots > 0) {
2780 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_DELTA_SNAPSHOT,
2781 sizeof(struct thread_delta_snapshot_v3),
2782 num_delta_thread_snapshots, &out_addr));
2783 delta_snapshots = (struct thread_delta_snapshot_v3 *)out_addr;
2784 }
2785
2786
2787 #if STACKSHOT_COLLECTS_LATENCY_INFO
2788 latency_info.task_thread_count_loop_latency = mach_absolute_time();
2789 #endif
2790 /*
2791 * Iterate over the task threads to save thread snapshots and determine
2792 * how much space we need for waitinfo and turnstile info
2793 */
2794 thread_t thread = THREAD_NULL;
2795 queue_iterate(&task->threads, thread, thread_t, task_threads)
2796 {
2797 if ((thread == NULL) || !_stackshot_validate_kva((vm_offset_t)thread, sizeof(struct thread))) {
2798 error = KERN_FAILURE;
2799 goto error_exit;
2800 }
2801
2802 uint64_t thread_uniqueid;
2803 if (active_kthreads_only_p && thread->kernel_stack == 0) {
2804 continue;
2805 }
2806 thread_uniqueid = thread_tid(thread);
2807
2808 boolean_t thread_on_core;
2809 enum thread_classification thread_classification = classify_thread(thread, &thread_on_core, collect_delta_stackshot);
2810
2811 switch (thread_classification) {
2812 case tc_full_snapshot:
2813 /* add thread marker */
2814 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_BEGIN,
2815 STACKSHOT_KCCONTAINER_THREAD, thread_uniqueid));
2816
2817 /* thread snapshot can be large, including strings, avoid overflowing the stack. */
2818 kcdata_compression_window_open(stackshot_kcdata_p);
2819
2820 kcd_exit_on_error(kcdata_record_thread_snapshot(stackshot_kcdata_p, thread, task, ctx->trace_flags, have_pmap, thread_on_core));
2821
2822 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
2823
2824 /* mark end of thread snapshot data */
2825 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_END,
2826 STACKSHOT_KCCONTAINER_THREAD, thread_uniqueid));
2827 break;
2828 case tc_delta_snapshot:
2829 kcd_exit_on_error(kcdata_record_thread_delta_snapshot(&delta_snapshots[current_delta_snapshot_index++], thread, thread_on_core));
2830 break;
2831 }
2832
2833 /*
2834 * We want to report owner information regardless of whether the thread
2835 * has changed since the last delta, whether this is a full stackshot,
2836 * or whether the thread is nonrunnable
2837 */
2838 if (save_owner_info) {
2839 if (stackshot_thread_has_valid_waitinfo(thread)) {
2840 num_waitinfo_threads++;
2841 }
2842
2843 if (stackshot_thread_has_valid_turnstileinfo(thread)) {
2844 num_turnstileinfo_threads++;
2845 }
2846 }
2847 }
2848 #if STACKSHOT_COLLECTS_LATENCY_INFO
2849 latency_info.task_thread_count_loop_latency = mach_absolute_time() - latency_info.task_thread_count_loop_latency;
2850 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2851
2852
2853 thread_waitinfo_v2_t *thread_waitinfo = NULL;
2854 thread_turnstileinfo_v2_t *thread_turnstileinfo = NULL;
2855 int current_waitinfo_index = 0;
2856 int current_turnstileinfo_index = 0;
2857 /* allocate space for the wait and turnstile info */
2858 if (num_waitinfo_threads > 0 || num_turnstileinfo_threads > 0) {
2859 /* thread waitinfo and turnstileinfo can be quite large, avoid overflowing the stack */
2860 kcdata_compression_window_open(stackshot_kcdata_p);
2861
2862 if (num_waitinfo_threads > 0) {
2863 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_WAITINFO,
2864 sizeof(thread_waitinfo_v2_t), num_waitinfo_threads, &out_addr));
2865 thread_waitinfo = (thread_waitinfo_v2_t *)out_addr;
2866 }
2867
2868 if (num_turnstileinfo_threads > 0) {
2869 /* get space for the turnstile info */
2870 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_TURNSTILEINFO,
2871 sizeof(thread_turnstileinfo_v2_t), num_turnstileinfo_threads, &out_addr));
2872 thread_turnstileinfo = (thread_turnstileinfo_v2_t *)out_addr;
2873 }
2874
2875 stackshot_plh_resetgen(); // so we know which portlabel_ids are referenced
2876 }
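/*
 * Added note: the compression window opened above intentionally stays open
 * while the loop below fills in the waitinfo/turnstileinfo arrays; it is
 * closed further down once both arrays have been populated.
 */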
2877
2878 #if STACKSHOT_COLLECTS_LATENCY_INFO
2879 latency_info.misc_latency = mach_absolute_time() - latency_info.misc_latency;
2880 latency_info.task_thread_data_loop_latency = mach_absolute_time();
2881 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2882
2883 /* Iterate over the task's threads to save the wait and turnstile info */
2884 queue_iterate(&task->threads, thread, thread_t, task_threads)
2885 {
2886 uint64_t thread_uniqueid;
2887
2888 if (active_kthreads_only_p && thread->kernel_stack == 0) {
2889 continue;
2890 }
2891
2892 thread_uniqueid = thread_tid(thread);
2893
2894 /* If we want owner info, we should capture it regardless of its classification */
2895 if (save_owner_info) {
2896 if (stackshot_thread_has_valid_waitinfo(thread)) {
2897 stackshot_thread_wait_owner_info(
2898 thread,
2899 &thread_waitinfo[current_waitinfo_index++]);
2900 }
2901
2902 if (stackshot_thread_has_valid_turnstileinfo(thread)) {
2903 stackshot_thread_turnstileinfo(
2904 thread,
2905 &thread_turnstileinfo[current_turnstileinfo_index++]);
2906 }
2907 }
2908 }
2909
2910 #if STACKSHOT_COLLECTS_LATENCY_INFO
2911 latency_info.task_thread_data_loop_latency = mach_absolute_time() - latency_info.task_thread_data_loop_latency;
2912 latency_info.misc2_latency = mach_absolute_time();
2913 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2914
2915 #if DEBUG || DEVELOPMENT
2916 if (current_delta_snapshot_index != num_delta_thread_snapshots) {
2917 panic("delta thread snapshot count mismatch while capturing snapshots for task %p. expected %d, found %d", task,
2918 num_delta_thread_snapshots, current_delta_snapshot_index);
2919 }
2920 if (current_waitinfo_index != num_waitinfo_threads) {
2921 panic("thread wait info count mismatch while capturing snapshots for task %p. expected %d, found %d", task,
2922 num_waitinfo_threads, current_waitinfo_index);
2923 }
2924 #endif
2925
2926 if (num_waitinfo_threads > 0 || num_turnstileinfo_threads > 0) {
2927 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
2928 // now, record the portlabel hashes.
2929 kcd_exit_on_error(kdp_stackshot_plh_record());
2930 }
2931
2932 #if IMPORTANCE_INHERITANCE
2933 if (save_donating_pids_p) {
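/*
 * Added note: make sure there is room for TASK_IMP_WALK_LIMIT pids at the
 * end of the kcdata buffer, since task_importance_list_pids() writes the
 * pids directly at kcd_end_address() before the array entry is reserved
 * below.
 */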
2934 kcd_exit_on_error(
2935 ((((mach_vm_address_t)kcd_end_address(stackshot_kcdata_p) + (TASK_IMP_WALK_LIMIT * sizeof(int32_t))) <
2936 (mach_vm_address_t)kcd_max_address(stackshot_kcdata_p))
2937 ? KERN_SUCCESS
2938 : KERN_RESOURCE_SHORTAGE));
2939 saved_count = task_importance_list_pids(task, TASK_IMP_LIST_DONATING_PIDS,
2940 (void *)kcd_end_address(stackshot_kcdata_p), TASK_IMP_WALK_LIMIT);
2941 if (saved_count > 0) {
2942 /* Variable size array - better not have it on the stack. */
2943 kcdata_compression_window_open(stackshot_kcdata_p);
2944 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_DONATING_PIDS,
2945 sizeof(int32_t), saved_count, &out_addr));
2946 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
2947 }
2948 }
2949 #endif
2950
2951 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
2952 if (!panic_stackshot) {
2953 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - task_begin_cpu_cycle_count),
2954 "task_cpu_cycle_count"));
2955 }
2956 #endif
2957
2958 #if STACKSHOT_COLLECTS_LATENCY_INFO
2959 latency_info.misc2_latency = mach_absolute_time() - latency_info.misc2_latency;
2960 if (collect_latency_info) {
2961 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_LATENCY_INFO_TASK, sizeof(latency_info), &latency_info));
2962 }
2963 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2964
2965 /* mark end of task snapshot data */
2966 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_END, container_type,
2967 task_uniqueid));
2968 }
2969
2970
2971 error_exit:
2972 return error;
2973 }
2974
2975 /* Record global shared regions */
2976 static kern_return_t
2977 kdp_stackshot_shared_regions(uint64_t trace_flags)
2978 {
2979 kern_return_t error = KERN_SUCCESS;
2980
2981 boolean_t collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
2982 extern queue_head_t vm_shared_region_queue;
2983 vm_shared_region_t sr;
2984
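/*
 * Added note: walk every shared region currently known to the VM layer and
 * emit one shared-cache container (UUID, slide, base addresses) for each
 * region that can be safely read.
 */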
2986 queue_iterate(&vm_shared_region_queue,
2987 sr,
2988 vm_shared_region_t,
2989 sr_q) {
2990 struct dyld_shared_cache_loadinfo_v2 scinfo = {0};
2991 if (!_stackshot_validate_kva((vm_offset_t)sr, sizeof(*sr))) {
2992 break;
2993 }
2994 if (collect_delta_stackshot && sr->sr_install_time < stack_snapshot_delta_since_timestamp) {
2995 continue; // only include new shared caches in delta stackshots
2996 }
2997 uint32_t sharedCacheFlags = ((sr == primary_system_shared_region) ? kSharedCacheSystemPrimary : 0) |
2998 (sr->sr_driverkit ? kSharedCacheDriverkit : 0);
2999 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_BEGIN,
3000 STACKSHOT_KCCONTAINER_SHAREDCACHE, sr->sr_id));
3001 kdp_memcpy(scinfo.sharedCacheUUID, sr->sr_uuid, sizeof(sr->sr_uuid));
3002 scinfo.sharedCacheSlide = sr->sr_slide;
3003 scinfo.sharedCacheUnreliableSlidBaseAddress = sr->sr_base_address + sr->sr_first_mapping;
3004 scinfo.sharedCacheSlidFirstMapping = sr->sr_base_address + sr->sr_first_mapping;
3005 scinfo.sharedCacheID = sr->sr_id;
3006 scinfo.sharedCacheFlags = sharedCacheFlags;
3007
3008 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_SHAREDCACHE_INFO,
3009 sizeof(scinfo), &scinfo));
3010
3011 if ((trace_flags & STACKSHOT_COLLECT_SHAREDCACHE_LAYOUT) && sr->sr_images != NULL &&
3012 _stackshot_validate_kva((vm_offset_t)sr->sr_images, sr->sr_images_count * sizeof(struct dyld_uuid_info_64))) {
3013 assert(sr->sr_images_count != 0);
3014 kcd_exit_on_error(kcdata_push_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_SYS_SHAREDCACHE_LAYOUT, sizeof(struct dyld_uuid_info_64), sr->sr_images_count, sr->sr_images));
3015 }
3016 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_END,
3017 STACKSHOT_KCCONTAINER_SHAREDCACHE, sr->sr_id));
3018 }
3019
3020 /*
3021 * For backwards compatibility; this will eventually be removed.
3022 * Another copy of the Primary System Shared Region, for older readers.
3023 */
3024 sr = primary_system_shared_region;
3025 /* record system level shared cache load info (if available) */
3026 if (!collect_delta_stackshot && sr &&
3027 _stackshot_validate_kva((vm_offset_t)sr, sizeof(struct vm_shared_region))) {
3028 struct dyld_shared_cache_loadinfo scinfo = {0};
3029
3030 /*
3031 * Historically, this data was in a dyld_uuid_info_64 structure, but the
3032 * naming of both the structure and fields for this use isn't great. The
3033 * dyld_shared_cache_loadinfo structure has better names, but the same
3034 * layout and content as the original.
3035 *
3036 * The imageSlidBaseAddress/sharedCacheUnreliableSlidBaseAddress field
3037 * has been used inconsistently for STACKSHOT_COLLECT_SHAREDCACHE_LAYOUT
3038 * entries; here, it's the slid base address, and we leave it that way
3039 * for backwards compatibility.
3040 */
3041 kdp_memcpy(scinfo.sharedCacheUUID, &sr->sr_uuid, sizeof(sr->sr_uuid));
3042 scinfo.sharedCacheSlide = sr->sr_slide;
3043 scinfo.sharedCacheUnreliableSlidBaseAddress = sr->sr_slide + sr->sr_base_address;
3044 scinfo.sharedCacheSlidFirstMapping = sr->sr_base_address + sr->sr_first_mapping;
3045
3046 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_SHAREDCACHE_LOADINFO,
3047 sizeof(scinfo), &scinfo));
3048
3049 if (trace_flags & STACKSHOT_COLLECT_SHAREDCACHE_LAYOUT) {
3050 /*
3051 * Include a map of the system shared cache layout if it has been populated
3052 * (which is only when the system is using a custom shared cache).
3053 */
3054 if (sr->sr_images && _stackshot_validate_kva((vm_offset_t)sr->sr_images,
3055 (sr->sr_images_count * sizeof(struct dyld_uuid_info_64)))) {
3056 assert(sr->sr_images_count != 0);
3057 kcd_exit_on_error(kcdata_push_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_SYS_SHAREDCACHE_LAYOUT, sizeof(struct dyld_uuid_info_64), sr->sr_images_count, sr->sr_images));
3058 }
3059 }
3060 }
3061
3062 error_exit:
3063 return error;
3064 }
3065
3066 static kern_return_t
3067 kdp_stackshot_kcdata_format(int pid, uint64_t trace_flags, uint32_t * pBytesTraced, uint32_t * pBytesUncompressed)
3068 {
3069 kern_return_t error = KERN_SUCCESS;
3070 mach_vm_address_t out_addr = 0;
3071 uint64_t abs_time = 0, abs_time_end = 0;
3072 uint64_t system_state_flags = 0;
3073 task_t task = TASK_NULL;
3074 mach_timebase_info_data_t timebase = {0, 0};
3075 uint32_t length_to_copy = 0, tmp32 = 0;
3076 abs_time = mach_absolute_time();
3077 uint64_t last_task_start_time = 0;
3078
3079 #if STACKSHOT_COLLECTS_LATENCY_INFO
3080 struct stackshot_latency_collection latency_info;
3081 #endif
3082
3083 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
3084 uint64_t stackshot_begin_cpu_cycle_count = 0;
3085
3086 if (!panic_stackshot) {
3087 stackshot_begin_cpu_cycle_count = mt_cur_cpu_cycles();
3088 }
3089 #endif
3090
3091 #if STACKSHOT_COLLECTS_LATENCY_INFO
3092 collect_latency_info = trace_flags & STACKSHOT_DISABLE_LATENCY_INFO ? false : true;
3093 #endif
3094
3095 /* process the flags */
3096 bool collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
3097 bool use_fault_path = ((trace_flags & (STACKSHOT_ENABLE_UUID_FAULTING | STACKSHOT_ENABLE_BT_FAULTING)) != 0);
3098 stack_enable_faulting = (trace_flags & (STACKSHOT_ENABLE_BT_FAULTING));
3099
3100 /* Currently we only support returning explicit KEXT load info on fileset kernels */
3101 kc_format_t primary_kc_type = KCFormatUnknown;
3102 if (PE_get_primary_kc_format(&primary_kc_type) && (primary_kc_type != KCFormatFileset)) {
3103 trace_flags &= ~(STACKSHOT_SAVE_KEXT_LOADINFO);
3104 }
3105
3106 struct stackshot_context ctx = {};
3107 ctx.trace_flags = trace_flags;
3108 ctx.pid = pid;
3109 ctx.include_drivers = (pid == 0 && (trace_flags & STACKSHOT_INCLUDE_DRIVER_THREADS_IN_KERNEL) != 0);
3110
3111 if (use_fault_path) {
3112 fault_stats.sfs_pages_faulted_in = 0;
3113 fault_stats.sfs_time_spent_faulting = 0;
3114 fault_stats.sfs_stopped_faulting = (uint8_t) FALSE;
3115 }
3116
3117 if (sizeof(void *) == 8) {
3118 system_state_flags |= kKernel64_p;
3119 }
3120
3121 if (stackshot_kcdata_p == NULL || pBytesTraced == NULL) {
3122 error = KERN_INVALID_ARGUMENT;
3123 goto error_exit;
3124 }
3125
3126 _stackshot_validation_reset();
3127 stackshot_plh_setup(stackshot_kcdata_p); /* set up port label hash */
3128
3129 /* set up mach_absolute_time and timebase info -- copied out in some cases, and needed to convert since_timestamp to seconds for proc start time */
3130 clock_timebase_info(&timebase);
3131
3132 /* begin saving data into the buffer */
3133 *pBytesTraced = 0;
3134 if (pBytesUncompressed) {
3135 *pBytesUncompressed = 0;
3136 }
3137 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, trace_flags, "stackshot_in_flags"));
3138 kcd_exit_on_error(kcdata_add_uint32_with_description(stackshot_kcdata_p, (uint32_t)pid, "stackshot_in_pid"));
3139 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, system_state_flags, "system_state_flags"));
3140 if (trace_flags & STACKSHOT_PAGE_TABLES) {
3141 kcd_exit_on_error(kcdata_add_uint32_with_description(stackshot_kcdata_p, stack_snapshot_pagetable_mask, "stackshot_pagetable_mask"));
3142 }
3143 if (stackshot_initial_estimate != 0) {
3144 kcd_exit_on_error(kcdata_add_uint32_with_description(stackshot_kcdata_p, stackshot_initial_estimate, "stackshot_size_estimate"));
3145 kcd_exit_on_error(kcdata_add_uint32_with_description(stackshot_kcdata_p, stackshot_initial_estimate_adj, "stackshot_size_estimate_adj"));
3146 }
3147
3148 #if STACKSHOT_COLLECTS_LATENCY_INFO
3149 latency_info.setup_latency = mach_absolute_time();
3150 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
3151
3152 #if CONFIG_JETSAM
3153 tmp32 = memorystatus_get_pressure_status_kdp();
3154 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_JETSAM_LEVEL, sizeof(uint32_t), &tmp32));
3155 #endif
3156
3157 if (!collect_delta_stackshot) {
3158 tmp32 = THREAD_POLICY_INTERNAL_STRUCT_VERSION;
3159 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_POLICY_VERSION, sizeof(uint32_t), &tmp32));
3160
3161 tmp32 = PAGE_SIZE;
3162 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_KERN_PAGE_SIZE, sizeof(uint32_t), &tmp32));
3163
3164 /* save boot-args and osversion string */
3165 length_to_copy = MIN((uint32_t)(strlen(version) + 1), OSVERSIZE);
3166 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_OSVERSION, length_to_copy, (const void *)version));
3167
3168
3169 length_to_copy = MIN((uint32_t)(strlen(PE_boot_args()) + 1), BOOT_LINE_LENGTH);
3170 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_BOOTARGS, length_to_copy, PE_boot_args()));
3171
3172 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, KCDATA_TYPE_TIMEBASE, sizeof(timebase), &timebase));
3173 } else {
3174 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_DELTA_SINCE_TIMESTAMP, sizeof(uint64_t), &stack_snapshot_delta_since_timestamp));
3175 }
3176
3177 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, KCDATA_TYPE_MACH_ABSOLUTE_TIME, sizeof(uint64_t), &abs_time));
3178
3179 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, KCDATA_TYPE_USECS_SINCE_EPOCH, sizeof(uint64_t), &stackshot_microsecs));
3180
3181 kcd_exit_on_error(kdp_stackshot_shared_regions(trace_flags));
3182
3183 /* Add requested information first */
3184 if (trace_flags & STACKSHOT_GET_GLOBAL_MEM_STATS) {
3185 struct mem_and_io_snapshot mais = {0};
3186 kdp_mem_and_io_snapshot(&mais);
3187 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_GLOBAL_MEM_STATS, sizeof(mais), &mais));
3188 }
3189
3190 #if CONFIG_THREAD_GROUPS
3191 struct thread_group_snapshot_v3 *thread_groups = NULL;
3192 int num_thread_groups = 0;
3193
3194 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
3195 uint64_t thread_group_begin_cpu_cycle_count = 0;
3196
3197 if (!panic_stackshot && (trace_flags & STACKSHOT_THREAD_GROUP)) {
3198 thread_group_begin_cpu_cycle_count = mt_cur_cpu_cycles();
3199 }
3200 #endif
3201
3202
3203 /* Iterate over thread group names */
3204 if (trace_flags & STACKSHOT_THREAD_GROUP) {
3205 /* Variable size array - better not have it on the stack. */
3206 kcdata_compression_window_open(stackshot_kcdata_p);
3207
3208 if (thread_group_iterate_stackshot(stackshot_thread_group_count, &num_thread_groups) != KERN_SUCCESS) {
3209 trace_flags &= ~(STACKSHOT_THREAD_GROUP);
3210 }
3211
3212 if (num_thread_groups > 0) {
3213 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_GROUP_SNAPSHOT, sizeof(struct thread_group_snapshot_v3), num_thread_groups, &out_addr));
3214 thread_groups = (struct thread_group_snapshot_v3 *)out_addr;
3215 }
3216
3217 if (thread_group_iterate_stackshot(stackshot_thread_group_snapshot, thread_groups) != KERN_SUCCESS) {
3218 error = KERN_FAILURE;
3219 goto error_exit;
3220 }
3221
3222 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
3223 }
3224
3225 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
3226 if (!panic_stackshot && (thread_group_begin_cpu_cycle_count != 0)) {
3227 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - thread_group_begin_cpu_cycle_count),
3228 "thread_groups_cpu_cycle_count"));
3229 }
3230 #endif
3231 #else
3232 trace_flags &= ~(STACKSHOT_THREAD_GROUP);
3233 #endif /* CONFIG_THREAD_GROUPS */
3234
3235
3236 #if STACKSHOT_COLLECTS_LATENCY_INFO
3237 latency_info.setup_latency = mach_absolute_time() - latency_info.setup_latency;
3238 latency_info.total_task_iteration_latency = mach_absolute_time();
3239 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
3240
3241 /* Iterate over tasks */
3242 queue_iterate(&tasks, task, task_t, tasks)
3243 {
3244 if (collect_delta_stackshot) {
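/*
 * Added note: track the most recent task start time seen; it is used after
 * this loop to decide whether jetsam coalition data needs to be re-collected
 * for this delta stackshot.
 */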
3245 uint64_t abstime;
3246 proc_starttime_kdp(get_bsdtask_info(task), NULL, NULL, &abstime);
3247
3248 if (abstime > last_task_start_time) {
3249 last_task_start_time = abstime;
3250 }
3251 }
3252
3253 error = kdp_stackshot_record_task(&ctx, task);
3254 if (error) {
3255 goto error_exit;
3256 }
3257 }
3258
3259
3260 #if STACKSHOT_COLLECTS_LATENCY_INFO
3261 latency_info.total_task_iteration_latency = mach_absolute_time() - latency_info.total_task_iteration_latency;
3262 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
3263
3264 #if CONFIG_COALITIONS
3265 /* Don't collect jetsam coalition snapshots in delta stackshots - these don't change */
3266 if (!collect_delta_stackshot || (last_task_start_time > stack_snapshot_delta_since_timestamp)) {
3267 int num_coalitions = 0;
3268 struct jetsam_coalition_snapshot *coalitions = NULL;
3269
3270 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
3271 uint64_t coalition_begin_cpu_cycle_count = 0;
3272
3273 if (!panic_stackshot && (trace_flags & STACKSHOT_SAVE_JETSAM_COALITIONS)) {
3274 coalition_begin_cpu_cycle_count = mt_cur_cpu_cycles();
3275 }
3276 #endif /* SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI */
3277
3278 /* Iterate over coalitions */
3279 if (trace_flags & STACKSHOT_SAVE_JETSAM_COALITIONS) {
3280 if (coalition_iterate_stackshot(stackshot_coalition_jetsam_count, &num_coalitions, COALITION_TYPE_JETSAM) != KERN_SUCCESS) {
3281 trace_flags &= ~(STACKSHOT_SAVE_JETSAM_COALITIONS);
3282 }
3283 }
3284 if (trace_flags & STACKSHOT_SAVE_JETSAM_COALITIONS) {
3285 if (num_coalitions > 0) {
3286 /* Variable size array - better not have it on the stack. */
3287 kcdata_compression_window_open(stackshot_kcdata_p);
3288 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_JETSAM_COALITION_SNAPSHOT, sizeof(struct jetsam_coalition_snapshot), num_coalitions, &out_addr));
3289 coalitions = (struct jetsam_coalition_snapshot*)out_addr;
3290
3291 if (coalition_iterate_stackshot(stackshot_coalition_jetsam_snapshot, coalitions, COALITION_TYPE_JETSAM) != KERN_SUCCESS) {
3292 error = KERN_FAILURE;
3293 goto error_exit;
3294 }
3295
3296 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
3297 }
3298 }
3299 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
3300 if (!panic_stackshot && (coalition_begin_cpu_cycle_count != 0)) {
3301 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - coalition_begin_cpu_cycle_count),
3302 "coalitions_cpu_cycle_count"));
3303 }
3304 #endif /* SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI */
3305 }
3306 #else
3307 trace_flags &= ~(STACKSHOT_SAVE_JETSAM_COALITIONS);
3308 #endif /* CONFIG_COALITIONS */
3309
3310 #if STACKSHOT_COLLECTS_LATENCY_INFO
3311 latency_info.total_terminated_task_iteration_latency = mach_absolute_time();
3312 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
3313
3314 /*
3315 * Iterate over the tasks in the terminated tasks list. We only inspect
3316 * tasks that have a valid bsd_info pointer. The check for a task in
3317 * transition (e.g. past P_LPEXIT during proc_exit()) is now done inside
3318 * kdp_stackshot_record_task(), and then a safer and minimal
3319 * transitioning_task_snapshot struct is collected via
3320 * kcdata_record_transitioning_task_snapshot()
3321 */
3322 queue_iterate(&terminated_tasks, task, task_t, tasks)
3323 {
3324 error = kdp_stackshot_record_task(&ctx, task);
3325 if (error) {
3326 goto error_exit;
3327 }
3328 }
3329 #if DEVELOPMENT || DEBUG
3330 kcd_exit_on_error(kdp_stackshot_plh_stats());
3331 #endif /* DEVELOPMENT || DEBUG */
3332
3333 #if STACKSHOT_COLLECTS_LATENCY_INFO
3334 latency_info.total_terminated_task_iteration_latency = mach_absolute_time() - latency_info.total_terminated_task_iteration_latency;
3335 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
3336
3337 if (use_fault_path) {
3338 kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_STACKSHOT_FAULT_STATS,
3339 sizeof(struct stackshot_fault_stats), &fault_stats);
3340 }
3341
3342 #if STACKSHOT_COLLECTS_LATENCY_INFO
3343 if (collect_latency_info) {
3344 latency_info.latency_version = 1;
3345 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_LATENCY_INFO, sizeof(latency_info), &latency_info));
3346 }
3347 #endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
3348
3349 /* update timestamp of the stackshot */
3350 abs_time_end = mach_absolute_time();
3351 struct stackshot_duration_v2 stackshot_duration = {
3352 .stackshot_duration = (abs_time_end - abs_time),
3353 .stackshot_duration_outer = 0,
3354 .stackshot_duration_prior = stackshot_duration_prior_abs,
3355 };
3356
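/*
 * Added note: when not compressing, keep a pointer to the
 * stackshot_duration_outer field inside the buffer so that the outer
 * duration (not yet known here) can be filled in later; when compressing,
 * the record is pushed immediately and no such pointer can be kept, so it is
 * left NULL.
 */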
3357 if ((trace_flags & STACKSHOT_DO_COMPRESS) == 0) {
3358 kcd_exit_on_error(kcdata_get_memory_addr(stackshot_kcdata_p, STACKSHOT_KCTYPE_STACKSHOT_DURATION,
3359 sizeof(struct stackshot_duration_v2), &out_addr));
3360 struct stackshot_duration_v2 *duration_p = (void *) out_addr;
3361 kdp_memcpy(duration_p, &stackshot_duration, sizeof(*duration_p));
3362 stackshot_duration_outer = (unaligned_u64 *)&duration_p->stackshot_duration_outer;
3363 } else {
3364 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_STACKSHOT_DURATION, sizeof(stackshot_duration), &stackshot_duration));
3365 stackshot_duration_outer = NULL;
3366 }
3367
3368 #if SCHED_HYGIENE_DEBUG && CONFIG_PERVASIVE_CPI
3369 if (!panic_stackshot) {
3370 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - stackshot_begin_cpu_cycle_count),
3371 "stackshot_total_cpu_cycle_cnt"));
3372 }
3373 #endif
3374
3375 kcd_finalize_compression(stackshot_kcdata_p);
3376 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, trace_flags, "stackshot_out_flags"));
3377
3378 kcd_exit_on_error(kcdata_write_buffer_end(stackshot_kcdata_p));
3379
3380 /* === END of populating stackshot data === */
3381
3382 *pBytesTraced = (uint32_t) kcdata_memory_get_used_bytes(stackshot_kcdata_p);
3383 *pBytesUncompressed = (uint32_t) kcdata_memory_get_uncompressed_bytes(stackshot_kcdata_p);
3384
3385 error_exit:;
3386
3387 #if SCHED_HYGIENE_DEBUG
3388 bool disable_interrupts_masked_check = kern_feature_override(
3389 KF_INTERRUPT_MASKED_DEBUG_STACKSHOT_OVRD) ||
3390 (trace_flags & STACKSHOT_DO_COMPRESS) != 0;
3391
3392 #if STACKSHOT_INTERRUPTS_MASKED_CHECK_DISABLED
3393 disable_interrupts_masked_check = true;
3394 #endif /* STACKSHOT_INTERRUPTS_MASKED_CHECK_DISABLED */
3395
3396 if (disable_interrupts_masked_check) {
3397 ml_spin_debug_clear_self();
3398 }
3399
3400 if (!panic_stackshot && interrupt_masked_debug_mode) {
3401 /*
3402 * Try to catch instances where stackshot takes too long BEFORE returning from
3403 * the debugger
3404 */
3405 ml_handle_stackshot_interrupt_disabled_duration(current_thread());
3406 }
3407 #endif /* SCHED_HYGIENE_DEBUG */
3408 stackshot_plh_reset();
3409 stack_enable_faulting = FALSE;
3410
3411 return error;
3412 }
3413
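/*
 * Added note: helpers that read the BSD-level throttling counters for a
 * task; they return 0 when the task has no bsd_info (e.g. the kernel task).
 */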
3414 static uint64_t
3415 proc_was_throttled_from_task(task_t task)
3416 {
3417 uint64_t was_throttled = 0;
3418 void *bsd_info = get_bsdtask_info(task);
3419
3420 if (bsd_info) {
3421 was_throttled = proc_was_throttled(bsd_info);
3422 }
3423
3424 return was_throttled;
3425 }
3426
3427 static uint64_t
3428 proc_did_throttle_from_task(task_t task)
3429 {
3430 uint64_t did_throttle = 0;
3431 void *bsd_info = get_bsdtask_info(task);
3432
3433 if (bsd_info) {
3434 did_throttle = proc_did_throttle(bsd_info);
3435 }
3436
3437 return did_throttle;
3438 }
3439
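/*
 * Added note: capture a point-in-time summary of VM page counts, compressor
 * activity, and memory-pressure state for the STACKSHOT_GET_GLOBAL_MEM_STATS
 * payload.
 */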
3440 static void
3441 kdp_mem_and_io_snapshot(struct mem_and_io_snapshot *memio_snap)
3442 {
3443 unsigned int pages_reclaimed;
3444 unsigned int pages_wanted;
3445 kern_return_t kErr;
3446
3447 uint64_t compressions = 0;
3448 uint64_t decompressions = 0;
3449
3450 compressions = counter_load(&vm_statistics_compressions);
3451 decompressions = counter_load(&vm_statistics_decompressions);
3452
3453 memio_snap->snapshot_magic = STACKSHOT_MEM_AND_IO_SNAPSHOT_MAGIC;
3454 memio_snap->free_pages = vm_page_free_count;
3455 memio_snap->active_pages = vm_page_active_count;
3456 memio_snap->inactive_pages = vm_page_inactive_count;
3457 memio_snap->purgeable_pages = vm_page_purgeable_count;
3458 memio_snap->wired_pages = vm_page_wire_count;
3459 memio_snap->speculative_pages = vm_page_speculative_count;
3460 memio_snap->throttled_pages = vm_page_throttled_count;
3461 memio_snap->busy_buffer_count = count_busy_buffers();
3462 memio_snap->filebacked_pages = vm_page_pageable_external_count;
3463 memio_snap->compressions = (uint32_t)compressions;
3464 memio_snap->decompressions = (uint32_t)decompressions;
3465 memio_snap->compressor_size = VM_PAGE_COMPRESSOR_COUNT;
3466 kErr = mach_vm_pressure_monitor(FALSE, VM_PRESSURE_TIME_WINDOW, &pages_reclaimed, &pages_wanted);
3467
3468 if (!kErr) {
3469 memio_snap->pages_wanted = (uint32_t)pages_wanted;
3470 memio_snap->pages_reclaimed = (uint32_t)pages_reclaimed;
3471 memio_snap->pages_wanted_reclaimed_valid = 1;
3472 } else {
3473 memio_snap->pages_wanted = 0;
3474 memio_snap->pages_reclaimed = 0;
3475 memio_snap->pages_wanted_reclaimed_valid = 0;
3476 }
3477 }
3478
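/*
 * Added note: thin wrapper around kdp_find_phys() that also maintains the
 * stackshot fault statistics and stops faulting once the per-stackshot
 * fault-time budget (sfs_system_max_fault_time) has been exhausted.
 */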
3479 static vm_offset_t
3480 stackshot_find_phys(vm_map_t map, vm_offset_t target_addr, kdp_fault_flags_t fault_flags, uint32_t *kdp_fault_result_flags)
3481 {
3482 vm_offset_t result;
3483 struct kdp_fault_result fault_results = {0};
3484 if (fault_stats.sfs_stopped_faulting) {
3485 fault_flags &= ~KDP_FAULT_FLAGS_ENABLE_FAULTING;
3486 }
3487
3488 result = kdp_find_phys(map, target_addr, fault_flags, &fault_results);
3489
3490 if ((fault_results.flags & KDP_FAULT_RESULT_TRIED_FAULT) || (fault_results.flags & KDP_FAULT_RESULT_FAULTED_IN)) {
3491 fault_stats.sfs_time_spent_faulting += fault_results.time_spent_faulting;
3492
3493 if ((fault_stats.sfs_time_spent_faulting >= fault_stats.sfs_system_max_fault_time) && !panic_stackshot) {
3494 fault_stats.sfs_stopped_faulting = (uint8_t) TRUE;
3495 }
3496 }
3497
3498 if (fault_results.flags & KDP_FAULT_RESULT_FAULTED_IN) {
3499 fault_stats.sfs_pages_faulted_in++;
3500 }
3501
3502 if (kdp_fault_result_flags) {
3503 *kdp_fault_result_flags = fault_results.flags;
3504 }
3505
3506 return result;
3507 }
3508
3509 /*
3510 * Wrappers around kdp_generic_copyin, kdp_generic_copyin_word, kdp_generic_copyin_string that use stackshot_find_phys
3511 * in order to:
3512 * 1. collect statistics on the number of pages faulted in
3513 * 2. stop faulting if the time spent faulting has exceeded the limit.
3514 */
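/*
 * Illustrative usage only (a hypothetical caller, not code from this file):
 *
 *     uint64_t word = 0;
 *     if (stackshot_copyin_word(task, addr, &word, stack_enable_faulting, NULL)) {
 *         // word now holds the user value read (and possibly faulted in) at addr
 *     }
 *
 * Every user copy is funneled through stackshot_find_phys() so the fault
 * statistics and fault-time budget above apply uniformly.
 */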
3515 static boolean_t
3516 stackshot_copyin(vm_map_t map, uint64_t uaddr, void *dest, size_t size, boolean_t try_fault, kdp_fault_result_flags_t *kdp_fault_result_flags)
3517 {
3518 kdp_fault_flags_t fault_flags = KDP_FAULT_FLAGS_NONE;
3519 if (try_fault) {
3520 fault_flags |= KDP_FAULT_FLAGS_ENABLE_FAULTING;
3521 }
3522 return kdp_generic_copyin(map, uaddr, dest, size, fault_flags, (find_phys_fn_t)stackshot_find_phys, kdp_fault_result_flags) == KERN_SUCCESS;
3523 }
3524 static boolean_t
3525 stackshot_copyin_word(task_t task, uint64_t addr, uint64_t *result, boolean_t try_fault, kdp_fault_result_flags_t *kdp_fault_result_flags)
3526 {
3527 kdp_fault_flags_t fault_flags = KDP_FAULT_FLAGS_NONE;
3528 if (try_fault) {
3529 fault_flags |= KDP_FAULT_FLAGS_ENABLE_FAULTING;
3530 }
3531 return kdp_generic_copyin_word(task, addr, result, fault_flags, (find_phys_fn_t)stackshot_find_phys, kdp_fault_result_flags) == KERN_SUCCESS;
3532 }
3533 static int
3534 stackshot_copyin_string(task_t task, uint64_t addr, char *buf, int buf_sz, boolean_t try_fault, kdp_fault_result_flags_t *kdp_fault_result_flags)
3535 {
3536 kdp_fault_flags_t fault_flags = KDP_FAULT_FLAGS_NONE;
3537 if (try_fault) {
3538 fault_flags |= KDP_FAULT_FLAGS_ENABLE_FAULTING;
3539 }
3540 return kdp_generic_copyin_string(task, addr, buf, buf_sz, fault_flags, (find_phys_fn_t)stackshot_find_phys, kdp_fault_result_flags);
3541 }
3542
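/*
 * Added note: entry point that actually takes the stackshot (typically run
 * from the debugger/panic context). kdp_snapshot is raised to flag that a
 * stackshot is in progress, the kcdata buffer is formatted, and on success
 * the descriptor is finalized before kdp_snapshot is dropped again.
 */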
3543 kern_return_t
3544 do_stackshot(void *context)
3545 {
3546 #pragma unused(context)
3547 kdp_snapshot++;
3548
3549 stack_snapshot_ret = kdp_stackshot_kcdata_format(stack_snapshot_pid,
3550 stack_snapshot_flags,
3551 &stack_snapshot_bytes_traced,
3552 &stack_snapshot_bytes_uncompressed);
3553
3554 if (stack_snapshot_ret == KERN_SUCCESS) {
3555 /* release and zero any kcdata_end_alloc()s that were done */
3556 kcdata_finish(stackshot_kcdata_p);
3557 }
3558
3559 kdp_snapshot--;
3560 return stack_snapshot_ret;
3561 }
3562
3563 boolean_t
3564 stackshot_thread_is_idle_worker_unsafe(thread_t thread)
3565 {
3566 /* When the pthread kext puts a worker thread to sleep, it will
3567 * set kThreadWaitParkedWorkQueue in the block_hint of the thread
3568 * struct. See parkit() in kern/kern_support.c in libpthread.
3569 */
3570 return (thread->state & TH_WAIT) &&
3571 (thread->block_hint == kThreadWaitParkedWorkQueue);
3572 }
3573
3574 #if CONFIG_COALITIONS
3575 static void
3576 stackshot_coalition_jetsam_count(void *arg, int i, coalition_t coal)
3577 {
3578 #pragma unused(i, coal)
3579 unsigned int *coalition_count = (unsigned int*)arg;
3580 (*coalition_count)++;
3581 }
3582
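/*
 * Added note: per-coalition callback used with coalition_iterate_stackshot();
 * fills in one jetsam_coalition_snapshot entry (id, flags, thread group,
 * leader) in the array allocated by the caller.
 */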
3583 static void
3584 stackshot_coalition_jetsam_snapshot(void *arg, int i, coalition_t coal)
3585 {
3586 if (coalition_type(coal) != COALITION_TYPE_JETSAM) {
3587 return;
3588 }
3589
3590 struct jetsam_coalition_snapshot *coalitions = (struct jetsam_coalition_snapshot*)arg;
3591 struct jetsam_coalition_snapshot *jcs = &coalitions[i];
3592 task_t leader = TASK_NULL;
3593 jcs->jcs_id = coalition_id(coal);
3594 jcs->jcs_flags = 0;
3595 jcs->jcs_thread_group = 0;
3596
3597 if (coalition_term_requested(coal)) {
3598 jcs->jcs_flags |= kCoalitionTermRequested;
3599 }
3600 if (coalition_is_terminated(coal)) {
3601 jcs->jcs_flags |= kCoalitionTerminated;
3602 }
3603 if (coalition_is_reaped(coal)) {
3604 jcs->jcs_flags |= kCoalitionReaped;
3605 }
3606 if (coalition_is_privileged(coal)) {
3607 jcs->jcs_flags |= kCoalitionPrivileged;
3608 }
3609
3610 #if CONFIG_THREAD_GROUPS
3611 struct thread_group *thread_group = kdp_coalition_get_thread_group(coal);
3612 if (thread_group) {
3613 jcs->jcs_thread_group = thread_group_get_id(thread_group);
3614 }
3615 #endif /* CONFIG_THREAD_GROUPS */
3616
3617 leader = kdp_coalition_get_leader(coal);
3618 if (leader) {
3619 jcs->jcs_leader_task_uniqueid = get_task_uniqueid(leader);
3620 } else {
3621 jcs->jcs_leader_task_uniqueid = 0;
3622 }
3623 }
3624 #endif /* CONFIG_COALITIONS */
3625
3626 #if CONFIG_THREAD_GROUPS
3627 static void
3628 stackshot_thread_group_count(void *arg, int i, struct thread_group *tg)
3629 {
3630 #pragma unused(i, tg)
3631 unsigned int *n = (unsigned int*)arg;
3632 (*n)++;
3633 }
3634
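/*
 * Added note: per-thread-group callback; the group name may be longer than
 * tgs_name, so it is copied in two pieces (tgs_name and tgs_name_cont). The
 * static_assert below ensures the second copy still starts within the
 * THREAD_GROUP_MAXNAME-sized source buffer.
 */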
3635 static void
3636 stackshot_thread_group_snapshot(void *arg, int i, struct thread_group *tg)
3637 {
3638 struct thread_group_snapshot_v3 *thread_groups = arg;
3639 struct thread_group_snapshot_v3 *tgs = &thread_groups[i];
3640 const char *name = thread_group_get_name(tg);
3641 uint32_t flags = thread_group_get_flags(tg);
3642 tgs->tgs_id = thread_group_get_id(tg);
3643 static_assert(THREAD_GROUP_MAXNAME > sizeof(tgs->tgs_name));
3644 kdp_memcpy(tgs->tgs_name, name, sizeof(tgs->tgs_name));
3645 kdp_memcpy(tgs->tgs_name_cont, name + sizeof(tgs->tgs_name),
3646 sizeof(tgs->tgs_name_cont));
3647 tgs->tgs_flags =
3648 ((flags & THREAD_GROUP_FLAGS_EFFICIENT) ? kThreadGroupEfficient : 0) |
3649 ((flags & THREAD_GROUP_FLAGS_APPLICATION) ? kThreadGroupApplication : 0) |
3650 ((flags & THREAD_GROUP_FLAGS_CRITICAL) ? kThreadGroupCritical : 0) |
3651 ((flags & THREAD_GROUP_FLAGS_BEST_EFFORT) ? kThreadGroupBestEffort : 0) |
3652 ((flags & THREAD_GROUP_FLAGS_UI_APP) ? kThreadGroupUIApplication : 0) |
3653 ((flags & THREAD_GROUP_FLAGS_MANAGED) ? kThreadGroupManaged : 0) |
3654 ((flags & THREAD_GROUP_FLAGS_STRICT_TIMERS) ? kThreadGroupStrictTimers : 0) |
3655 0;
3656 }
3657 #endif /* CONFIG_THREAD_GROUPS */
3658
3659 /* Determine if a thread has waitinfo that stackshot can provide */
3660 static int
3661 stackshot_thread_has_valid_waitinfo(thread_t thread)
3662 {
3663 if (!(thread->state & TH_WAIT)) {
3664 return 0;
3665 }
3666
3667 switch (thread->block_hint) {
3668 // If set to None or is a parked work queue, ignore it
3669 case kThreadWaitParkedWorkQueue:
3670 case kThreadWaitNone:
3671 return 0;
3672 // There is a short window where the pthread kext removes a thread
3673 // from its ksyn wait queue before waking the thread up
3674 case kThreadWaitPThreadMutex:
3675 case kThreadWaitPThreadRWLockRead:
3676 case kThreadWaitPThreadRWLockWrite:
3677 case kThreadWaitPThreadCondVar:
3678 return kdp_pthread_get_thread_kwq(thread) != NULL;
3679 // All other cases are valid block hints if in a wait state
3680 default:
3681 return 1;
3682 }
3683 }
3684
3685 /* Determine if a thread has turnstileinfo that stackshot can provide */
3686 static int
3687 stackshot_thread_has_valid_turnstileinfo(thread_t thread)
3688 {
3689 struct turnstile *ts = thread_get_waiting_turnstile(thread);
3690
3691 return stackshot_thread_has_valid_waitinfo(thread) &&
3692 ts != TURNSTILE_NULL;
3693 }
3694
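/*
 * Added note: record turnstile information for a blocked thread, including a
 * port label id (via the port label hash) when the turnstile is for a send
 * or receive right.
 */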
3695 static void
3696 stackshot_thread_turnstileinfo(thread_t thread, thread_turnstileinfo_v2_t *tsinfo)
3697 {
3698 struct turnstile *ts;
3699 struct ipc_service_port_label *ispl = NULL;
3700
3701 /* acquire turnstile information and store it in the stackshot */
3702 ts = thread_get_waiting_turnstile(thread);
3703 tsinfo->waiter = thread_tid(thread);
3704 kdp_turnstile_fill_tsinfo(ts, tsinfo, &ispl);
3705 tsinfo->portlabel_id = stackshot_plh_lookup(ispl,
3706 (tsinfo->turnstile_flags & STACKSHOT_TURNSTILE_STATUS_SENDPORT) ? STACKSHOT_PLH_LOOKUP_SEND :
3707 (tsinfo->turnstile_flags & STACKSHOT_TURNSTILE_STATUS_RECEIVEPORT) ? STACKSHOT_PLH_LOOKUP_RECEIVE :
3708 STACKSHOT_PLH_LOOKUP_UNKNOWN);
3709 }
3710
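/*
 * Added note: fill in a thread_waitinfo record for a blocked thread by
 * dispatching on its block hint to the matching kdp_*_find_owner() helper;
 * most helpers only understand the v1 layout, hence the waitinfo_v1 alias
 * below.
 */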
3711 static void
3712 stackshot_thread_wait_owner_info(thread_t thread, thread_waitinfo_v2_t *waitinfo)
3713 {
3714 thread_waitinfo_t *waitinfo_v1 = (thread_waitinfo_t *)waitinfo;
3715 struct ipc_service_port_label *ispl = NULL;
3716
3717 waitinfo->waiter = thread_tid(thread);
3718 waitinfo->wait_type = thread->block_hint;
3719 waitinfo->wait_flags = 0;
3720
3721 switch (waitinfo->wait_type) {
3722 case kThreadWaitKernelMutex:
3723 kdp_lck_mtx_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo_v1);
3724 break;
3725 case kThreadWaitPortReceive:
3726 kdp_mqueue_recv_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo, &ispl);
3727 waitinfo->portlabel_id = stackshot_plh_lookup(ispl, STACKSHOT_PLH_LOOKUP_RECEIVE);
3728 break;
3729 case kThreadWaitPortSend:
3730 kdp_mqueue_send_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo, &ispl);
3731 waitinfo->portlabel_id = stackshot_plh_lookup(ispl, STACKSHOT_PLH_LOOKUP_SEND);
3732 break;
3733 case kThreadWaitSemaphore:
3734 kdp_sema_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo_v1);
3735 break;
3736 case kThreadWaitUserLock:
3737 kdp_ulock_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo_v1);
3738 break;
3739 case kThreadWaitKernelRWLockRead:
3740 case kThreadWaitKernelRWLockWrite:
3741 case kThreadWaitKernelRWLockUpgrade:
3742 kdp_rwlck_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo_v1);
3743 break;
3744 case kThreadWaitPThreadMutex:
3745 case kThreadWaitPThreadRWLockRead:
3746 case kThreadWaitPThreadRWLockWrite:
3747 case kThreadWaitPThreadCondVar:
3748 kdp_pthread_find_owner(thread, waitinfo_v1);
3749 break;
3750 case kThreadWaitWorkloopSyncWait:
3751 kdp_workloop_sync_wait_find_owner(thread, thread->wait_event, waitinfo_v1);
3752 break;
3753 case kThreadWaitOnProcess:
3754 kdp_wait4_find_process(thread, thread->wait_event, waitinfo_v1);
3755 break;
3756 case kThreadWaitSleepWithInheritor:
3757 kdp_sleep_with_inheritor_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo_v1);
3758 break;
3759 case kThreadWaitEventlink:
3760 kdp_eventlink_find_owner(thread->waitq.wq_q, thread->wait_event, waitinfo_v1);
3761 break;
3762 case kThreadWaitCompressor:
3763 kdp_compressor_busy_find_owner(thread->wait_event, waitinfo_v1);
3764 break;
3765 default:
3766 waitinfo->owner = 0;
3767 waitinfo->context = 0;
3768 break;
3769 }
3770 }
3771