]> git.saurik.com Git - apple/xnu.git/blame - osfmk/kern/kern_stackshot.c
xnu-7195.81.3.tar.gz
[apple/xnu.git] / osfmk / kern / kern_stackshot.c
CommitLineData
fe8ab488 1/*
f427ee49 2 * Copyright (c) 2013-2020 Apple Inc. All rights reserved.
fe8ab488
A
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5ba3f43e 5 *
fe8ab488
A
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
5ba3f43e 14 *
fe8ab488
A
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
5ba3f43e 17 *
fe8ab488
A
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
5ba3f43e 25 *
fe8ab488
A
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28
29#include <mach/mach_types.h>
30#include <mach/vm_param.h>
3e170ce0 31#include <mach/mach_vm.h>
39037602 32#include <mach/clock_types.h>
3e170ce0
A
33#include <sys/errno.h>
34#include <sys/stackshot.h>
fe8ab488
A
35#ifdef IMPORTANCE_INHERITANCE
36#include <ipc/ipc_importance.h>
37#endif
38#include <sys/appleapiopts.h>
39#include <kern/debug.h>
813fb2f6 40#include <kern/block_hint.h>
fe8ab488
A
41#include <uuid/uuid.h>
42
43#include <kdp/kdp_dyld.h>
44#include <kdp/kdp_en_debugger.h>
45
46#include <libsa/types.h>
47#include <libkern/version.h>
d9a64523 48#include <libkern/section_keywords.h>
fe8ab488
A
49
50#include <string.h> /* bcopy */
51
f427ee49 52#include <kern/cambria_layout.h>
5ba3f43e 53#include <kern/coalition.h>
fe8ab488 54#include <kern/processor.h>
f427ee49 55#include <kern/host_statistics.h>
fe8ab488 56#include <kern/thread.h>
5ba3f43e 57#include <kern/thread_group.h>
39037602 58#include <kern/task.h>
3e170ce0 59#include <kern/telemetry.h>
fe8ab488 60#include <kern/clock.h>
39037602 61#include <kern/policy_internal.h>
fe8ab488
A
62#include <vm/vm_map.h>
63#include <vm/vm_kern.h>
64#include <vm/vm_pageout.h>
3e170ce0 65#include <vm/vm_fault.h>
fe8ab488 66#include <vm/vm_shared_region.h>
ea3f0419 67#include <vm/vm_compressor.h>
fe8ab488 68#include <libkern/OSKextLibPrivate.h>
f427ee49 69#include <os/log.h>
fe8ab488 70
d9a64523
A
71#if defined(__x86_64__)
72#include <i386/mp.h>
73#include <i386/cpu_threads.h>
74#endif
75
f427ee49 76#include <pexpert/pexpert.h>
3e170ce0 77
5ba3f43e
A
78#if MONOTONIC
79#include <kern/monotonic.h>
80#endif /* MONOTONIC */
81
82#include <san/kasan.h>
83
f427ee49
A
84#if DEBUG || DEVELOPMENT
85# define STACKSHOT_COLLECTS_LATENCY_INFO 1
86#else
87# define STACKSHOT_COLLECTS_LATENCY_INFO 0
88#endif /* DEBUG || DEVELOPMENT */
89
fe8ab488
A
90extern unsigned int not_in_kdp;
91
39037602 92
813fb2f6
A
93/* indicate to the compiler that some accesses are unaligned */
94typedef uint64_t unaligned_u64 __attribute__((aligned(1)));
95
fe8ab488
A
96extern addr64_t kdp_vtophys(pmap_t pmap, addr64_t va);
97
39037602
A
98int kdp_snapshot = 0;
99static kern_return_t stack_snapshot_ret = 0;
3e170ce0 100static uint32_t stack_snapshot_bytes_traced = 0;
f427ee49 101static uint32_t stack_snapshot_bytes_uncompressed = 0;
fe8ab488 102
f427ee49
A
103#if STACKSHOT_COLLECTS_LATENCY_INFO
104static bool collect_latency_info = true;
105#endif
3e170ce0 106static kcdata_descriptor_t stackshot_kcdata_p = NULL;
fe8ab488
A
107static void *stack_snapshot_buf;
108static uint32_t stack_snapshot_bufsize;
109int stack_snapshot_pid;
f427ee49 110static uint64_t stack_snapshot_flags;
39037602 111static uint64_t stack_snapshot_delta_since_timestamp;
f427ee49 112static uint32_t stack_snapshot_pagetable_mask;
39037602
A
113static boolean_t panic_stackshot;
114
115static boolean_t stack_enable_faulting = FALSE;
116static struct stackshot_fault_stats fault_stats;
3e170ce0 117
813fb2f6 118static unaligned_u64 * stackshot_duration_outer;
39037602 119static uint64_t stackshot_microsecs;
3e170ce0 120
39037602
A
121void * kernel_stackshot_buf = NULL; /* Pointer to buffer for stackshots triggered from the kernel and retrieved later */
122int kernel_stackshot_buf_size = 0;
fe8ab488 123
39037602
A
124void * stackshot_snapbuf = NULL; /* Used by stack_snapshot2 (to be removed) */
125
f427ee49
A
126#if INTERRUPT_MASKED_DEBUG
127extern boolean_t interrupt_masked_debug;
128#endif
129
39037602 130__private_extern__ void stackshot_init( void );
3e170ce0 131static boolean_t memory_iszero(void *addr, size_t size);
0a7de745
A
132uint32_t get_stackshot_estsize(uint32_t prev_size_hint);
133kern_return_t kern_stack_snapshot_internal(int stackshot_config_version, void *stackshot_config,
134 size_t stackshot_config_size, boolean_t stackshot_from_user);
135kern_return_t do_stackshot(void *);
f427ee49 136void kdp_snapshot_preflight(int pid, void * tracebuf, uint32_t tracebuf_size, uint64_t flags, kcdata_descriptor_t data_p, uint64_t since_timestamp, uint32_t pagetable_mask);
39037602 137boolean_t stackshot_thread_is_idle_worker_unsafe(thread_t thread);
f427ee49 138static int kdp_stackshot_kcdata_format(int pid, uint64_t trace_flags, uint32_t *pBytesTraced, uint32_t *pBytesUncompressed);
0a7de745 139uint32_t kdp_stack_snapshot_bytes_traced(void);
f427ee49 140uint32_t kdp_stack_snapshot_bytes_uncompressed(void);
0a7de745
A
141static void kdp_mem_and_io_snapshot(struct mem_and_io_snapshot *memio_snap);
142static boolean_t kdp_copyin(vm_map_t map, uint64_t uaddr, void *dest, size_t size, boolean_t try_fault, uint32_t *kdp_fault_result);
cb323159 143static int kdp_copyin_string(task_t task, uint64_t addr, char *buf, int buf_sz, boolean_t try_fault, uint32_t *kdp_fault_results);
0a7de745
A
144static boolean_t kdp_copyin_word(task_t task, uint64_t addr, uint64_t *result, boolean_t try_fault, uint32_t *kdp_fault_results);
145static uint64_t proc_was_throttled_from_task(task_t task);
146static void stackshot_thread_wait_owner_info(thread_t thread, thread_waitinfo_t * waitinfo);
147static int stackshot_thread_has_valid_waitinfo(thread_t thread);
cb323159
A
148static void stackshot_thread_turnstileinfo(thread_t thread, thread_turnstileinfo_t *tsinfo);
149static int stackshot_thread_has_valid_turnstileinfo(thread_t thread);
fe8ab488 150
5ba3f43e 151#if CONFIG_COALITIONS
0a7de745
A
152static void stackshot_coalition_jetsam_count(void *arg, int i, coalition_t coal);
153static void stackshot_coalition_jetsam_snapshot(void *arg, int i, coalition_t coal);
5ba3f43e
A
154#endif /* CONFIG_COALITIONS */
155
f427ee49
A
156#if CONFIG_THREAD_GROUPS
157static void stackshot_thread_group_count(void *arg, int i, struct thread_group *tg);
158static void stackshot_thread_group_snapshot(void *arg, int i, struct thread_group *tg);
159#endif /* CONFIG_THREAD_GROUPS */
5ba3f43e 160
0a7de745 161extern uint32_t workqueue_get_pwq_state_kdp(void *proc);
39037602 162
f427ee49
A
163struct proc;
164extern int proc_pid(struct proc *p);
0a7de745
A
165extern uint64_t proc_uniqueid(void *p);
166extern uint64_t proc_was_throttled(void *p);
167extern uint64_t proc_did_throttle(void *p);
168extern int proc_exiting(void *p);
169extern int proc_in_teardown(void *p);
170static uint64_t proc_did_throttle_from_task(task_t task);
171extern void proc_name_kdp(task_t task, char * buf, int size);
172extern int proc_threadname_kdp(void * uth, char * buf, size_t size);
173extern void proc_starttime_kdp(void * p, uint64_t * tv_sec, uint64_t * tv_usec, uint64_t * abstime);
f427ee49 174extern void proc_archinfo_kdp(void* p, cpu_type_t* cputype, cpu_subtype_t* cpusubtype);
cb323159 175extern boolean_t proc_binary_uuid_kdp(task_t task, uuid_t uuid);
0a7de745
A
176extern int memorystatus_get_pressure_status_kdp(void);
177extern void memorystatus_proc_flags_unsafe(void * v, boolean_t *is_dirty, boolean_t *is_dirty_tracked, boolean_t *allow_idle_exit);
39037602
A
178
179extern int count_busy_buffers(void); /* must track with declaration in bsd/sys/buf_internal.h */
180extern void bcopy_phys(addr64_t, addr64_t, vm_size_t);
181
182#if CONFIG_TELEMETRY
183extern kern_return_t stack_microstackshot(user_addr_t tracebuf, uint32_t tracebuf_size, uint32_t flags, int32_t *retval);
184#endif /* CONFIG_TELEMETRY */
fe8ab488 185
39037602
A
186extern kern_return_t kern_stack_snapshot_with_reason(char* reason);
187extern kern_return_t kern_stack_snapshot_internal(int stackshot_config_version, void *stackshot_config, size_t stackshot_config_size, boolean_t stackshot_from_user);
fe8ab488 188
39037602
A
189/*
190 * Validates that the given address is both a valid page and has
191 * default caching attributes for the current map. Returns
fe8ab488
A
192 * 0 if the address is invalid, and a kernel virtual address for
193 * the given address if it is valid.
194 */
3e170ce0 195vm_offset_t machine_trace_thread_get_kva(vm_offset_t cur_target_addr, vm_map_t map, uint32_t *thread_trace_flags);
fe8ab488 196
39037602
A
197#define KDP_FAULT_RESULT_PAGED_OUT 0x1 /* some data was unable to be retrieved */
198#define KDP_FAULT_RESULT_TRIED_FAULT 0x2 /* tried to fault in data */
199#define KDP_FAULT_RESULT_FAULTED_IN 0x4 /* successfully faulted in data */
200
201/*
202 * Looks up the physical translation for the given address in the target map, attempting
203 * to fault data in if requested and it is not resident. Populates thread_trace_flags if requested
204 * as well.
205 */
206vm_offset_t kdp_find_phys(vm_map_t map, vm_offset_t target_addr, boolean_t try_fault, uint32_t *kdp_fault_results);
207
208static size_t stackshot_strlcpy(char *dst, const char *src, size_t maxlen);
f427ee49 209void stackshot_memcpy(void *dst, const void *src, size_t len);
39037602 210
fe8ab488 211/* Clears caching information used by the above validation routine
39037602 212 * (in case the current map has been changed or cleared).
fe8ab488
A
213 */
214void machine_trace_thread_clear_validation_cache(void);
215
216#define MAX_FRAMES 1000
3e170ce0 217#define MAX_LOADINFOS 500
3e170ce0 218#define TASK_IMP_WALK_LIMIT 20
fe8ab488
A
219
220typedef struct thread_snapshot *thread_snapshot_t;
221typedef struct task_snapshot *task_snapshot_t;
222
223#if CONFIG_KDP_INTERACTIVE_DEBUGGING
224extern kdp_send_t kdp_en_send_pkt;
0a7de745 225#endif
fe8ab488
A
226
227/*
228 * Globals to support machine_trace_thread_get_kva.
229 */
230static vm_offset_t prev_target_page = 0;
231static vm_offset_t prev_target_kva = 0;
232static boolean_t validate_next_addr = TRUE;
233
3e170ce0
A
234/*
235 * Stackshot locking and other defines.
236 */
f427ee49
A
237static LCK_GRP_DECLARE(stackshot_subsys_lck_grp, "stackshot_subsys_lock");
238static LCK_MTX_DECLARE(stackshot_subsys_mutex, &stackshot_subsys_lck_grp);
3e170ce0
A
239
240#define STACKSHOT_SUBSYS_LOCK() lck_mtx_lock(&stackshot_subsys_mutex)
39037602 241#define STACKSHOT_SUBSYS_TRY_LOCK() lck_mtx_try_lock(&stackshot_subsys_mutex)
3e170ce0 242#define STACKSHOT_SUBSYS_UNLOCK() lck_mtx_unlock(&stackshot_subsys_mutex)
3e170ce0 243
0a7de745
A
244#define SANE_BOOTPROFILE_TRACEBUF_SIZE (64ULL * 1024ULL * 1024ULL)
245#define SANE_TRACEBUF_SIZE (8ULL * 1024ULL * 1024ULL)
246
247#define TRACEBUF_SIZE_PER_GB (1024ULL * 1024ULL)
f427ee49 248#define GIGABYTES (1024ULL * 1024ULL * 1024ULL)
39037602 249
d9a64523
A
250SECURITY_READ_ONLY_LATE(static uint32_t) max_tracebuf_size = SANE_TRACEBUF_SIZE;
251
39037602
A
252/*
253 * We currently set a ceiling of 3 milliseconds spent in the kdp fault path
254 * for non-panic stackshots where faulting is requested.
255 */
256#define KDP_FAULT_PATH_MAX_TIME_PER_STACKSHOT_NSECS (3 * NSEC_PER_MSEC)
257
258#define STACKSHOT_SUPP_SIZE (16 * 1024) /* Minimum stackshot size */
259#define TASK_UUID_AVG_SIZE (16 * sizeof(uuid_t)) /* Average space consumed by UUIDs/task */
260
0a7de745
A
261#ifndef ROUNDUP
262#define ROUNDUP(x, y) ((((x)+(y)-1)/(y))*(y))
263#endif
264
cb323159
A
265#define STACKSHOT_QUEUE_LABEL_MAXSIZE 64
266
39037602
A
267/*
268 * Initialize the mutex governing access to the stack snapshot subsystem
269 * and other stackshot related bits.
270 */
3e170ce0 271__private_extern__ void
39037602 272stackshot_init( void )
3e170ce0 273{
39037602
A
274 mach_timebase_info_data_t timebase;
275
39037602 276 clock_timebase_info(&timebase);
0a7de745
A
277 fault_stats.sfs_system_max_fault_time = ((KDP_FAULT_PATH_MAX_TIME_PER_STACKSHOT_NSECS * timebase.denom) / timebase.numer);
278
f427ee49 279 max_tracebuf_size = MAX(max_tracebuf_size, ((ROUNDUP(max_mem, GIGABYTES) / GIGABYTES) * TRACEBUF_SIZE_PER_GB));
d9a64523
A
280
281 PE_parse_boot_argn("stackshot_maxsz", &max_tracebuf_size, sizeof(max_tracebuf_size));
39037602 282}
fe8ab488 283
0a7de745
A
284/*
285 * Method for grabbing timer values safely, in the sense that no infinite loop will occur
286 * Certain flavors of the timer_grab function, which would seem to be the thing to use,
287 * can loop infinitely if called while the timer is in the process of being updated.
288 * Unfortunately, it is (rarely) possible to get inconsistent top and bottom halves of
289 * the timer using this method. This seems insoluble, since stackshot runs in a context
290 * where the timer might be half-updated, and has no way of yielding control just long
291 * enough to finish the update.
fe8ab488
A
292 */
293
0a7de745
A
294static uint64_t
295safe_grab_timer_value(struct timer *t)
fe8ab488
A
296{
297#if defined(__LP64__)
0a7de745 298 return t->all_bits;
fe8ab488 299#else
0a7de745
A
300 uint64_t time = t->high_bits; /* endian independent grab */
301 time = (time << 32) | t->low_bits;
302 return time;
fe8ab488
A
303#endif
304}
305
5ba3f43e
A
306/*
307 * Called with interrupts disabled after stackshot context has been
308 * initialized. Updates stack_snapshot_ret.
309 */
0a7de745 310static kern_return_t
5ba3f43e
A
311stackshot_trap()
312{
0a7de745 313 kern_return_t rv;
d9a64523
A
314
315#if defined(__x86_64__)
316 /*
317 * Since mp_rendezvous and stackshot both attempt to capture cpus then perform an
318 * operation, it's essential to apply mutual exclusion to the other when one
319 * mechanism is in operation, lest there be a deadlock as the mechanisms race to
320 * capture CPUs.
321 *
322 * Further, we assert that invoking stackshot from mp_rendezvous*() is not
323 * allowed, so we check to ensure there there is no rendezvous in progress before
324 * trying to grab the lock (if there is, a deadlock will occur when we try to
325 * grab the lock). This is accomplished by setting cpu_rendezvous_in_progress to
326 * TRUE in the mp rendezvous action function. If stackshot_trap() is called by
327 * a subordinate of the call chain within the mp rendezvous action, this flag will
328 * be set and can be used to detect the inevitable deadlock that would occur
329 * if this thread tried to grab the rendezvous lock.
330 */
331
332 if (current_cpu_datap()->cpu_rendezvous_in_progress == TRUE) {
333 panic("Calling stackshot from a rendezvous is not allowed!");
334 }
335
336 mp_rendezvous_lock();
337#endif
338
339 rv = DebuggerTrapWithState(DBOP_STACKSHOT, NULL, NULL, NULL, 0, NULL, FALSE, 0);
340
341#if defined(__x86_64__)
342 mp_rendezvous_unlock();
343#endif
0a7de745 344 return rv;
5ba3f43e
A
345}
346
347
3e170ce0 348kern_return_t
f427ee49 349stack_snapshot_from_kernel(int pid, void *buf, uint32_t size, uint64_t flags, uint64_t delta_since_timestamp, uint32_t pagetable_mask, unsigned *bytes_traced)
3e170ce0 350{
39037602 351 kern_return_t error = KERN_SUCCESS;
3e170ce0
A
352 boolean_t istate;
353
5ba3f43e
A
354#if DEVELOPMENT || DEBUG
355 if (kern_feature_override(KF_STACKSHOT_OVRD) == TRUE) {
356 error = KERN_NOT_SUPPORTED;
357 goto out;
358 }
359#endif
3e170ce0
A
360 if ((buf == NULL) || (size <= 0) || (bytes_traced == NULL)) {
361 return KERN_INVALID_ARGUMENT;
362 }
363
d9a64523
A
364 /* cap in individual stackshot to max_tracebuf_size */
365 if (size > max_tracebuf_size) {
366 size = max_tracebuf_size;
3e170ce0
A
367 }
368
369 /* Serialize tracing */
39037602
A
370 if (flags & STACKSHOT_TRYLOCK) {
371 if (!STACKSHOT_SUBSYS_TRY_LOCK()) {
372 return KERN_LOCK_OWNED;
373 }
374 } else {
375 STACKSHOT_SUBSYS_LOCK();
376 }
377
39037602
A
378 struct kcdata_descriptor kcdata;
379 uint32_t hdr_tag = (flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) ?
0a7de745 380 KCDATA_BUFFER_BEGIN_DELTA_STACKSHOT : KCDATA_BUFFER_BEGIN_STACKSHOT;
39037602
A
381
382 error = kcdata_memory_static_init(&kcdata, (mach_vm_address_t)buf, hdr_tag, size,
0a7de745 383 KCFLAG_USE_MEMCOPY | KCFLAG_NO_AUTO_ENDBUFFER);
39037602
A
384 if (error) {
385 goto out;
386 }
3e170ce0 387
5ba3f43e
A
388 istate = ml_set_interrupts_enabled(FALSE);
389
3e170ce0 390 /* Preload trace parameters*/
f427ee49
A
391 kdp_snapshot_preflight(pid, buf, size, flags, &kcdata,
392 delta_since_timestamp, pagetable_mask);
3e170ce0 393
5ba3f43e
A
394 /*
395 * Trap to the debugger to obtain a coherent stack snapshot; this populates
3e170ce0
A
396 * the trace buffer
397 */
5ba3f43e 398 error = stackshot_trap();
3e170ce0
A
399
400 ml_set_interrupts_enabled(istate);
401
402 *bytes_traced = kdp_stack_snapshot_bytes_traced();
403
39037602 404out:
5ba3f43e 405 stackshot_kcdata_p = NULL;
3e170ce0 406 STACKSHOT_SUBSYS_UNLOCK();
3e170ce0
A
407 return error;
408}
409
410#if CONFIG_TELEMETRY
411kern_return_t
412stack_microstackshot(user_addr_t tracebuf, uint32_t tracebuf_size, uint32_t flags, int32_t *retval)
413{
414 int error = KERN_SUCCESS;
415 uint32_t bytes_traced = 0;
416
417 *retval = -1;
418
419 /*
420 * Control related operations
421 */
422 if (flags & STACKSHOT_GLOBAL_MICROSTACKSHOT_ENABLE) {
423 telemetry_global_ctl(1);
424 *retval = 0;
425 goto exit;
426 } else if (flags & STACKSHOT_GLOBAL_MICROSTACKSHOT_DISABLE) {
427 telemetry_global_ctl(0);
428 *retval = 0;
429 goto exit;
430 }
431
3e170ce0
A
432 /*
433 * Data related operations
434 */
435 *retval = -1;
436
437 if ((((void*)tracebuf) == NULL) || (tracebuf_size == 0)) {
438 error = KERN_INVALID_ARGUMENT;
439 goto exit;
440 }
441
442 STACKSHOT_SUBSYS_LOCK();
443
444 if (flags & STACKSHOT_GET_MICROSTACKSHOT) {
d9a64523 445 if (tracebuf_size > max_tracebuf_size) {
3e170ce0
A
446 error = KERN_INVALID_ARGUMENT;
447 goto unlock_exit;
448 }
449
450 bytes_traced = tracebuf_size;
451 error = telemetry_gather(tracebuf, &bytes_traced,
0a7de745 452 (flags & STACKSHOT_SET_MICROSTACKSHOT_MARK) ? TRUE : FALSE);
3e170ce0
A
453 *retval = (int)bytes_traced;
454 goto unlock_exit;
455 }
456
3e170ce0
A
457unlock_exit:
458 STACKSHOT_SUBSYS_UNLOCK();
459exit:
460 return error;
461}
462#endif /* CONFIG_TELEMETRY */
463
464/*
465 * Return the estimated size of a stackshot based on the
466 * number of currently running threads and tasks.
467 */
468uint32_t
469get_stackshot_estsize(uint32_t prev_size_hint)
470{
471 vm_size_t thread_total;
472 vm_size_t task_total;
473 uint32_t estimated_size;
f427ee49
A
474 size_t est_thread_size = sizeof(struct thread_snapshot);
475 size_t est_task_size = sizeof(struct task_snapshot) + TASK_UUID_AVG_SIZE;
3e170ce0 476
f427ee49
A
477#if STACKSHOT_COLLECTS_LATENCY_INFO
478 if (collect_latency_info) {
479 est_thread_size += sizeof(struct stackshot_latency_thread);
480 est_task_size += sizeof(struct stackshot_latency_task);
481 }
482#endif
483
484 thread_total = (threads_count * est_thread_size);
485 task_total = (tasks_count * est_task_size);
3e170ce0
A
486
487 estimated_size = (uint32_t) VM_MAP_ROUND_PAGE((thread_total + task_total + STACKSHOT_SUPP_SIZE), PAGE_MASK);
488 if (estimated_size < prev_size_hint) {
489 estimated_size = (uint32_t) VM_MAP_ROUND_PAGE(prev_size_hint, PAGE_MASK);
490 }
491
492 return estimated_size;
493}
494
495/*
496 * stackshot_remap_buffer: Utility function to remap bytes_traced bytes starting at stackshotbuf
497 * into the current task's user space and subsequently copy out the address
498 * at which the buffer has been mapped in user space to out_buffer_addr.
499 *
500 * Inputs: stackshotbuf - pointer to the original buffer in the kernel's address space
501 * bytes_traced - length of the buffer to remap starting from stackshotbuf
502 * out_buffer_addr - pointer to placeholder where newly mapped buffer will be mapped.
503 * out_size_addr - pointer to be filled in with the size of the buffer
504 *
505 * Outputs: ENOSPC if there is not enough free space in the task's address space to remap the buffer
506 * EINVAL for all other errors returned by task_remap_buffer/mach_vm_remap
507 * an error from copyout
508 */
509static kern_return_t
510stackshot_remap_buffer(void *stackshotbuf, uint32_t bytes_traced, uint64_t out_buffer_addr, uint64_t out_size_addr)
511{
0a7de745
A
512 int error = 0;
513 mach_vm_offset_t stackshotbuf_user_addr = (mach_vm_offset_t)NULL;
514 vm_prot_t cur_prot, max_prot;
3e170ce0 515
5ba3f43e 516 error = mach_vm_remap_kernel(get_task_map(current_task()), &stackshotbuf_user_addr, bytes_traced, 0,
0a7de745 517 VM_FLAGS_ANYWHERE, VM_KERN_MEMORY_NONE, kernel_map, (mach_vm_offset_t)stackshotbuf, FALSE, &cur_prot, &max_prot, VM_INHERIT_DEFAULT);
3e170ce0
A
518 /*
519 * If the call to mach_vm_remap fails, we return the appropriate converted error
520 */
521 if (error == KERN_SUCCESS) {
522 /*
523 * If we fail to copy out the address or size of the new buffer, we remove the buffer mapping that
524 * we just made in the task's user space.
525 */
526 error = copyout(CAST_DOWN(void *, &stackshotbuf_user_addr), (user_addr_t)out_buffer_addr, sizeof(stackshotbuf_user_addr));
527 if (error != KERN_SUCCESS) {
528 mach_vm_deallocate(get_task_map(current_task()), stackshotbuf_user_addr, (mach_vm_size_t)bytes_traced);
529 return error;
530 }
531 error = copyout(&bytes_traced, (user_addr_t)out_size_addr, sizeof(bytes_traced));
532 if (error != KERN_SUCCESS) {
533 mach_vm_deallocate(get_task_map(current_task()), stackshotbuf_user_addr, (mach_vm_size_t)bytes_traced);
534 return error;
535 }
536 }
537 return error;
538}
539
540kern_return_t
541kern_stack_snapshot_internal(int stackshot_config_version, void *stackshot_config, size_t stackshot_config_size, boolean_t stackshot_from_user)
542{
543 int error = 0;
544 boolean_t prev_interrupt_state;
545 uint32_t bytes_traced = 0;
546 uint32_t stackshotbuf_size = 0;
547 void * stackshotbuf = NULL;
548 kcdata_descriptor_t kcdata_p = NULL;
549
550 void * buf_to_free = NULL;
551 int size_to_free = 0;
552
553 /* Parsed arguments */
0a7de745
A
554 uint64_t out_buffer_addr;
555 uint64_t out_size_addr;
556 int pid = -1;
f427ee49 557 uint64_t flags;
0a7de745
A
558 uint64_t since_timestamp;
559 uint32_t size_hint = 0;
f427ee49 560 uint32_t pagetable_mask = STACKSHOT_PAGETABLES_MASK_ALL;
0a7de745
A
561
562 if (stackshot_config == NULL) {
563 return KERN_INVALID_ARGUMENT;
3e170ce0 564 }
5ba3f43e
A
565#if DEVELOPMENT || DEBUG
566 /* TBD: ask stackshot clients to avoid issuing stackshots in this
567 * configuration in lieu of the kernel feature override.
568 */
569 if (kern_feature_override(KF_STACKSHOT_OVRD) == TRUE) {
570 return KERN_NOT_SUPPORTED;
571 }
572#endif
3e170ce0
A
573
574 switch (stackshot_config_version) {
0a7de745
A
575 case STACKSHOT_CONFIG_TYPE:
576 if (stackshot_config_size != sizeof(stackshot_config_t)) {
577 return KERN_INVALID_ARGUMENT;
578 }
579 stackshot_config_t *config = (stackshot_config_t *) stackshot_config;
580 out_buffer_addr = config->sc_out_buffer_addr;
581 out_size_addr = config->sc_out_size_addr;
582 pid = config->sc_pid;
583 flags = config->sc_flags;
584 since_timestamp = config->sc_delta_timestamp;
585 if (config->sc_size <= max_tracebuf_size) {
586 size_hint = config->sc_size;
587 }
f427ee49
A
588 /*
589 * Retain the pre-sc_pagetable_mask behavior of STACKSHOT_PAGE_TABLES,
590 * dump every level if the pagetable_mask is not set
591 */
592 if (flags & STACKSHOT_PAGE_TABLES && config->sc_pagetable_mask) {
593 pagetable_mask = config->sc_pagetable_mask;
594 }
0a7de745
A
595 break;
596 default:
597 return KERN_NOT_SUPPORTED;
598 }
599
600 /*
601 * Currently saving a kernel buffer and trylock are only supported from the
602 * internal/KEXT API.
603 */
604 if (stackshot_from_user) {
605 if (flags & (STACKSHOT_TRYLOCK | STACKSHOT_SAVE_IN_KERNEL_BUFFER | STACKSHOT_FROM_PANIC)) {
606 return KERN_NO_ACCESS;
607 }
f427ee49
A
608#if !DEVELOPMENT && !DEBUG
609 if (flags & (STACKSHOT_DO_COMPRESS)) {
610 return KERN_NO_ACCESS;
611 }
612#endif
0a7de745 613 } else {
3e170ce0
A
614 if (!(flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER)) {
615 return KERN_NOT_SUPPORTED;
616 }
617 }
618
d190cdc3 619 if (!((flags & STACKSHOT_KCDATA_FORMAT) || (flags & STACKSHOT_RETRIEVE_EXISTING_BUFFER))) {
3e170ce0
A
620 return KERN_NOT_SUPPORTED;
621 }
622
f427ee49
A
623 /* Compresssed delta stackshots or page dumps are not yet supported */
624 if (((flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) || (flags & STACKSHOT_PAGE_TABLES))
625 && (flags & STACKSHOT_DO_COMPRESS)) {
626 return KERN_NOT_SUPPORTED;
627 }
628
3e170ce0 629 /*
d190cdc3 630 * If we're not saving the buffer in the kernel pointer, we need a place to copy into.
3e170ce0
A
631 */
632 if ((!out_buffer_addr || !out_size_addr) && !(flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER)) {
633 return KERN_INVALID_ARGUMENT;
634 }
635
39037602
A
636 if (since_timestamp != 0 && ((flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) == 0)) {
637 return KERN_INVALID_ARGUMENT;
3e170ce0
A
638 }
639
5ba3f43e
A
640#if MONOTONIC
641 if (!mt_core_supported) {
642 flags &= ~STACKSHOT_INSTRS_CYCLES;
643 }
644#else /* MONOTONIC */
645 flags &= ~STACKSHOT_INSTRS_CYCLES;
646#endif /* !MONOTONIC */
647
3e170ce0
A
648 STACKSHOT_SUBSYS_LOCK();
649
650 if (flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER) {
651 /*
652 * Don't overwrite an existing stackshot
653 */
654 if (kernel_stackshot_buf != NULL) {
655 error = KERN_MEMORY_PRESENT;
656 goto error_exit;
657 }
658 } else if (flags & STACKSHOT_RETRIEVE_EXISTING_BUFFER) {
659 if ((kernel_stackshot_buf == NULL) || (kernel_stackshot_buf_size <= 0)) {
660 error = KERN_NOT_IN_SET;
661 goto error_exit;
662 }
663 error = stackshot_remap_buffer(kernel_stackshot_buf, kernel_stackshot_buf_size,
0a7de745 664 out_buffer_addr, out_size_addr);
3e170ce0 665 /*
0a7de745 666 * If we successfully remapped the buffer into the user's address space, we
3e170ce0
A
667 * set buf_to_free and size_to_free so the prior kernel mapping will be removed
668 * and then clear the kernel stackshot pointer and associated size.
669 */
670 if (error == KERN_SUCCESS) {
671 buf_to_free = kernel_stackshot_buf;
672 size_to_free = (int) VM_MAP_ROUND_PAGE(kernel_stackshot_buf_size, PAGE_MASK);
673 kernel_stackshot_buf = NULL;
674 kernel_stackshot_buf_size = 0;
675 }
0a7de745 676
3e170ce0
A
677 goto error_exit;
678 }
679
39037602
A
680 if (flags & STACKSHOT_GET_BOOT_PROFILE) {
681 void *bootprofile = NULL;
682 uint32_t len = 0;
683#if CONFIG_TELEMETRY
684 bootprofile_get(&bootprofile, &len);
685#endif
686 if (!bootprofile || !len) {
687 error = KERN_NOT_IN_SET;
688 goto error_exit;
689 }
690 error = stackshot_remap_buffer(bootprofile, len, out_buffer_addr, out_size_addr);
691 goto error_exit;
692 }
693
3e170ce0
A
694 stackshotbuf_size = get_stackshot_estsize(size_hint);
695
d9a64523 696 for (; stackshotbuf_size <= max_tracebuf_size; stackshotbuf_size <<= 1) {
c6bf4f31 697 if (kmem_alloc_flags(kernel_map, (vm_offset_t *)&stackshotbuf, stackshotbuf_size, VM_KERN_MEMORY_DIAG, KMA_ZERO) != KERN_SUCCESS) {
3e170ce0
A
698 error = KERN_RESOURCE_SHORTAGE;
699 goto error_exit;
700 }
701
3e170ce0 702
f427ee49
A
703 uint32_t hdr_tag = (flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) ? KCDATA_BUFFER_BEGIN_DELTA_STACKSHOT
704 : (flags & STACKSHOT_DO_COMPRESS) ? KCDATA_BUFFER_BEGIN_COMPRESSED
705 : KCDATA_BUFFER_BEGIN_STACKSHOT;
39037602 706 kcdata_p = kcdata_memory_alloc_init((mach_vm_address_t)stackshotbuf, hdr_tag, stackshotbuf_size,
0a7de745 707 KCFLAG_USE_MEMCOPY | KCFLAG_NO_AUTO_ENDBUFFER);
3e170ce0 708
39037602
A
709 stackshot_duration_outer = NULL;
710 uint64_t time_start = mach_absolute_time();
3e170ce0 711
f427ee49
A
712 /* if compression was requested, allocate the extra zlib scratch area */
713 if (flags & STACKSHOT_DO_COMPRESS) {
714 hdr_tag = (flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) ? KCDATA_BUFFER_BEGIN_DELTA_STACKSHOT
715 : KCDATA_BUFFER_BEGIN_STACKSHOT;
716 error = kcdata_init_compress(kcdata_p, hdr_tag, stackshot_memcpy, KCDCT_ZLIB);
717 if (error != KERN_SUCCESS) {
718 os_log(OS_LOG_DEFAULT, "failed to initialize compression: %d!\n",
719 (int) error);
720 goto error_exit;
721 }
722 }
723
3e170ce0
A
724 /*
725 * Disable interrupts and save the current interrupt state.
726 */
727 prev_interrupt_state = ml_set_interrupts_enabled(FALSE);
728
729 /*
730 * Load stackshot parameters.
731 */
f427ee49
A
732 kdp_snapshot_preflight(pid, stackshotbuf, stackshotbuf_size, flags, kcdata_p, since_timestamp,
733 pagetable_mask);
3e170ce0 734
5ba3f43e 735 error = stackshot_trap();
3e170ce0
A
736
737 ml_set_interrupts_enabled(prev_interrupt_state);
738
39037602
A
739 /* record the duration that interupts were disabled */
740
741 uint64_t time_end = mach_absolute_time();
742 if (stackshot_duration_outer) {
743 *stackshot_duration_outer = time_end - time_start;
744 }
745
39037602 746 if (error != KERN_SUCCESS) {
3e170ce0
A
747 if (kcdata_p != NULL) {
748 kcdata_memory_destroy(kcdata_p);
749 kcdata_p = NULL;
750 stackshot_kcdata_p = NULL;
751 }
752 kmem_free(kernel_map, (vm_offset_t)stackshotbuf, stackshotbuf_size);
753 stackshotbuf = NULL;
39037602
A
754 if (error == KERN_INSUFFICIENT_BUFFER_SIZE) {
755 /*
756 * If we didn't allocate a big enough buffer, deallocate and try again.
757 */
758 continue;
759 } else {
760 goto error_exit;
761 }
3e170ce0
A
762 }
763
764 bytes_traced = kdp_stack_snapshot_bytes_traced();
765
766 if (bytes_traced <= 0) {
39037602 767 error = KERN_ABORTED;
3e170ce0
A
768 goto error_exit;
769 }
770
771 assert(bytes_traced <= stackshotbuf_size);
772 if (!(flags & STACKSHOT_SAVE_IN_KERNEL_BUFFER)) {
773 error = stackshot_remap_buffer(stackshotbuf, bytes_traced, out_buffer_addr, out_size_addr);
774 goto error_exit;
775 }
776
777 /*
778 * Save the stackshot in the kernel buffer.
779 */
780 kernel_stackshot_buf = stackshotbuf;
781 kernel_stackshot_buf_size = bytes_traced;
782 /*
783 * Figure out if we didn't use all the pages in the buffer. If so, we set buf_to_free to the beginning of
784 * the next page after the end of the stackshot in the buffer so that the kmem_free clips the buffer and
785 * update size_to_free for kmem_free accordingly.
786 */
787 size_to_free = stackshotbuf_size - (int) VM_MAP_ROUND_PAGE(bytes_traced, PAGE_MASK);
788
789 assert(size_to_free >= 0);
790
791 if (size_to_free != 0) {
792 buf_to_free = (void *)((uint64_t)stackshotbuf + stackshotbuf_size - size_to_free);
793 }
794
795 stackshotbuf = NULL;
796 stackshotbuf_size = 0;
797 goto error_exit;
798 }
799
d9a64523 800 if (stackshotbuf_size > max_tracebuf_size) {
3e170ce0
A
801 error = KERN_RESOURCE_SHORTAGE;
802 }
803
804error_exit:
805 if (kcdata_p != NULL) {
806 kcdata_memory_destroy(kcdata_p);
807 kcdata_p = NULL;
808 stackshot_kcdata_p = NULL;
809 }
810
811 if (stackshotbuf != NULL) {
812 kmem_free(kernel_map, (vm_offset_t)stackshotbuf, stackshotbuf_size);
813 }
0a7de745 814 if (buf_to_free != NULL) {
3e170ce0
A
815 kmem_free(kernel_map, (vm_offset_t)buf_to_free, size_to_free);
816 }
817 STACKSHOT_SUBSYS_UNLOCK();
818 return error;
819}
820
5ba3f43e
A
821/*
822 * Cache stack snapshot parameters in preparation for a trace.
823 */
fe8ab488 824void
f427ee49
A
825kdp_snapshot_preflight(int pid, void * tracebuf, uint32_t tracebuf_size, uint64_t flags,
826 kcdata_descriptor_t data_p, uint64_t since_timestamp, uint32_t pagetable_mask)
fe8ab488 827{
39037602
A
828 uint64_t microsecs = 0, secs = 0;
829 clock_get_calendar_microtime((clock_sec_t *)&secs, (clock_usec_t *)&microsecs);
830
831 stackshot_microsecs = microsecs + (secs * USEC_PER_SEC);
fe8ab488
A
832 stack_snapshot_pid = pid;
833 stack_snapshot_buf = tracebuf;
834 stack_snapshot_bufsize = tracebuf_size;
835 stack_snapshot_flags = flags;
39037602 836 stack_snapshot_delta_since_timestamp = since_timestamp;
f427ee49 837 stack_snapshot_pagetable_mask = pagetable_mask;
39037602
A
838
839 panic_stackshot = ((flags & STACKSHOT_FROM_PANIC) != 0);
840
5ba3f43e
A
841 assert(data_p != NULL);
842 assert(stackshot_kcdata_p == NULL);
843 stackshot_kcdata_p = data_p;
844
845 stack_snapshot_bytes_traced = 0;
f427ee49 846 stack_snapshot_bytes_uncompressed = 0;
fe8ab488
A
847}
848
cc8bc92a
A
849void
850panic_stackshot_reset_state()
851{
852 stackshot_kcdata_p = NULL;
853}
854
5ba3f43e
A
855boolean_t
856stackshot_active()
fe8ab488 857{
0a7de745 858 return stackshot_kcdata_p != NULL;
fe8ab488
A
859}
860
3e170ce0 861uint32_t
fe8ab488
A
862kdp_stack_snapshot_bytes_traced(void)
863{
864 return stack_snapshot_bytes_traced;
865}
866
f427ee49
A
867uint32_t
868kdp_stack_snapshot_bytes_uncompressed(void)
869{
870 return stack_snapshot_bytes_uncompressed;
871}
872
0a7de745
A
873static boolean_t
874memory_iszero(void *addr, size_t size)
3e170ce0
A
875{
876 char *data = (char *)addr;
0a7de745
A
877 for (size_t i = 0; i < size; i++) {
878 if (data[i] != 0) {
3e170ce0 879 return FALSE;
0a7de745 880 }
3e170ce0
A
881 }
882 return TRUE;
883}
884
3e170ce0
A
/* First address past the bytes already used in the kcdata buffer. */
#define kcd_end_address(kcd) ((void *)((uint64_t)((kcd)->kcd_addr_begin) + kcdata_memory_get_used_bytes((kcd))))
/* Address formed by adding the descriptor's kcd_length to kcd_addr_begin. */
#define kcd_max_address(kcd) ((void *)((kcd)->kcd_addr_begin + (kcd)->kcd_length))
/*
 * kcd_exit_on_error(action) evaluates 'action' once, stores the result in
 * the caller's local 'kern_return_t error' and, if it is not KERN_SUCCESS,
 * jumps to the caller's 'error_exit' label. KERN_RESOURCE_SHORTAGE is
 * rewritten to KERN_INSUFFICIENT_BUFFER_SIZE before jumping.
 *
 * Both the 'error' variable and the 'error_exit' label must exist in the
 * calling function. Note that the expansion already ends in a semicolon.
 */
#define kcd_exit_on_error(action)                              \
	do {                                                   \
	        error = (action);                              \
	        if (error != KERN_SUCCESS) {                   \
	                if (error == KERN_RESOURCE_SHORTAGE) { \
	                        error = KERN_INSUFFICIENT_BUFFER_SIZE; \
	                }                                      \
	                goto error_exit;                       \
	        }                                              \
	} while (0); /* end kcd_exit_on_error */
900
39037602
A
901static uint64_t
902kcdata_get_task_ss_flags(task_t task)
903{
904 uint64_t ss_flags = 0;
d9a64523 905 boolean_t task_64bit_addr = task_has_64Bit_addr(task);
39037602 906
0a7de745 907 if (task_64bit_addr) {
39037602 908 ss_flags |= kUser64_p;
0a7de745
A
909 }
910 if (!task->active || task_is_a_corpse(task) || proc_exiting(task->bsd_info)) {
39037602 911 ss_flags |= kTerminatedSnapshot;
0a7de745
A
912 }
913 if (task->pidsuspended) {
39037602 914 ss_flags |= kPidSuspended;
0a7de745
A
915 }
916 if (task->frozen) {
39037602 917 ss_flags |= kFrozen;
0a7de745
A
918 }
919 if (task->effective_policy.tep_darwinbg == 1) {
39037602 920 ss_flags |= kTaskDarwinBG;
0a7de745
A
921 }
922 if (task->requested_policy.trp_role == TASK_FOREGROUND_APPLICATION) {
39037602 923 ss_flags |= kTaskIsForeground;
0a7de745
A
924 }
925 if (task->requested_policy.trp_boosted == 1) {
39037602 926 ss_flags |= kTaskIsBoosted;
0a7de745
A
927 }
928 if (task->effective_policy.tep_sup_active == 1) {
39037602 929 ss_flags |= kTaskIsSuppressed;
0a7de745 930 }
39037602 931#if CONFIG_MEMORYSTATUS
d9a64523
A
932
933 boolean_t dirty = FALSE, dirty_tracked = FALSE, allow_idle_exit = FALSE;
934 memorystatus_proc_flags_unsafe(task->bsd_info, &dirty, &dirty_tracked, &allow_idle_exit);
0a7de745 935 if (dirty) {
39037602 936 ss_flags |= kTaskIsDirty;
0a7de745
A
937 }
938 if (dirty_tracked) {
d9a64523 939 ss_flags |= kTaskIsDirtyTracked;
0a7de745
A
940 }
941 if (allow_idle_exit) {
d9a64523 942 ss_flags |= kTaskAllowIdleExit;
0a7de745 943 }
d9a64523 944
39037602 945#endif
0a7de745 946 if (task->effective_policy.tep_tal_engaged) {
d9a64523 947 ss_flags |= kTaskTALEngaged;
0a7de745 948 }
39037602
A
949
950 ss_flags |= (0x7 & workqueue_get_pwq_state_kdp(task->bsd_info)) << 17;
951
952#if IMPORTANCE_INHERITANCE
953 if (task->task_imp_base) {
0a7de745 954 if (task->task_imp_base->iit_donor) {
39037602 955 ss_flags |= kTaskIsImpDonor;
0a7de745
A
956 }
957 if (task->task_imp_base->iit_live_donor) {
39037602 958 ss_flags |= kTaskIsLiveImpDonor;
0a7de745 959 }
39037602
A
960 }
961#endif
39037602
A
962 return ss_flags;
963}
964
965static kern_return_t
d9a64523 966kcdata_record_shared_cache_info(kcdata_descriptor_t kcd, task_t task, unaligned_u64 *task_snap_ss_flags)
39037602
A
967{
968 kern_return_t error = KERN_SUCCESS;
3e170ce0 969
39037602
A
970 uint64_t shared_cache_slide = 0;
971 uint64_t shared_cache_base_address = 0;
39037602 972 uint32_t kdp_fault_results = 0;
f427ee49
A
973 struct dyld_uuid_info_64_v2 shared_cache_data = {0};
974
3e170ce0 975
39037602 976 assert(task_snap_ss_flags != NULL);
3e170ce0 977
39037602
A
978 if (task->shared_region && ml_validate_nofault((vm_offset_t)task->shared_region, sizeof(struct vm_shared_region))) {
979 struct vm_shared_region *sr = task->shared_region;
980 shared_cache_base_address = sr->sr_base_address + sr->sr_first_mapping;
f427ee49 981
39037602
A
982 } else {
983 *task_snap_ss_flags |= kTaskSharedRegionInfoUnavailable;
5ba3f43e 984 goto error_exit;
39037602 985 }
3e170ce0 986
5ba3f43e
A
987 /* We haven't copied in the shared region UUID yet as part of setup */
988 if (!shared_cache_base_address || !task->shared_region->sr_uuid_copied) {
3e170ce0
A
989 goto error_exit;
990 }
991
f427ee49 992
5ba3f43e 993 /*
f427ee49 994 * No refcounting here, but we are in debugger context, so that should be safe.
5ba3f43e 995 */
f427ee49 996 shared_cache_slide = task->shared_region->sr_slide;
3e170ce0 997
d9a64523
A
998 if (task->shared_region == init_task_shared_region) {
999 /* skip adding shared cache info -- it's the same as the system level one */
1000 goto error_exit;
39037602 1001 }
3e170ce0 1002
f427ee49
A
1003 shared_cache_data.imageLoadAddress = shared_cache_slide;
1004 stackshot_memcpy(&shared_cache_data.imageUUID, task->shared_region->sr_uuid, sizeof(task->shared_region->sr_uuid));
1005 shared_cache_data.imageSlidBaseAddress = shared_cache_base_address;
1006 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_SHAREDCACHE_LOADINFO, sizeof(struct dyld_uuid_info_64_v2), &shared_cache_data));
3e170ce0 1007
39037602
A
1008error_exit:
1009 if (kdp_fault_results & KDP_FAULT_RESULT_PAGED_OUT) {
1010 *task_snap_ss_flags |= kTaskUUIDInfoMissing;
1011 }
3e170ce0 1012
39037602
A
1013 if (kdp_fault_results & KDP_FAULT_RESULT_TRIED_FAULT) {
1014 *task_snap_ss_flags |= kTaskUUIDInfoTriedFault;
1015 }
3e170ce0 1016
39037602
A
1017 if (kdp_fault_results & KDP_FAULT_RESULT_FAULTED_IN) {
1018 *task_snap_ss_flags |= kTaskUUIDInfoFaultedIn;
1019 }
3e170ce0 1020
39037602
A
1021 return error;
1022}
3e170ce0 1023
39037602 1024static kern_return_t
f427ee49 1025kcdata_record_uuid_info(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 *task_snap_ss_flags)
39037602
A
1026{
1027 boolean_t save_loadinfo_p = ((trace_flags & STACKSHOT_SAVE_LOADINFO) != 0);
1028 boolean_t save_kextloadinfo_p = ((trace_flags & STACKSHOT_SAVE_KEXT_LOADINFO) != 0);
39037602 1029 boolean_t should_fault = (trace_flags & STACKSHOT_ENABLE_UUID_FAULTING);
3e170ce0 1030
39037602
A
1031 kern_return_t error = KERN_SUCCESS;
1032 mach_vm_address_t out_addr = 0;
3e170ce0 1033
39037602
A
1034 uint32_t uuid_info_count = 0;
1035 mach_vm_address_t uuid_info_addr = 0;
1036 uint64_t uuid_info_timestamp = 0;
1037 uint32_t kdp_fault_results = 0;
1038
f427ee49 1039
39037602
A
1040 assert(task_snap_ss_flags != NULL);
1041
1042 int task_pid = pid_from_task(task);
d9a64523 1043 boolean_t task_64bit_addr = task_has_64Bit_addr(task);
39037602
A
1044
1045 if (save_loadinfo_p && have_pmap && task->active && task_pid > 0) {
1046 /* Read the dyld_all_image_infos struct from the task memory to get UUID array count and location */
d9a64523 1047 if (task_64bit_addr) {
39037602
A
1048 struct user64_dyld_all_image_infos task_image_infos;
1049 if (kdp_copyin(task->map, task->all_image_info_addr, &task_image_infos,
0a7de745 1050 sizeof(struct user64_dyld_all_image_infos), should_fault, &kdp_fault_results)) {
39037602
A
1051 uuid_info_count = (uint32_t)task_image_infos.uuidArrayCount;
1052 uuid_info_addr = task_image_infos.uuidArray;
5ba3f43e 1053 if (task_image_infos.version >= DYLD_ALL_IMAGE_INFOS_TIMESTAMP_MINIMUM_VERSION) {
39037602
A
1054 uuid_info_timestamp = task_image_infos.timestamp;
1055 }
f427ee49 1056
39037602
A
1057 }
1058 } else {
1059 struct user32_dyld_all_image_infos task_image_infos;
1060 if (kdp_copyin(task->map, task->all_image_info_addr, &task_image_infos,
0a7de745 1061 sizeof(struct user32_dyld_all_image_infos), should_fault, &kdp_fault_results)) {
39037602
A
1062 uuid_info_count = task_image_infos.uuidArrayCount;
1063 uuid_info_addr = task_image_infos.uuidArray;
5ba3f43e 1064 if (task_image_infos.version >= DYLD_ALL_IMAGE_INFOS_TIMESTAMP_MINIMUM_VERSION) {
39037602
A
1065 uuid_info_timestamp = task_image_infos.timestamp;
1066 }
3e170ce0
A
1067 }
1068 }
1069
39037602
A
1070 /*
1071 * If we get a NULL uuid_info_addr (which can happen when we catch dyld in the middle of updating
1072 * this data structure), we zero the uuid_info_count so that we won't even try to save load info
1073 * for this task.
1074 */
1075 if (!uuid_info_addr) {
1076 uuid_info_count = 0;
1077 }
f427ee49
A
1078
1079
39037602 1080 }
3e170ce0 1081
39037602
A
1082 if (have_pmap && task_pid == 0) {
1083 if (save_kextloadinfo_p && ml_validate_nofault((vm_offset_t)(gLoadedKextSummaries), sizeof(OSKextLoadedKextSummaryHeader))) {
1084 uuid_info_count = gLoadedKextSummaries->numSummaries + 1; /* include main kernel UUID */
1085 } else {
1086 uuid_info_count = 1; /* include kernelcache UUID (embedded) or kernel UUID (desktop) */
1087 }
1088 }
3e170ce0 1089
cb323159
A
1090 if (save_loadinfo_p && task_pid > 0 && (uuid_info_count < MAX_LOADINFOS)) {
1091 uint32_t copied_uuid_count = 0;
1092 uint32_t uuid_info_size = (uint32_t)(task_64bit_addr ? sizeof(struct user64_dyld_uuid_info) : sizeof(struct user32_dyld_uuid_info));
1093 uint32_t uuid_info_array_size = 0;
3e170ce0 1094
f427ee49
A
1095 /* Open a compression window to avoid overflowing the stack */
1096 kcdata_compression_window_open(kcd);
1097
cb323159
A
1098 /* If we found some UUID information, first try to copy it in -- this will only be non-zero if we had a pmap above */
1099 if (uuid_info_count > 0) {
1100 uuid_info_array_size = uuid_info_count * uuid_info_size;
3e170ce0 1101
cb323159
A
1102 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, (task_64bit_addr ? KCDATA_TYPE_LIBRARY_LOADINFO64 : KCDATA_TYPE_LIBRARY_LOADINFO),
1103 uuid_info_size, uuid_info_count, &out_addr));
1104
1105 if (!kdp_copyin(task->map, uuid_info_addr, (void *)out_addr, uuid_info_array_size, should_fault, &kdp_fault_results)) {
1106 bzero((void *)out_addr, uuid_info_array_size);
1107 } else {
1108 copied_uuid_count = uuid_info_count;
1109 }
1110 }
1111
1112 uuid_t binary_uuid;
1113 if (!copied_uuid_count && proc_binary_uuid_kdp(task, binary_uuid)) {
1114 /* We failed to copyin the UUID information, try to store the UUID of the main binary we have in the proc */
1115 if (uuid_info_array_size == 0) {
1116 /* We just need to store one UUID */
1117 uuid_info_array_size = uuid_info_size;
1118 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, (task_64bit_addr ? KCDATA_TYPE_LIBRARY_LOADINFO64 : KCDATA_TYPE_LIBRARY_LOADINFO),
1119 uuid_info_size, 1, &out_addr));
1120 }
1121
1122 if (task_64bit_addr) {
1123 struct user64_dyld_uuid_info *uuid_info = (struct user64_dyld_uuid_info *)out_addr;
1124 uint64_t image_load_address = task->mach_header_vm_address;
1125
1126 stackshot_memcpy(&uuid_info->imageUUID, binary_uuid, sizeof(uuid_t));
1127 stackshot_memcpy(&uuid_info->imageLoadAddress, &image_load_address, sizeof(image_load_address));
1128 } else {
1129 struct user32_dyld_uuid_info *uuid_info = (struct user32_dyld_uuid_info *)out_addr;
1130 uint32_t image_load_address = (uint32_t) task->mach_header_vm_address;
1131
1132 stackshot_memcpy(&uuid_info->imageUUID, binary_uuid, sizeof(uuid_t));
1133 stackshot_memcpy(&uuid_info->imageLoadAddress, &image_load_address, sizeof(image_load_address));
1134 }
39037602 1135 }
f427ee49
A
1136
1137 kcd_exit_on_error(kcdata_compression_window_close(kcd));
39037602 1138 } else if (task_pid == 0 && uuid_info_count > 0 && uuid_info_count < MAX_LOADINFOS) {
39037602
A
1139 uintptr_t image_load_address;
1140
1141 do {
f427ee49 1142#if defined(__arm__) || defined(__arm64__)
d9a64523 1143 if (kernelcache_uuid_valid && !save_kextloadinfo_p) {
f427ee49
A
1144 struct dyld_uuid_info_64 kc_uuid = {0};
1145 kc_uuid.imageLoadAddress = VM_MIN_KERNEL_AND_KEXT_ADDRESS;
1146 stackshot_memcpy(&kc_uuid.imageUUID, &kernelcache_uuid, sizeof(uuid_t));
1147 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_KERNELCACHE_LOADINFO, sizeof(struct dyld_uuid_info_64), &kc_uuid));
5ba3f43e
A
1148 break;
1149 }
f427ee49 1150#endif /* defined(__arm__) || defined(__arm64__) */
39037602
A
1151
1152 if (!kernel_uuid || !ml_validate_nofault((vm_offset_t)kernel_uuid, sizeof(uuid_t))) {
1153 /* Kernel UUID not found or inaccessible */
1154 break;
3e170ce0 1155 }
3e170ce0 1156
f427ee49
A
1157 uint32_t uuid_type = KCDATA_TYPE_LIBRARY_LOADINFO;
1158 if ((sizeof(kernel_uuid_info) == sizeof(struct user64_dyld_uuid_info))) {
1159 uuid_type = KCDATA_TYPE_LIBRARY_LOADINFO64;
1160#if defined(__arm64__)
1161 kc_format_t primary_kc_type = KCFormatUnknown;
1162 if (PE_get_primary_kc_format(&primary_kc_type) && (primary_kc_type == KCFormatFileset)) {
1163 /* return TEXT_EXEC based load information on arm devices running with fileset kernelcaches */
1164 uuid_type = STACKSHOT_KCTYPE_LOADINFO64_TEXT_EXEC;
1165 }
1166#endif
1167 }
1168
1169 /*
1170 * The element count of the array can vary - avoid overflowing the
1171 * stack by opening a window.
1172 */
1173 kcdata_compression_window_open(kcd);
1174 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, uuid_type,
1175 sizeof(kernel_uuid_info), uuid_info_count, &out_addr));
39037602 1176 kernel_uuid_info *uuid_info_array = (kernel_uuid_info *)out_addr;
f427ee49 1177
39037602 1178 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(vm_kernel_stext);
f427ee49
A
1179#if defined(__arm64__)
1180 if (uuid_type == STACKSHOT_KCTYPE_LOADINFO64_TEXT_EXEC) {
1181 /* If we're reporting TEXT_EXEC load info, populate the TEXT_EXEC base instead */
1182 extern vm_offset_t segTEXTEXECB;
1183 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(segTEXTEXECB);
1184 }
1185#endif
39037602
A
1186 uuid_info_array[0].imageLoadAddress = image_load_address;
1187 stackshot_memcpy(&uuid_info_array[0].imageUUID, kernel_uuid, sizeof(uuid_t));
1188
0a7de745
A
1189 if (save_kextloadinfo_p &&
1190 ml_validate_nofault((vm_offset_t)(gLoadedKextSummaries), sizeof(OSKextLoadedKextSummaryHeader)) &&
1191 ml_validate_nofault((vm_offset_t)(&gLoadedKextSummaries->summaries[0]),
1192 gLoadedKextSummaries->entry_size * gLoadedKextSummaries->numSummaries)) {
39037602 1193 uint32_t kexti;
0a7de745 1194 for (kexti = 0; kexti < gLoadedKextSummaries->numSummaries; kexti++) {
39037602 1195 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(gLoadedKextSummaries->summaries[kexti].address);
f427ee49
A
1196#if defined(__arm64__)
1197 if (uuid_type == STACKSHOT_KCTYPE_LOADINFO64_TEXT_EXEC) {
1198 /* If we're reporting TEXT_EXEC load info, populate the TEXT_EXEC base instead */
1199 image_load_address = (uintptr_t)VM_KERNEL_UNSLIDE(gLoadedKextSummaries->summaries[kexti].text_exec_address);
1200 }
1201#endif
39037602
A
1202 uuid_info_array[kexti + 1].imageLoadAddress = image_load_address;
1203 stackshot_memcpy(&uuid_info_array[kexti + 1].imageUUID, &gLoadedKextSummaries->summaries[kexti].uuid, sizeof(uuid_t));
3e170ce0 1204 }
39037602 1205 }
f427ee49 1206 kcd_exit_on_error(kcdata_compression_window_close(kcd));
0a7de745 1207 } while (0);
39037602 1208 }
3e170ce0 1209
39037602
A
1210error_exit:
1211 if (kdp_fault_results & KDP_FAULT_RESULT_PAGED_OUT) {
1212 *task_snap_ss_flags |= kTaskUUIDInfoMissing;
1213 }
3e170ce0 1214
39037602
A
1215 if (kdp_fault_results & KDP_FAULT_RESULT_TRIED_FAULT) {
1216 *task_snap_ss_flags |= kTaskUUIDInfoTriedFault;
1217 }
3e170ce0 1218
39037602
A
1219 if (kdp_fault_results & KDP_FAULT_RESULT_FAULTED_IN) {
1220 *task_snap_ss_flags |= kTaskUUIDInfoFaultedIn;
1221 }
3e170ce0 1222
39037602
A
1223 return error;
1224}
3e170ce0 1225
39037602
A
1226static kern_return_t
1227kcdata_record_task_iostats(kcdata_descriptor_t kcd, task_t task)
1228{
1229 kern_return_t error = KERN_SUCCESS;
1230 mach_vm_address_t out_addr = 0;
3e170ce0 1231
39037602
A
1232 /* I/O Statistics if any counters are non zero */
1233 assert(IO_NUM_PRIORITIES == STACKSHOT_IO_NUM_PRIORITIES);
1234 if (task->task_io_stats && !memory_iszero(task->task_io_stats, sizeof(struct io_stat_info))) {
f427ee49
A
1235 /* struct io_stats_snapshot is quite large - avoid overflowing the stack. */
1236 kcdata_compression_window_open(kcd);
39037602
A
1237 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_IOSTATS, sizeof(struct io_stats_snapshot), &out_addr));
1238 struct io_stats_snapshot *_iostat = (struct io_stats_snapshot *)out_addr;
1239 _iostat->ss_disk_reads_count = task->task_io_stats->disk_reads.count;
1240 _iostat->ss_disk_reads_size = task->task_io_stats->disk_reads.size;
1241 _iostat->ss_disk_writes_count = (task->task_io_stats->total_io.count - task->task_io_stats->disk_reads.count);
1242 _iostat->ss_disk_writes_size = (task->task_io_stats->total_io.size - task->task_io_stats->disk_reads.size);
1243 _iostat->ss_paging_count = task->task_io_stats->paging.count;
1244 _iostat->ss_paging_size = task->task_io_stats->paging.size;
1245 _iostat->ss_non_paging_count = (task->task_io_stats->total_io.count - task->task_io_stats->paging.count);
1246 _iostat->ss_non_paging_size = (task->task_io_stats->total_io.size - task->task_io_stats->paging.size);
1247 _iostat->ss_metadata_count = task->task_io_stats->metadata.count;
1248 _iostat->ss_metadata_size = task->task_io_stats->metadata.size;
1249 _iostat->ss_data_count = (task->task_io_stats->total_io.count - task->task_io_stats->metadata.count);
1250 _iostat->ss_data_size = (task->task_io_stats->total_io.size - task->task_io_stats->metadata.size);
0a7de745 1251 for (int i = 0; i < IO_NUM_PRIORITIES; i++) {
39037602
A
1252 _iostat->ss_io_priority_count[i] = task->task_io_stats->io_priority[i].count;
1253 _iostat->ss_io_priority_size[i] = task->task_io_stats->io_priority[i].size;
1254 }
f427ee49 1255 kcd_exit_on_error(kcdata_compression_window_close(kcd));
39037602
A
1256 }
1257
f427ee49 1258
39037602
A
1259error_exit:
1260 return error;
1261}
1262
a39ff7e2
A
1263#if MONOTONIC
1264static kern_return_t
1265kcdata_record_task_instrs_cycles(kcdata_descriptor_t kcd, task_t task)
1266{
f427ee49
A
1267 struct instrs_cycles_snapshot instrs_cycles = {0};
1268 uint64_t ics_instructions;
1269 uint64_t ics_cycles;
a39ff7e2 1270
f427ee49
A
1271 mt_stackshot_task(task, &ics_instructions, &ics_cycles);
1272 instrs_cycles.ics_instructions = ics_instructions;
1273 instrs_cycles.ics_cycles = ics_cycles;
a39ff7e2 1274
f427ee49 1275 return kcdata_push_data(kcd, STACKSHOT_KCTYPE_INSTRS_CYCLES, sizeof(instrs_cycles), &instrs_cycles);
a39ff7e2
A
1276}
1277#endif /* MONOTONIC */
1278
39037602 1279static kern_return_t
f427ee49
A
1280kcdata_record_task_cpu_architecture(kcdata_descriptor_t kcd, task_t task)
1281{
1282 struct stackshot_cpu_architecture cpu_architecture = {0};
1283 int32_t cputype;
1284 int32_t cpusubtype;
1285
1286 proc_archinfo_kdp(task->bsd_info, &cputype, &cpusubtype);
1287 cpu_architecture.cputype = cputype;
1288 cpu_architecture.cpusubtype = cpusubtype;
1289
1290 return kcdata_push_data(kcd, STACKSHOT_KCTYPE_TASK_CPU_ARCHITECTURE, sizeof(struct stackshot_cpu_architecture), &cpu_architecture);
1291}
1292
1293static kern_return_t
1294#if STACKSHOT_COLLECTS_LATENCY_INFO
1295kcdata_record_task_snapshot(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 task_snap_ss_flags, struct stackshot_latency_task *latency_info)
1296#else
1297kcdata_record_task_snapshot(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 task_snap_ss_flags)
1298#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
39037602
A
1299{
1300 boolean_t collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
d9a64523 1301 boolean_t collect_iostats = !collect_delta_stackshot && !(trace_flags & STACKSHOT_NO_IO_STATS);
5ba3f43e
A
1302#if MONOTONIC
1303 boolean_t collect_instrs_cycles = ((trace_flags & STACKSHOT_INSTRS_CYCLES) != 0);
1304#endif /* MONOTONIC */
d9a64523
A
1305#if __arm__ || __arm64__
1306 boolean_t collect_asid = ((trace_flags & STACKSHOT_ASID) != 0);
1307#endif
1308 boolean_t collect_pagetables = ((trace_flags & STACKSHOT_PAGE_TABLES) != 0);
0a7de745 1309
39037602
A
1310
1311 kern_return_t error = KERN_SUCCESS;
1312 mach_vm_address_t out_addr = 0;
1313 struct task_snapshot_v2 * cur_tsnap = NULL;
f427ee49
A
1314#if STACKSHOT_COLLECTS_LATENCY_INFO
1315 latency_info->cur_tsnap_latency = mach_absolute_time();
1316#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
39037602
A
1317
1318 int task_pid = pid_from_task(task);
1319 uint64_t task_uniqueid = get_task_uniqueid(task);
813fb2f6 1320 uint64_t proc_starttime_secs = 0;
39037602 1321
f427ee49
A
1322 if (task_pid && (task_did_exec_internal(task) || task_is_exec_copy_internal(task))) {
1323 /*
1324 * if this task is a transit task from another one, show the pid as
1325 * negative
1326 */
1327 task_pid = 0 - task_pid;
1328 }
1329
1330 /* the task_snapshot_v2 struct is large - avoid overflowing the stack */
1331 kcdata_compression_window_open(kcd);
39037602 1332 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_TASK_SNAPSHOT, sizeof(struct task_snapshot_v2), &out_addr));
39037602 1333 cur_tsnap = (struct task_snapshot_v2 *)out_addr;
d9a64523 1334 bzero(cur_tsnap, sizeof(*cur_tsnap));
39037602
A
1335
1336 cur_tsnap->ts_unique_pid = task_uniqueid;
1337 cur_tsnap->ts_ss_flags = kcdata_get_task_ss_flags(task);
f427ee49 1338 cur_tsnap->ts_ss_flags |= task_snap_ss_flags;
39037602
A
1339 cur_tsnap->ts_user_time_in_terminated_threads = task->total_user_time;
1340 cur_tsnap->ts_system_time_in_terminated_threads = task->total_system_time;
1341
813fb2f6
A
1342 proc_starttime_kdp(task->bsd_info, &proc_starttime_secs, NULL, NULL);
1343 cur_tsnap->ts_p_start_sec = proc_starttime_secs;
5ba3f43e 1344 cur_tsnap->ts_task_size = have_pmap ? get_task_phys_footprint(task) : 0;
39037602 1345 cur_tsnap->ts_max_resident_size = get_task_resident_max(task);
d9a64523
A
1346 cur_tsnap->ts_was_throttled = (uint32_t) proc_was_throttled_from_task(task);
1347 cur_tsnap->ts_did_throttle = (uint32_t) proc_did_throttle_from_task(task);
1348
39037602
A
1349 cur_tsnap->ts_suspend_count = task->suspend_count;
1350 cur_tsnap->ts_faults = task->faults;
1351 cur_tsnap->ts_pageins = task->pageins;
1352 cur_tsnap->ts_cow_faults = task->cow_faults;
39037602 1353 cur_tsnap->ts_latency_qos = (task->effective_policy.tep_latency_qos == LATENCY_QOS_TIER_UNSPECIFIED) ?
0a7de745 1354 LATENCY_QOS_TIER_UNSPECIFIED : ((0xFF << 16) | task->effective_policy.tep_latency_qos);
39037602
A
1355 cur_tsnap->ts_pid = task_pid;
1356
f427ee49
A
1357 /* Add the BSD process identifiers */
1358 if (task_pid != -1 && task->bsd_info != NULL) {
1359 proc_name_kdp(task, cur_tsnap->ts_p_comm, sizeof(cur_tsnap->ts_p_comm));
1360 } else {
1361 cur_tsnap->ts_p_comm[0] = '\0';
1362#if IMPORTANCE_INHERITANCE && (DEVELOPMENT || DEBUG)
1363 if (task->task_imp_base != NULL) {
1364 stackshot_strlcpy(cur_tsnap->ts_p_comm, &task->task_imp_base->iit_procname[0],
1365 MIN((int)sizeof(task->task_imp_base->iit_procname), (int)sizeof(cur_tsnap->ts_p_comm)));
1366 }
1367#endif /* IMPORTANCE_INHERITANCE && (DEVELOPMENT || DEBUG) */
1368 }
1369
1370 kcd_exit_on_error(kcdata_compression_window_close(kcd));
1371
1372#if CONFIG_COALITIONS
1373 if (task_pid != -1 && task->bsd_info != NULL &&
1374 ((trace_flags & STACKSHOT_SAVE_JETSAM_COALITIONS) && (task->coalition[COALITION_TYPE_JETSAM] != NULL))) {
1375 uint64_t jetsam_coal_id = coalition_id(task->coalition[COALITION_TYPE_JETSAM]);
1376 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_JETSAM_COALITION, sizeof(jetsam_coal_id), &jetsam_coal_id));
1377 }
1378#endif /* CONFIG_COALITIONS */
1379
d9a64523
A
1380#if __arm__ || __arm64__
1381 if (collect_asid && have_pmap) {
cb323159 1382 uint32_t asid = PMAP_VASID(task->map->pmap);
f427ee49 1383 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_ASID, sizeof(asid), &asid));
d9a64523
A
1384 }
1385#endif
f427ee49
A
1386
1387#if STACKSHOT_COLLECTS_LATENCY_INFO
1388 latency_info->cur_tsnap_latency = mach_absolute_time() - latency_info->cur_tsnap_latency;
1389 latency_info->pmap_latency = mach_absolute_time();
1390#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1391
d9a64523
A
1392 if (collect_pagetables && have_pmap) {
1393#if INTERRUPT_MASKED_DEBUG
1394 // pagetable dumps can be large; reset the interrupt timeout to avoid a panic
1395 ml_spin_debug_clear_self();
1396#endif
f427ee49
A
1397 size_t bytes_dumped = 0;
1398 error = pmap_dump_page_tables(task->map->pmap, kcd_end_address(kcd), kcd_max_address(kcd), stack_snapshot_pagetable_mask, &bytes_dumped);
1399 if (error != KERN_SUCCESS) {
d9a64523
A
1400 goto error_exit;
1401 } else {
f427ee49
A
1402 /* Variable size array - better not have it on the stack. */
1403 kcdata_compression_window_open(kcd);
d9a64523
A
1404 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, STACKSHOT_KCTYPE_PAGE_TABLES,
1405 sizeof(uint64_t), (uint32_t)(bytes_dumped / sizeof(uint64_t)), &out_addr));
f427ee49 1406 kcd_exit_on_error(kcdata_compression_window_close(kcd));
d9a64523
A
1407 }
1408 }
1409
f427ee49
A
1410#if STACKSHOT_COLLECTS_LATENCY_INFO
1411 latency_info->pmap_latency = mach_absolute_time() - latency_info->pmap_latency;
1412 latency_info->bsd_proc_ids_latency = mach_absolute_time();
1413#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1414
1415#if STACKSHOT_COLLECTS_LATENCY_INFO
1416 latency_info->bsd_proc_ids_latency = mach_absolute_time() - latency_info->bsd_proc_ids_latency;
1417 latency_info->end_latency = mach_absolute_time();
1418#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
3e170ce0 1419
39037602
A
1420 if (collect_iostats) {
1421 kcd_exit_on_error(kcdata_record_task_iostats(kcd, task));
1422 }
3e170ce0 1423
5ba3f43e
A
1424#if MONOTONIC
1425 if (collect_instrs_cycles) {
a39ff7e2 1426 kcd_exit_on_error(kcdata_record_task_instrs_cycles(kcd, task));
5ba3f43e
A
1427 }
1428#endif /* MONOTONIC */
1429
f427ee49
A
1430 kcd_exit_on_error(kcdata_record_task_cpu_architecture(kcd, task));
1431
1432#if STACKSHOT_COLLECTS_LATENCY_INFO
1433 latency_info->end_latency = mach_absolute_time() - latency_info->end_latency;
1434#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1435
39037602
A
1436error_exit:
1437 return error;
1438}
3e170ce0 1439
39037602 1440static kern_return_t
f427ee49 1441kcdata_record_task_delta_snapshot(kcdata_descriptor_t kcd, task_t task, uint64_t trace_flags, boolean_t have_pmap, unaligned_u64 task_snap_ss_flags)
39037602 1442{
d9a64523
A
1443#if !MONOTONIC
1444#pragma unused(trace_flags)
1445#endif /* !MONOTONIC */
39037602
A
1446 kern_return_t error = KERN_SUCCESS;
1447 struct task_delta_snapshot_v2 * cur_tsnap = NULL;
1448 mach_vm_address_t out_addr = 0;
d9a64523
A
1449 (void) trace_flags;
1450#if __arm__ || __arm64__
1451 boolean_t collect_asid = ((trace_flags & STACKSHOT_ASID) != 0);
1452#endif
a39ff7e2
A
1453#if MONOTONIC
1454 boolean_t collect_instrs_cycles = ((trace_flags & STACKSHOT_INSTRS_CYCLES) != 0);
a39ff7e2 1455#endif /* MONOTONIC */
3e170ce0 1456
39037602 1457 uint64_t task_uniqueid = get_task_uniqueid(task);
3e170ce0 1458
39037602 1459 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_TASK_DELTA_SNAPSHOT, sizeof(struct task_delta_snapshot_v2), &out_addr));
3e170ce0 1460
39037602 1461 cur_tsnap = (struct task_delta_snapshot_v2 *)out_addr;
3e170ce0 1462
39037602
A
1463 cur_tsnap->tds_unique_pid = task_uniqueid;
1464 cur_tsnap->tds_ss_flags = kcdata_get_task_ss_flags(task);
f427ee49 1465 cur_tsnap->tds_ss_flags |= task_snap_ss_flags;
3e170ce0 1466
39037602
A
1467 cur_tsnap->tds_user_time_in_terminated_threads = task->total_user_time;
1468 cur_tsnap->tds_system_time_in_terminated_threads = task->total_system_time;
3e170ce0 1469
5ba3f43e 1470 cur_tsnap->tds_task_size = have_pmap ? get_task_phys_footprint(task) : 0;
3e170ce0 1471
39037602
A
1472 cur_tsnap->tds_max_resident_size = get_task_resident_max(task);
1473 cur_tsnap->tds_suspend_count = task->suspend_count;
1474 cur_tsnap->tds_faults = task->faults;
1475 cur_tsnap->tds_pageins = task->pageins;
1476 cur_tsnap->tds_cow_faults = task->cow_faults;
1477 cur_tsnap->tds_was_throttled = (uint32_t)proc_was_throttled_from_task(task);
1478 cur_tsnap->tds_did_throttle = (uint32_t)proc_did_throttle_from_task(task);
0a7de745
A
1479 cur_tsnap->tds_latency_qos = (task->effective_policy.tep_latency_qos == LATENCY_QOS_TIER_UNSPECIFIED)
1480 ? LATENCY_QOS_TIER_UNSPECIFIED
1481 : ((0xFF << 16) | task->effective_policy.tep_latency_qos);
d9a64523
A
1482
1483#if __arm__ || __arm64__
1484 if (collect_asid && have_pmap) {
cb323159 1485 uint32_t asid = PMAP_VASID(task->map->pmap);
d9a64523
A
1486 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_ASID, sizeof(uint32_t), &out_addr));
1487 stackshot_memcpy((void*)out_addr, &asid, sizeof(asid));
1488 }
1489#endif
3e170ce0 1490
a39ff7e2
A
1491#if MONOTONIC
1492 if (collect_instrs_cycles) {
1493 kcd_exit_on_error(kcdata_record_task_instrs_cycles(kcd, task));
1494 }
1495#endif /* MONOTONIC */
1496
39037602
A
1497error_exit:
1498 return error;
1499}
3e170ce0 1500
39037602
A
1501static kern_return_t
1502kcdata_record_thread_iostats(kcdata_descriptor_t kcd, thread_t thread)
1503{
1504 kern_return_t error = KERN_SUCCESS;
1505 mach_vm_address_t out_addr = 0;
3e170ce0 1506
39037602
A
1507 /* I/O Statistics */
1508 assert(IO_NUM_PRIORITIES == STACKSHOT_IO_NUM_PRIORITIES);
1509 if (thread->thread_io_stats && !memory_iszero(thread->thread_io_stats, sizeof(struct io_stat_info))) {
1510 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_IOSTATS, sizeof(struct io_stats_snapshot), &out_addr));
1511 struct io_stats_snapshot *_iostat = (struct io_stats_snapshot *)out_addr;
1512 _iostat->ss_disk_reads_count = thread->thread_io_stats->disk_reads.count;
1513 _iostat->ss_disk_reads_size = thread->thread_io_stats->disk_reads.size;
1514 _iostat->ss_disk_writes_count = (thread->thread_io_stats->total_io.count - thread->thread_io_stats->disk_reads.count);
1515 _iostat->ss_disk_writes_size = (thread->thread_io_stats->total_io.size - thread->thread_io_stats->disk_reads.size);
1516 _iostat->ss_paging_count = thread->thread_io_stats->paging.count;
1517 _iostat->ss_paging_size = thread->thread_io_stats->paging.size;
1518 _iostat->ss_non_paging_count = (thread->thread_io_stats->total_io.count - thread->thread_io_stats->paging.count);
1519 _iostat->ss_non_paging_size = (thread->thread_io_stats->total_io.size - thread->thread_io_stats->paging.size);
1520 _iostat->ss_metadata_count = thread->thread_io_stats->metadata.count;
1521 _iostat->ss_metadata_size = thread->thread_io_stats->metadata.size;
1522 _iostat->ss_data_count = (thread->thread_io_stats->total_io.count - thread->thread_io_stats->metadata.count);
1523 _iostat->ss_data_size = (thread->thread_io_stats->total_io.size - thread->thread_io_stats->metadata.size);
0a7de745 1524 for (int i = 0; i < IO_NUM_PRIORITIES; i++) {
39037602
A
1525 _iostat->ss_io_priority_count[i] = thread->thread_io_stats->io_priority[i].count;
1526 _iostat->ss_io_priority_size[i] = thread->thread_io_stats->io_priority[i].size;
1527 }
1528 }
3e170ce0 1529
39037602
A
1530error_exit:
1531 return error;
1532}
3e170ce0 1533
39037602
A
1534static kern_return_t
1535kcdata_record_thread_snapshot(
f427ee49 1536 kcdata_descriptor_t kcd, thread_t thread, task_t task, uint64_t trace_flags, boolean_t have_pmap, boolean_t thread_on_core)
39037602
A
1537{
1538 boolean_t dispatch_p = ((trace_flags & STACKSHOT_GET_DQ) != 0);
1539 boolean_t active_kthreads_only_p = ((trace_flags & STACKSHOT_ACTIVE_KERNEL_THREADS_ONLY) != 0);
39037602 1540 boolean_t collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
d9a64523 1541 boolean_t collect_iostats = !collect_delta_stackshot && !(trace_flags & STACKSHOT_NO_IO_STATS);
5ba3f43e
A
1542#if MONOTONIC
1543 boolean_t collect_instrs_cycles = ((trace_flags & STACKSHOT_INSTRS_CYCLES) != 0);
1544#endif /* MONOTONIC */
39037602 1545 kern_return_t error = KERN_SUCCESS;
f427ee49
A
1546
1547#if STACKSHOT_COLLECTS_LATENCY_INFO
1548 struct stackshot_latency_thread latency_info;
1549 latency_info.cur_thsnap1_latency = mach_absolute_time();
1550#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1551
39037602
A
1552 mach_vm_address_t out_addr = 0;
1553 int saved_count = 0;
1554
5ba3f43e 1555 struct thread_snapshot_v4 * cur_thread_snap = NULL;
39037602
A
1556 char cur_thread_name[STACKSHOT_MAX_THREAD_NAME_SIZE];
1557 uint64_t tval = 0;
d9a64523 1558 const boolean_t is_64bit_data = task_has_64Bit_data(task);
39037602 1559
5ba3f43e
A
1560 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_SNAPSHOT, sizeof(struct thread_snapshot_v4), &out_addr));
1561 cur_thread_snap = (struct thread_snapshot_v4 *)out_addr;
39037602
A
1562
1563 /* Populate the thread snapshot header */
cb323159
A
1564 cur_thread_snap->ths_ss_flags = 0;
1565 cur_thread_snap->ths_thread_id = thread_tid(thread);
39037602
A
1566 cur_thread_snap->ths_wait_event = VM_KERNEL_UNSLIDE_OR_PERM(thread->wait_event);
1567 cur_thread_snap->ths_continuation = VM_KERNEL_UNSLIDE(thread->continuation);
1568 cur_thread_snap->ths_total_syscalls = thread->syscalls_mach + thread->syscalls_unix;
1569
0a7de745 1570 if (IPC_VOUCHER_NULL != thread->ith_voucher) {
39037602 1571 cur_thread_snap->ths_voucher_identifier = VM_KERNEL_ADDRPERM(thread->ith_voucher);
0a7de745 1572 } else {
39037602 1573 cur_thread_snap->ths_voucher_identifier = 0;
0a7de745 1574 }
39037602 1575
f427ee49
A
1576#if STACKSHOT_COLLECTS_LATENCY_INFO
1577 latency_info.cur_thsnap1_latency = mach_absolute_time() - latency_info.cur_thsnap1_latency;
1578 latency_info.dispatch_serial_latency = mach_absolute_time();
1579 latency_info.dispatch_label_latency = 0;
1580#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1581
39037602
A
1582 cur_thread_snap->ths_dqserialnum = 0;
1583 if (dispatch_p && (task != kernel_task) && (task->active) && have_pmap) {
1584 uint64_t dqkeyaddr = thread_dispatchqaddr(thread);
1585 if (dqkeyaddr != 0) {
1586 uint64_t dqaddr = 0;
1587 boolean_t copyin_ok = kdp_copyin_word(task, dqkeyaddr, &dqaddr, FALSE, NULL);
1588 if (copyin_ok && dqaddr != 0) {
1589 uint64_t dqserialnumaddr = dqaddr + get_task_dispatchqueue_serialno_offset(task);
1590 uint64_t dqserialnum = 0;
1591 copyin_ok = kdp_copyin_word(task, dqserialnumaddr, &dqserialnum, FALSE, NULL);
1592 if (copyin_ok) {
1593 cur_thread_snap->ths_ss_flags |= kHasDispatchSerial;
1594 cur_thread_snap->ths_dqserialnum = dqserialnum;
3e170ce0 1595 }
cb323159 1596
f427ee49
A
1597#if STACKSHOT_COLLECTS_LATENCY_INFO
1598 latency_info.dispatch_serial_latency = mach_absolute_time() - latency_info.dispatch_serial_latency;
1599 latency_info.dispatch_label_latency = mach_absolute_time();
1600#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1601
cb323159
A
1602 /* try copying in the queue label */
1603 uint64_t label_offs = get_task_dispatchqueue_label_offset(task);
1604 if (label_offs) {
1605 uint64_t dqlabeladdr = dqaddr + label_offs;
1606 uint64_t actual_dqlabeladdr = 0;
1607
1608 copyin_ok = kdp_copyin_word(task, dqlabeladdr, &actual_dqlabeladdr, FALSE, NULL);
1609 if (copyin_ok && actual_dqlabeladdr != 0) {
1610 char label_buf[STACKSHOT_QUEUE_LABEL_MAXSIZE];
1611 int len;
1612
1613 bzero(label_buf, STACKSHOT_QUEUE_LABEL_MAXSIZE * sizeof(char));
1614 len = kdp_copyin_string(task, actual_dqlabeladdr, label_buf, STACKSHOT_QUEUE_LABEL_MAXSIZE, FALSE, NULL);
1615 if (len > 0) {
1616 mach_vm_address_t label_addr = 0;
1617 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_DISPATCH_QUEUE_LABEL, len, &label_addr));
1618 stackshot_strlcpy((char*)label_addr, &label_buf[0], len);
1619 }
1620 }
1621 }
f427ee49
A
1622#if STACKSHOT_COLLECTS_LATENCY_INFO
1623 latency_info.dispatch_label_latency = mach_absolute_time() - latency_info.dispatch_label_latency;
1624#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
39037602
A
1625 }
1626 }
1627 }
3e170ce0 1628
f427ee49
A
1629#if STACKSHOT_COLLECTS_LATENCY_INFO
1630 if ((cur_thread_snap->ths_ss_flags & kHasDispatchSerial) == 0) {
1631 latency_info.dispatch_serial_latency = 0;
1632 }
1633 latency_info.cur_thsnap2_latency = mach_absolute_time();
1634#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1635
39037602
A
1636 tval = safe_grab_timer_value(&thread->user_timer);
1637 cur_thread_snap->ths_user_time = tval;
1638 tval = safe_grab_timer_value(&thread->system_timer);
3e170ce0 1639
39037602
A
1640 if (thread->precise_user_kernel_time) {
1641 cur_thread_snap->ths_sys_time = tval;
1642 } else {
1643 cur_thread_snap->ths_user_time += tval;
1644 cur_thread_snap->ths_sys_time = 0;
1645 }
3e170ce0 1646
0a7de745 1647 if (thread->thread_tag & THREAD_TAG_MAINTHREAD) {
5ba3f43e 1648 cur_thread_snap->ths_ss_flags |= kThreadMain;
0a7de745
A
1649 }
1650 if (thread->effective_policy.thep_darwinbg) {
39037602 1651 cur_thread_snap->ths_ss_flags |= kThreadDarwinBG;
0a7de745
A
1652 }
1653 if (proc_get_effective_thread_policy(thread, TASK_POLICY_PASSIVE_IO)) {
39037602 1654 cur_thread_snap->ths_ss_flags |= kThreadIOPassive;
0a7de745
A
1655 }
1656 if (thread->suspend_count > 0) {
39037602 1657 cur_thread_snap->ths_ss_flags |= kThreadSuspended;
0a7de745
A
1658 }
1659 if (thread->options & TH_OPT_GLOBAL_FORCED_IDLE) {
39037602 1660 cur_thread_snap->ths_ss_flags |= kGlobalForcedIdle;
0a7de745
A
1661 }
1662 if (thread_on_core) {
39037602 1663 cur_thread_snap->ths_ss_flags |= kThreadOnCore;
0a7de745
A
1664 }
1665 if (stackshot_thread_is_idle_worker_unsafe(thread)) {
39037602 1666 cur_thread_snap->ths_ss_flags |= kThreadIdleWorker;
0a7de745 1667 }
39037602
A
1668
1669 /* make sure state flags defined in kcdata.h still match internal flags */
1670 static_assert(SS_TH_WAIT == TH_WAIT);
1671 static_assert(SS_TH_SUSP == TH_SUSP);
1672 static_assert(SS_TH_RUN == TH_RUN);
1673 static_assert(SS_TH_UNINT == TH_UNINT);
1674 static_assert(SS_TH_TERMINATE == TH_TERMINATE);
1675 static_assert(SS_TH_TERMINATE2 == TH_TERMINATE2);
1676 static_assert(SS_TH_IDLE == TH_IDLE);
1677
1678 cur_thread_snap->ths_last_run_time = thread->last_run_time;
1679 cur_thread_snap->ths_last_made_runnable_time = thread->last_made_runnable_time;
1680 cur_thread_snap->ths_state = thread->state;
1681 cur_thread_snap->ths_sched_flags = thread->sched_flags;
1682 cur_thread_snap->ths_base_priority = thread->base_pri;
1683 cur_thread_snap->ths_sched_priority = thread->sched_pri;
1684 cur_thread_snap->ths_eqos = thread->effective_policy.thep_qos;
1685 cur_thread_snap->ths_rqos = thread->requested_policy.thrp_qos;
d9a64523 1686 cur_thread_snap->ths_rqos_override = MAX(thread->requested_policy.thrp_qos_override,
0a7de745 1687 thread->requested_policy.thrp_qos_workq_override);
f427ee49 1688 cur_thread_snap->ths_io_tier = (uint8_t) proc_get_effective_thread_policy(thread, TASK_POLICY_IO);
5ba3f43e
A
1689 cur_thread_snap->ths_thread_t = VM_KERNEL_UNSLIDE_OR_PERM(thread);
1690
1691 static_assert(sizeof(thread->effective_policy) == sizeof(uint64_t));
1692 static_assert(sizeof(thread->requested_policy) == sizeof(uint64_t));
1693 cur_thread_snap->ths_requested_policy = *(unaligned_u64 *) &thread->requested_policy;
1694 cur_thread_snap->ths_effective_policy = *(unaligned_u64 *) &thread->effective_policy;
39037602 1695
f427ee49
A
1696#if STACKSHOT_COLLECTS_LATENCY_INFO
1697 latency_info.cur_thsnap2_latency = mach_absolute_time() - latency_info.cur_thsnap2_latency;
1698 latency_info.thread_name_latency = mach_absolute_time();
1699#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1700
39037602
A
1701 /* if there is thread name then add to buffer */
1702 cur_thread_name[0] = '\0';
1703 proc_threadname_kdp(thread->uthread, cur_thread_name, STACKSHOT_MAX_THREAD_NAME_SIZE);
1704 if (strnlen(cur_thread_name, STACKSHOT_MAX_THREAD_NAME_SIZE) > 0) {
1705 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_NAME, sizeof(cur_thread_name), &out_addr));
1706 stackshot_memcpy((void *)out_addr, (void *)cur_thread_name, sizeof(cur_thread_name));
1707 }
3e170ce0 1708
f427ee49
A
1709#if STACKSHOT_COLLECTS_LATENCY_INFO
1710 latency_info.thread_name_latency = mach_absolute_time() - latency_info.thread_name_latency;
1711 latency_info.sur_times_latency = mach_absolute_time();
1712#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1713
d9a64523
A
1714 /* record system, user, and runnable times */
1715 time_value_t user_time, system_time, runnable_time;
1716 thread_read_times(thread, &user_time, &system_time, &runnable_time);
1717 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_CPU_TIMES, sizeof(struct stackshot_cpu_times_v2), &out_addr));
1718 struct stackshot_cpu_times_v2 *stackshot_cpu_times = (struct stackshot_cpu_times_v2 *)out_addr;
1719 *stackshot_cpu_times = (struct stackshot_cpu_times_v2){
1720 .user_usec = (uint64_t)user_time.seconds * USEC_PER_SEC + user_time.microseconds,
1721 .system_usec = (uint64_t)system_time.seconds * USEC_PER_SEC + system_time.microseconds,
1722 .runnable_usec = (uint64_t)runnable_time.seconds * USEC_PER_SEC + runnable_time.microseconds,
1723 };
39037602 1724
f427ee49
A
1725#if STACKSHOT_COLLECTS_LATENCY_INFO
1726 latency_info.sur_times_latency = mach_absolute_time() - latency_info.sur_times_latency;
1727 latency_info.user_stack_latency = mach_absolute_time();
1728#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1729
39037602
A
1730 /* Trace user stack, if any */
1731 if (!active_kthreads_only_p && task->active && thread->task->map != kernel_map) {
1732 uint32_t thread_snapshot_flags = 0;
d9a64523
A
1733
1734 /* Uses 64-bit machine state? */
1735 if (is_64bit_data) {
1736 uint64_t sp = 0;
39037602 1737 out_addr = (mach_vm_address_t)kcd_end_address(kcd);
f427ee49
A
1738
1739 uintptr_t fp = 0;
1740
1741
39037602 1742 saved_count = machine_trace_thread64(thread, (char *)out_addr, (char *)kcd_max_address(kcd), MAX_FRAMES, TRUE,
f427ee49 1743 &thread_snapshot_flags, &sp, fp);
39037602 1744 if (saved_count > 0) {
f427ee49
A
1745 int frame_size = sizeof(uint64_t);
1746 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, STACKSHOT_KCTYPE_USER_STACKLR64,
0a7de745 1747 frame_size, saved_count / frame_size, &out_addr));
39037602
A
1748 cur_thread_snap->ths_ss_flags |= kUser64_p;
1749 }
d9a64523
A
1750#if __x86_64__
1751 if (sp) {
1752 // I'm using 8 here and not sizeof(stack_contents) because this
1753 // code would not work if you just made stack_contents bigger.
1754 vm_offset_t kern_virt_addr = machine_trace_thread_get_kva(sp, thread->task->map, &thread_snapshot_flags);
1755 if (kern_virt_addr && (kern_virt_addr % 8) == 0) {
1756 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_USER_STACKTOP, sizeof(struct stack_snapshot_stacktop), &out_addr));
1757 struct stack_snapshot_stacktop *stacktop = (struct stack_snapshot_stacktop *)out_addr;
1758 stacktop->sp = sp;
1759 memcpy(stacktop->stack_contents, (void*) kern_virt_addr, 8);
1760 }
1761 }
f427ee49 1762#endif /* __x86_64__ */
39037602
A
1763 } else {
1764 out_addr = (mach_vm_address_t)kcd_end_address(kcd);
f427ee49 1765 saved_count = machine_trace_thread(thread, (char *)out_addr, (char *)kcd_max_address(kcd), MAX_FRAMES, TRUE,
0a7de745 1766 &thread_snapshot_flags);
39037602 1767 if (saved_count > 0) {
f427ee49
A
1768 int frame_size = sizeof(uint32_t);
1769 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, STACKSHOT_KCTYPE_USER_STACKLR,
0a7de745 1770 frame_size, saved_count / frame_size, &out_addr));
39037602
A
1771 }
1772 }
3e170ce0 1773
39037602
A
1774 if (thread_snapshot_flags != 0) {
1775 cur_thread_snap->ths_ss_flags |= thread_snapshot_flags;
1776 }
1777 }
3e170ce0 1778
f427ee49
A
1779#if STACKSHOT_COLLECTS_LATENCY_INFO
1780 latency_info.user_stack_latency = mach_absolute_time() - latency_info.user_stack_latency;
1781 latency_info.kernel_stack_latency = mach_absolute_time();
1782#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1783
39037602
A
1784 /* Call through to the machine specific trace routines
1785 * Frames are added past the snapshot header.
1786 */
1787 if (thread->kernel_stack != 0) {
1788 uint32_t thread_snapshot_flags = 0;
3e170ce0 1789#if defined(__LP64__)
39037602 1790 out_addr = (mach_vm_address_t)kcd_end_address(kcd);
f427ee49
A
1791 saved_count = machine_trace_thread64(thread, (char *)out_addr, (char *)kcd_max_address(kcd), MAX_FRAMES, FALSE,
1792 &thread_snapshot_flags, NULL, 0);
39037602 1793 if (saved_count > 0) {
f427ee49 1794 int frame_size = sizeof(uint64_t);
39037602 1795 cur_thread_snap->ths_ss_flags |= kKernel64_p;
f427ee49 1796 kcd_exit_on_error(kcdata_get_memory_addr_for_array(kcd, STACKSHOT_KCTYPE_KERN_STACKLR64,
0a7de745 1797 frame_size, saved_count / frame_size, &out_addr));
39037602 1798 }
3e170ce0 1799#else
39037602 1800 out_addr = (mach_vm_address_t)kcd_end_address(kcd);
f427ee49 1801 saved_count = machine_trace_thread(thread, (char *)out_addr, (char *)kcd_max_address(kcd), MAX_FRAMES, FALSE,
0a7de745 1802 &thread_snapshot_flags);
39037602 1803 if (saved_count > 0) {
f427ee49 1804 int frame_size = sizeof(uint32_t);
39037602 1805 kcd_exit_on_error(
f427ee49
A
1806 kcdata_get_memory_addr_for_array(kcd, STACKSHOT_KCTYPE_KERN_STACKLR, frame_size,
1807 saved_count / frame_size, &out_addr));
39037602 1808 }
3e170ce0 1809#endif
39037602
A
1810 if (thread_snapshot_flags != 0) {
1811 cur_thread_snap->ths_ss_flags |= thread_snapshot_flags;
3e170ce0
A
1812 }
1813 }
1814
f427ee49
A
1815#if STACKSHOT_COLLECTS_LATENCY_INFO
1816 latency_info.kernel_stack_latency = mach_absolute_time() - latency_info.kernel_stack_latency;
1817 latency_info.misc_latency = mach_absolute_time();
1818#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1819
1820#if CONFIG_THREAD_GROUPS
1821 if (trace_flags & STACKSHOT_THREAD_GROUP) {
1822 uint64_t thread_group_id = thread->thread_group ? thread_group_get_id(thread->thread_group) : 0;
1823 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_THREAD_GROUP, sizeof(thread_group_id), &out_addr));
1824 stackshot_memcpy((void*)out_addr, &thread_group_id, sizeof(uint64_t));
1825 }
1826#endif /* CONFIG_THREAD_GROUPS */
5ba3f43e 1827
39037602
A
1828 if (collect_iostats) {
1829 kcd_exit_on_error(kcdata_record_thread_iostats(kcd, thread));
1830 }
3e170ce0 1831
5ba3f43e
A
1832#if MONOTONIC
1833 if (collect_instrs_cycles) {
1834 uint64_t instrs = 0, cycles = 0;
1835 mt_stackshot_thread(thread, &instrs, &cycles);
1836
1837 kcd_exit_on_error(kcdata_get_memory_addr(kcd, STACKSHOT_KCTYPE_INSTRS_CYCLES, sizeof(struct instrs_cycles_snapshot), &out_addr));
1838 struct instrs_cycles_snapshot *instrs_cycles = (struct instrs_cycles_snapshot *)out_addr;
1839 instrs_cycles->ics_instructions = instrs;
1840 instrs_cycles->ics_cycles = cycles;
1841 }
1842#endif /* MONOTONIC */
1843
f427ee49
A
1844#if STACKSHOT_COLLECTS_LATENCY_INFO
1845 latency_info.misc_latency = mach_absolute_time() - latency_info.misc_latency;
1846 if (collect_latency_info) {
1847 kcd_exit_on_error(kcdata_push_data(kcd, STACKSHOT_KCTYPE_LATENCY_INFO_THREAD, sizeof(latency_info), &latency_info));
1848 }
1849#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
1850
3e170ce0 1851error_exit:
3e170ce0
A
1852 return error;
1853}
1854
1855static int
a39ff7e2 1856kcdata_record_thread_delta_snapshot(struct thread_delta_snapshot_v3 * cur_thread_snap, thread_t thread, boolean_t thread_on_core)
39037602
A
1857{
1858 cur_thread_snap->tds_thread_id = thread_tid(thread);
0a7de745 1859 if (IPC_VOUCHER_NULL != thread->ith_voucher) {
39037602 1860 cur_thread_snap->tds_voucher_identifier = VM_KERNEL_ADDRPERM(thread->ith_voucher);
0a7de745 1861 } else {
39037602 1862 cur_thread_snap->tds_voucher_identifier = 0;
0a7de745 1863 }
39037602
A
1864
1865 cur_thread_snap->tds_ss_flags = 0;
0a7de745 1866 if (thread->effective_policy.thep_darwinbg) {
39037602 1867 cur_thread_snap->tds_ss_flags |= kThreadDarwinBG;
0a7de745
A
1868 }
1869 if (proc_get_effective_thread_policy(thread, TASK_POLICY_PASSIVE_IO)) {
39037602 1870 cur_thread_snap->tds_ss_flags |= kThreadIOPassive;
0a7de745
A
1871 }
1872 if (thread->suspend_count > 0) {
39037602 1873 cur_thread_snap->tds_ss_flags |= kThreadSuspended;
0a7de745
A
1874 }
1875 if (thread->options & TH_OPT_GLOBAL_FORCED_IDLE) {
39037602 1876 cur_thread_snap->tds_ss_flags |= kGlobalForcedIdle;
0a7de745
A
1877 }
1878 if (thread_on_core) {
39037602 1879 cur_thread_snap->tds_ss_flags |= kThreadOnCore;
0a7de745
A
1880 }
1881 if (stackshot_thread_is_idle_worker_unsafe(thread)) {
39037602 1882 cur_thread_snap->tds_ss_flags |= kThreadIdleWorker;
0a7de745 1883 }
39037602
A
1884
1885 cur_thread_snap->tds_last_made_runnable_time = thread->last_made_runnable_time;
1886 cur_thread_snap->tds_state = thread->state;
1887 cur_thread_snap->tds_sched_flags = thread->sched_flags;
1888 cur_thread_snap->tds_base_priority = thread->base_pri;
1889 cur_thread_snap->tds_sched_priority = thread->sched_pri;
1890 cur_thread_snap->tds_eqos = thread->effective_policy.thep_qos;
1891 cur_thread_snap->tds_rqos = thread->requested_policy.thrp_qos;
d9a64523 1892 cur_thread_snap->tds_rqos_override = MAX(thread->requested_policy.thrp_qos_override,
0a7de745 1893 thread->requested_policy.thrp_qos_workq_override);
f427ee49 1894 cur_thread_snap->tds_io_tier = (uint8_t) proc_get_effective_thread_policy(thread, TASK_POLICY_IO);
39037602 1895
a39ff7e2
A
1896 static_assert(sizeof(thread->effective_policy) == sizeof(uint64_t));
1897 static_assert(sizeof(thread->requested_policy) == sizeof(uint64_t));
1898 cur_thread_snap->tds_requested_policy = *(unaligned_u64 *) &thread->requested_policy;
1899 cur_thread_snap->tds_effective_policy = *(unaligned_u64 *) &thread->effective_policy;
1900
39037602
A
1901 return 0;
1902}
1903
/*
 * Why 12? 12 strikes a decent balance between allocating a large array on
 * the stack and having large kcdata item overheads for recording nonrunnable
 * tasks.
 */
#define UNIQUEIDSPERFLUSH 12

/*
 * Fixed-capacity batch of 64-bit unique ids.
 */
struct saved_uniqueids {
	uint64_t ids[UNIQUEIDSPERFLUSH]; /* storage for up to UNIQUEIDSPERFLUSH ids */
	unsigned count;                  /* presumably the number of valid entries in ids[] -- confirm against users */
};

/*
 * How a thread is to be recorded in the current stackshot.
 */
enum thread_classification {
	tc_full_snapshot, /* take a full snapshot */
	tc_delta_snapshot, /* take a delta snapshot */
};

1921static enum thread_classification
f427ee49 1922classify_thread(thread_t thread, boolean_t * thread_on_core_p, uint64_t trace_flags)
fe8ab488 1923{
39037602 1924 boolean_t collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
fe8ab488 1925
39037602
A
1926 processor_t last_processor = thread->last_processor;
1927
1928 boolean_t thread_on_core =
cb323159
A
1929 (last_processor != PROCESSOR_NULL &&
1930 (last_processor->state == PROCESSOR_SHUTDOWN || last_processor->state == PROCESSOR_RUNNING) &&
1931 last_processor->active_thread == thread);
39037602
A
1932
1933 *thread_on_core_p = thread_on_core;
1934
1935 /* Capture the full thread snapshot if this is not a delta stackshot or if the thread has run subsequent to the
1936 * previous full stackshot */
1937 if (!collect_delta_stackshot || thread_on_core || (thread->last_run_time > stack_snapshot_delta_since_timestamp)) {
1938 return tc_full_snapshot;
1939 } else {
d9a64523
A
1940 return tc_delta_snapshot;
1941 }
1942}
1943
/*
 * Parameters of the stackshot being taken, passed to the per-task recorder.
 */
struct stackshot_context {
	int pid;              /* pid to restrict the stackshot to, or -1 to trace every task */
	uint64_t trace_flags; /* STACKSHOT_* flags for this stackshot */
};

1949static kern_return_t
1950kdp_stackshot_record_task(struct stackshot_context *ctx, task_t task)
1951{
1952 boolean_t active_kthreads_only_p = ((ctx->trace_flags & STACKSHOT_ACTIVE_KERNEL_THREADS_ONLY) != 0);
1953 boolean_t save_donating_pids_p = ((ctx->trace_flags & STACKSHOT_SAVE_IMP_DONATION_PIDS) != 0);
1954 boolean_t collect_delta_stackshot = ((ctx->trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
1955 boolean_t save_owner_info = ((ctx->trace_flags & STACKSHOT_THREAD_WAITINFO) != 0);
1956
d9a64523
A
1957 kern_return_t error = KERN_SUCCESS;
1958 mach_vm_address_t out_addr = 0;
1959 int saved_count = 0;
1960
1961 int task_pid = 0;
1962 uint64_t task_uniqueid = 0;
1963 int num_delta_thread_snapshots = 0;
d9a64523 1964 int num_waitinfo_threads = 0;
cb323159 1965 int num_turnstileinfo_threads = 0;
d9a64523
A
1966
1967 uint64_t task_start_abstime = 0;
d9a64523
A
1968 boolean_t have_map = FALSE, have_pmap = FALSE;
1969 boolean_t some_thread_ran = FALSE;
f427ee49
A
1970 unaligned_u64 task_snap_ss_flags = 0;
1971
1972#if STACKSHOT_COLLECTS_LATENCY_INFO
1973 struct stackshot_latency_task latency_info;
1974 latency_info.setup_latency = mach_absolute_time();
1975#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
d9a64523 1976
cb323159
A
1977#if INTERRUPT_MASKED_DEBUG && MONOTONIC
1978 uint64_t task_begin_cpu_cycle_count = 0;
1979 if (!panic_stackshot) {
1980 task_begin_cpu_cycle_count = mt_cur_cpu_cycles();
1981 }
1982#endif
1983
d9a64523
A
1984 if ((task == NULL) || !ml_validate_nofault((vm_offset_t)task, sizeof(struct task))) {
1985 error = KERN_FAILURE;
1986 goto error_exit;
1987 }
1988
1989 have_map = (task->map != NULL) && (ml_validate_nofault((vm_offset_t)(task->map), sizeof(struct _vm_map)));
1990 have_pmap = have_map && (task->map->pmap != NULL) && (ml_validate_nofault((vm_offset_t)(task->map->pmap), sizeof(struct pmap)));
1991
1992 task_pid = pid_from_task(task);
1993 task_uniqueid = get_task_uniqueid(task);
1994
f427ee49 1995 if (!task->active || task_is_a_corpse(task) || task_is_a_corpse_fork(task)) {
d9a64523 1996 /*
f427ee49 1997 * Not interested in terminated tasks without threads.
d9a64523
A
1998 */
1999 if (queue_empty(&task->threads) || task_pid == -1) {
2000 return KERN_SUCCESS;
2001 }
2002 }
2003
f427ee49
A
2004 /* All PIDs should have the MSB unset */
2005 assert((task_pid & (1ULL << 31)) == 0);
2006
2007#if STACKSHOT_COLLECTS_LATENCY_INFO
2008 latency_info.setup_latency = mach_absolute_time() - latency_info.setup_latency;
2009 latency_info.task_uniqueid = task_uniqueid;
2010#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
d9a64523
A
2011
2012 /* Trace everything, unless a process was specified */
2013 if ((ctx->pid == -1) || (ctx->pid == task_pid)) {
d9a64523
A
2014 /* add task snapshot marker */
2015 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_BEGIN,
0a7de745 2016 STACKSHOT_KCCONTAINER_TASK, task_uniqueid));
d9a64523 2017
f427ee49
A
2018 if (collect_delta_stackshot) {
2019 /*
2020 * For delta stackshots we need to know if a thread from this task has run since the
2021 * previous timestamp to decide whether we're going to record a full snapshot and UUID info.
2022 */
2023 thread_t thread = THREAD_NULL;
2024 queue_iterate(&task->threads, thread, thread_t, task_threads)
2025 {
2026 if ((thread == NULL) || !ml_validate_nofault((vm_offset_t)thread, sizeof(struct thread))) {
2027 error = KERN_FAILURE;
2028 goto error_exit;
2029 }
2030
2031 if (active_kthreads_only_p && thread->kernel_stack == 0) {
2032 continue;
2033 }
2034
2035 boolean_t thread_on_core;
2036 enum thread_classification thread_classification = classify_thread(thread, &thread_on_core, ctx->trace_flags);
2037
2038 switch (thread_classification) {
2039 case tc_full_snapshot:
2040 some_thread_ran = TRUE;
2041 break;
2042 case tc_delta_snapshot:
2043 num_delta_thread_snapshots++;
2044 break;
2045 }
2046 }
2047 }
2048
2049 if (collect_delta_stackshot) {
2050 proc_starttime_kdp(task->bsd_info, NULL, NULL, &task_start_abstime);
2051 }
2052
2053 /* Next record any relevant UUID info and store the task snapshot */
2054 if (!collect_delta_stackshot ||
2055 (task_start_abstime == 0) ||
2056 (task_start_abstime > stack_snapshot_delta_since_timestamp) ||
2057 some_thread_ran) {
2058 /*
2059 * Collect full task information in these scenarios:
2060 *
2061 * 1) a full stackshot
2062 * 2) a delta stackshot where the task started after the previous full stackshot
2063 * 3) a delta stackshot where any thread from the task has run since the previous full stackshot
2064 *
2065 * because the task may have exec'ed, changing its name, architecture, load info, etc
2066 */
2067
2068 kcd_exit_on_error(kcdata_record_shared_cache_info(stackshot_kcdata_p, task, &task_snap_ss_flags));
2069 kcd_exit_on_error(kcdata_record_uuid_info(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, &task_snap_ss_flags));
2070#if STACKSHOT_COLLECTS_LATENCY_INFO
2071 kcd_exit_on_error(kcdata_record_task_snapshot(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, task_snap_ss_flags, &latency_info));
2072#else
2073 kcd_exit_on_error(kcdata_record_task_snapshot(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, task_snap_ss_flags));
2074#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
39037602 2075 } else {
f427ee49
A
2076 kcd_exit_on_error(kcdata_record_task_delta_snapshot(stackshot_kcdata_p, task, ctx->trace_flags, have_pmap, task_snap_ss_flags));
2077 }
2078
2079#if STACKSHOT_COLLECTS_LATENCY_INFO
2080 latency_info.misc_latency = mach_absolute_time();
2081#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2082
2083 struct thread_delta_snapshot_v3 * delta_snapshots = NULL;
2084 int current_delta_snapshot_index = 0;
2085 if (num_delta_thread_snapshots > 0) {
2086 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_DELTA_SNAPSHOT,
2087 sizeof(struct thread_delta_snapshot_v3),
2088 num_delta_thread_snapshots, &out_addr));
2089 delta_snapshots = (struct thread_delta_snapshot_v3 *)out_addr;
39037602 2090 }
d9a64523 2091
f427ee49
A
2092
2093#if STACKSHOT_COLLECTS_LATENCY_INFO
2094 latency_info.task_thread_count_loop_latency = mach_absolute_time();
2095#endif
2096 /*
2097 * Iterate over the task threads to save thread snapshots and determine
2098 * how much space we need for waitinfo and turnstile info
2099 */
d9a64523
A
2100 thread_t thread = THREAD_NULL;
2101 queue_iterate(&task->threads, thread, thread_t, task_threads)
2102 {
d9a64523
A
2103 if ((thread == NULL) || !ml_validate_nofault((vm_offset_t)thread, sizeof(struct thread))) {
2104 error = KERN_FAILURE;
2105 goto error_exit;
2106 }
2107
f427ee49 2108 uint64_t thread_uniqueid;
0a7de745 2109 if (active_kthreads_only_p && thread->kernel_stack == 0) {
d9a64523 2110 continue;
0a7de745 2111 }
d9a64523
A
2112 thread_uniqueid = thread_tid(thread);
2113
2114 boolean_t thread_on_core;
2115 enum thread_classification thread_classification = classify_thread(thread, &thread_on_core, ctx->trace_flags);
2116
2117 switch (thread_classification) {
2118 case tc_full_snapshot:
2119 /* add thread marker */
2120 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_BEGIN,
0a7de745 2121 STACKSHOT_KCCONTAINER_THREAD, thread_uniqueid));
f427ee49
A
2122
2123 /* thread snapshot can be large, including strings, avoid overflowing the stack. */
2124 kcdata_compression_window_open(stackshot_kcdata_p);
2125
2126 kcd_exit_on_error(kcdata_record_thread_snapshot(stackshot_kcdata_p, thread, task, ctx->trace_flags, have_pmap, thread_on_core));
2127
2128 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
d9a64523
A
2129
2130 /* mark end of thread snapshot data */
2131 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_END,
0a7de745 2132 STACKSHOT_KCCONTAINER_THREAD, thread_uniqueid));
d9a64523 2133 break;
d9a64523 2134 case tc_delta_snapshot:
f427ee49 2135 kcd_exit_on_error(kcdata_record_thread_delta_snapshot(&delta_snapshots[current_delta_snapshot_index++], thread, thread_on_core));
d9a64523
A
2136 break;
2137 }
2138
f427ee49
A
2139 /*
2140 * We want to report owner information regardless of whether a thread
d9a64523 2141 * has changed since the last delta, whether it's a normal stackshot,
f427ee49
A
2142 * or whether it's nonrunnable
2143 */
cb323159
A
2144 if (save_owner_info) {
2145 if (stackshot_thread_has_valid_waitinfo(thread)) {
2146 num_waitinfo_threads++;
2147 }
2148
2149 if (stackshot_thread_has_valid_turnstileinfo(thread)) {
2150 num_turnstileinfo_threads++;
2151 }
0a7de745 2152 }
d9a64523 2153 }
f427ee49
A
2154#if STACKSHOT_COLLECTS_LATENCY_INFO
2155 latency_info.task_thread_count_loop_latency = mach_absolute_time() - latency_info.task_thread_count_loop_latency;
2156#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
d9a64523 2157
d9a64523 2158
cb323159
A
2159 thread_waitinfo_t *thread_waitinfo = NULL;
2160 thread_turnstileinfo_t *thread_turnstileinfo = NULL;
2161 int current_waitinfo_index = 0;
2162 int current_turnstileinfo_index = 0;
f427ee49
A
2163 /* allocate space for the wait and turnstil info */
2164 if (num_waitinfo_threads > 0 || num_turnstileinfo_threads > 0) {
2165 /* thread waitinfo and turnstileinfo can be quite large, avoid overflowing the stack */
2166 kcdata_compression_window_open(stackshot_kcdata_p);
2167
2168 if (num_waitinfo_threads > 0) {
2169 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_WAITINFO,
2170 sizeof(thread_waitinfo_t), num_waitinfo_threads, &out_addr));
2171 thread_waitinfo = (thread_waitinfo_t *)out_addr;
2172 }
d9a64523 2173
f427ee49
A
2174 if (num_turnstileinfo_threads > 0) {
2175 /* get space for the turnstile info */
2176 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_TURNSTILEINFO,
2177 sizeof(thread_turnstileinfo_t), num_turnstileinfo_threads, &out_addr));
2178 thread_turnstileinfo = (thread_turnstileinfo_t *)out_addr;
2179 }
cb323159
A
2180 }
2181
f427ee49
A
2182#if STACKSHOT_COLLECTS_LATENCY_INFO
2183 latency_info.misc_latency = mach_absolute_time() - latency_info.misc_latency;
2184 latency_info.task_thread_data_loop_latency = mach_absolute_time();
2185#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
d9a64523 2186
f427ee49
A
2187 /* Iterate over the task's threads to save the wait and turnstile info */
2188 queue_iterate(&task->threads, thread, thread_t, task_threads)
2189 {
2190 uint64_t thread_uniqueid;
cb323159 2191
f427ee49
A
2192 if (active_kthreads_only_p && thread->kernel_stack == 0) {
2193 continue;
2194 }
d9a64523 2195
f427ee49 2196 thread_uniqueid = thread_tid(thread);
d9a64523 2197
f427ee49
A
2198 /* If we want owner info, we should capture it regardless of its classification */
2199 if (save_owner_info) {
2200 if (stackshot_thread_has_valid_waitinfo(thread)) {
2201 stackshot_thread_wait_owner_info(
2202 thread,
2203 &thread_waitinfo[current_waitinfo_index++]);
2204 }
d9a64523 2205
f427ee49
A
2206 if (stackshot_thread_has_valid_turnstileinfo(thread)) {
2207 stackshot_thread_turnstileinfo(
2208 thread,
2209 &thread_turnstileinfo[current_turnstileinfo_index++]);
d9a64523
A
2210 }
2211 }
f427ee49
A
2212 }
2213
2214#if STACKSHOT_COLLECTS_LATENCY_INFO
2215 latency_info.task_thread_data_loop_latency = mach_absolute_time() - latency_info.task_thread_data_loop_latency;
2216 latency_info.misc2_latency = mach_absolute_time();
2217#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
d9a64523
A
2218
2219#if DEBUG || DEVELOPMENT
f427ee49
A
2220 if (current_delta_snapshot_index != num_delta_thread_snapshots) {
2221 panic("delta thread snapshot count mismatch while capturing snapshots for task %p. expected %d, found %d", task,
2222 num_delta_thread_snapshots, current_delta_snapshot_index);
2223 }
2224 if (current_waitinfo_index != num_waitinfo_threads) {
2225 panic("thread wait info count mismatch while capturing snapshots for task %p. expected %d, found %d", task,
2226 num_waitinfo_threads, current_waitinfo_index);
2227 }
d9a64523 2228#endif
f427ee49
A
2229
2230 if (num_waitinfo_threads > 0 || num_turnstileinfo_threads > 0) {
2231 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
d9a64523
A
2232 }
2233
2234#if IMPORTANCE_INHERITANCE
2235 if (save_donating_pids_p) {
2236 kcd_exit_on_error(
2237 ((((mach_vm_address_t)kcd_end_address(stackshot_kcdata_p) + (TASK_IMP_WALK_LIMIT * sizeof(int32_t))) <
0a7de745
A
2238 (mach_vm_address_t)kcd_max_address(stackshot_kcdata_p))
2239 ? KERN_SUCCESS
2240 : KERN_RESOURCE_SHORTAGE));
d9a64523 2241 saved_count = task_importance_list_pids(task, TASK_IMP_LIST_DONATING_PIDS,
0a7de745
A
2242 (void *)kcd_end_address(stackshot_kcdata_p), TASK_IMP_WALK_LIMIT);
2243 if (saved_count > 0) {
f427ee49
A
2244 /* Variable size array - better not have it on the stack. */
2245 kcdata_compression_window_open(stackshot_kcdata_p);
d9a64523 2246 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_DONATING_PIDS,
0a7de745 2247 sizeof(int32_t), saved_count, &out_addr));
f427ee49 2248 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
0a7de745 2249 }
d9a64523
A
2250 }
2251#endif
2252
cb323159
A
2253#if INTERRUPT_MASKED_DEBUG && MONOTONIC
2254 if (!panic_stackshot) {
2255 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - task_begin_cpu_cycle_count),
2256 "task_cpu_cycle_count"));
2257 }
2258#endif
f427ee49
A
2259
2260#if STACKSHOT_COLLECTS_LATENCY_INFO
2261 latency_info.misc2_latency = mach_absolute_time() - latency_info.misc2_latency;
2262 if (collect_latency_info) {
2263 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_LATENCY_INFO_TASK, sizeof(latency_info), &latency_info));
2264 }
2265#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2266
d9a64523
A
2267 /* mark end of task snapshot data */
2268 kcd_exit_on_error(kcdata_add_container_marker(stackshot_kcdata_p, KCDATA_TYPE_CONTAINER_END, STACKSHOT_KCCONTAINER_TASK,
0a7de745 2269 task_uniqueid));
39037602 2270 }
d9a64523 2271
f427ee49 2272
d9a64523
A
2273error_exit:
2274 return error;
39037602
A
2275}
2276
d9a64523 2277
39037602 2278static kern_return_t
f427ee49 2279kdp_stackshot_kcdata_format(int pid, uint64_t trace_flags, uint32_t * pBytesTraced, uint32_t * pBytesUncompressed)
39037602
A
2280{
2281 kern_return_t error = KERN_SUCCESS;
2282 mach_vm_address_t out_addr = 0;
2283 uint64_t abs_time = 0, abs_time_end = 0;
39037602 2284 uint64_t system_state_flags = 0;
fe8ab488 2285 task_t task = TASK_NULL;
39037602
A
2286 mach_timebase_info_data_t timebase = {0, 0};
2287 uint32_t length_to_copy = 0, tmp32 = 0;
39037602 2288 abs_time = mach_absolute_time();
f427ee49
A
2289 uint64_t last_task_start_time = 0;
2290
2291#if STACKSHOT_COLLECTS_LATENCY_INFO
2292 struct stackshot_latency_collection latency_info;
2293#endif
39037602 2294
cb323159
A
2295#if INTERRUPT_MASKED_DEBUG && MONOTONIC
2296 uint64_t stackshot_begin_cpu_cycle_count = 0;
2297
2298 if (!panic_stackshot) {
2299 stackshot_begin_cpu_cycle_count = mt_cur_cpu_cycles();
2300 }
2301#endif
2302
f427ee49
A
2303#if STACKSHOT_COLLECTS_LATENCY_INFO
2304 collect_latency_info = trace_flags & STACKSHOT_DISABLE_LATENCY_INFO ? false : true;
2305#endif
2306
39037602 2307 /* process the flags */
39037602 2308 boolean_t collect_delta_stackshot = ((trace_flags & STACKSHOT_COLLECT_DELTA_SNAPSHOT) != 0);
39037602 2309 boolean_t use_fault_path = ((trace_flags & (STACKSHOT_ENABLE_UUID_FAULTING | STACKSHOT_ENABLE_BT_FAULTING)) != 0);
39037602
A
2310 stack_enable_faulting = (trace_flags & (STACKSHOT_ENABLE_BT_FAULTING));
2311
f427ee49
A
2312 /* Currently we only support returning explicit KEXT load info on fileset kernels */
2313 kc_format_t primary_kc_type = KCFormatUnknown;
2314 if (PE_get_primary_kc_format(&primary_kc_type) && (primary_kc_type != KCFormatFileset)) {
2315 trace_flags &= ~(STACKSHOT_SAVE_KEXT_LOADINFO);
2316 }
39037602 2317
d9a64523
A
2318 struct stackshot_context ctx = {};
2319 ctx.trace_flags = trace_flags;
2320 ctx.pid = pid;
39037602
A
2321
2322 if (use_fault_path) {
2323 fault_stats.sfs_pages_faulted_in = 0;
2324 fault_stats.sfs_time_spent_faulting = 0;
2325 fault_stats.sfs_stopped_faulting = (uint8_t) FALSE;
2326 }
2327
0a7de745 2328 if (sizeof(void *) == 8) {
39037602 2329 system_state_flags |= kKernel64_p;
0a7de745 2330 }
39037602
A
2331
2332 if (stackshot_kcdata_p == NULL || pBytesTraced == NULL) {
2333 error = KERN_INVALID_ARGUMENT;
2334 goto error_exit;
2335 }
2336
2337 /* setup mach_absolute_time and timebase info -- copy out in some cases and needed to convert since_timestamp to seconds for proc start time */
2338 clock_timebase_info(&timebase);
2339
2340 /* begin saving data into the buffer */
2341 *pBytesTraced = 0;
f427ee49
A
2342 if (pBytesUncompressed) {
2343 *pBytesUncompressed = 0;
2344 }
2345 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, trace_flags, "stackshot_in_flags"));
39037602
A
2346 kcd_exit_on_error(kcdata_add_uint32_with_description(stackshot_kcdata_p, (uint32_t)pid, "stackshot_in_pid"));
2347 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, system_state_flags, "system_state_flags"));
f427ee49
A
2348 if (trace_flags & STACKSHOT_PAGE_TABLES) {
2349 kcd_exit_on_error(kcdata_add_uint32_with_description(stackshot_kcdata_p, stack_snapshot_pagetable_mask, "stackshot_pagetable_mask"));
2350 }
2351
2352#if STACKSHOT_COLLECTS_LATENCY_INFO
2353 latency_info.setup_latency = mach_absolute_time();
2354#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
39037602
A
2355
2356#if CONFIG_JETSAM
2357 tmp32 = memorystatus_get_pressure_status_kdp();
f427ee49 2358 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_JETSAM_LEVEL, sizeof(uint32_t), &tmp32));
39037602
A
2359#endif
2360
2361 if (!collect_delta_stackshot) {
5ba3f43e 2362 tmp32 = THREAD_POLICY_INTERNAL_STRUCT_VERSION;
f427ee49 2363 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_POLICY_VERSION, sizeof(uint32_t), &tmp32));
5ba3f43e 2364
39037602 2365 tmp32 = PAGE_SIZE;
f427ee49 2366 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_KERN_PAGE_SIZE, sizeof(uint32_t), &tmp32));
39037602
A
2367
2368 /* save boot-args and osversion string */
2369 length_to_copy = MIN((uint32_t)(strlen(version) + 1), OSVERSIZE);
f427ee49
A
2370 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_OSVERSION, length_to_copy, (const void *)version));
2371
39037602 2372
4ba76501 2373 length_to_copy = MIN((uint32_t)(strlen(PE_boot_args()) + 1), BOOT_LINE_LENGTH);
f427ee49 2374 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_BOOTARGS, length_to_copy, PE_boot_args()));
39037602 2375
f427ee49 2376 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, KCDATA_TYPE_TIMEBASE, sizeof(timebase), &timebase));
39037602 2377 } else {
f427ee49 2378 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_DELTA_SINCE_TIMESTAMP, sizeof(uint64_t), &stack_snapshot_delta_since_timestamp));
39037602
A
2379 }
2380
f427ee49 2381 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, KCDATA_TYPE_MACH_ABSOLUTE_TIME, sizeof(uint64_t), &abs_time));
39037602 2382
f427ee49 2383 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, KCDATA_TYPE_USECS_SINCE_EPOCH, sizeof(uint64_t), &stackshot_microsecs));
39037602 2384
d9a64523
A
2385 /* record system level shared cache load info (if available) */
2386 if (!collect_delta_stackshot && init_task_shared_region &&
0a7de745 2387 ml_validate_nofault((vm_offset_t)init_task_shared_region, sizeof(struct vm_shared_region))) {
f427ee49
A
2388 struct dyld_uuid_info_64_v2 sys_shared_cache_info = {0};
2389
2390 stackshot_memcpy(sys_shared_cache_info.imageUUID, &init_task_shared_region->sr_uuid, sizeof(init_task_shared_region->sr_uuid));
2391 sys_shared_cache_info.imageLoadAddress =
2392 init_task_shared_region->sr_slide;
2393 sys_shared_cache_info.imageSlidBaseAddress =
2394 init_task_shared_region->sr_slide + init_task_shared_region->sr_base_address;
d9a64523 2395
f427ee49
A
2396 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_SHAREDCACHE_LOADINFO,
2397 sizeof(struct dyld_uuid_info_64_v2), &sys_shared_cache_info));
d9a64523
A
2398
2399 if (trace_flags & STACKSHOT_COLLECT_SHAREDCACHE_LAYOUT) {
2400 /*
2401 * Include a map of the system shared cache layout if it has been populated
2402 * (which is only when the system is using a custom shared cache).
2403 */
2404 if (init_task_shared_region->sr_images && ml_validate_nofault((vm_offset_t)init_task_shared_region->sr_images,
0a7de745 2405 (init_task_shared_region->sr_images_count * sizeof(struct dyld_uuid_info_64)))) {
d9a64523 2406 assert(init_task_shared_region->sr_images_count != 0);
f427ee49 2407 kcd_exit_on_error(kcdata_push_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_SYS_SHAREDCACHE_LAYOUT, sizeof(struct dyld_uuid_info_64), init_task_shared_region->sr_images_count, init_task_shared_region->sr_images));
d9a64523
A
2408 }
2409 }
fe8ab488 2410 }
fe8ab488 2411
39037602
A
2412 /* Add requested information first */
2413 if (trace_flags & STACKSHOT_GET_GLOBAL_MEM_STATS) {
f427ee49
A
2414 struct mem_and_io_snapshot mais = {0};
2415 kdp_mem_and_io_snapshot(&mais);
2416 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_GLOBAL_MEM_STATS, sizeof(mais), &mais));
39037602
A
2417 }
2418
f427ee49
A
2419#if CONFIG_THREAD_GROUPS
2420 struct thread_group_snapshot_v2 *thread_groups = NULL;
2421 int num_thread_groups = 0;
cb323159
A
2422
2423#if INTERRUPT_MASKED_DEBUG && MONOTONIC
f427ee49 2424 uint64_t thread_group_begin_cpu_cycle_count = 0;
cb323159 2425
f427ee49
A
2426 if (!panic_stackshot && (trace_flags & STACKSHOT_THREAD_GROUP)) {
2427 thread_group_begin_cpu_cycle_count = mt_cur_cpu_cycles();
cb323159
A
2428 }
2429#endif
2430
f427ee49
A
2431
2432 /* Iterate over thread group names */
2433 if (trace_flags & STACKSHOT_THREAD_GROUP) {
2434 /* Variable size array - better not have it on the stack. */
2435 kcdata_compression_window_open(stackshot_kcdata_p);
2436
2437 if (thread_group_iterate_stackshot(stackshot_thread_group_count, &num_thread_groups) != KERN_SUCCESS) {
2438 trace_flags &= ~(STACKSHOT_THREAD_GROUP);
5ba3f43e 2439 }
f427ee49
A
2440
2441 if (num_thread_groups > 0) {
2442 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_THREAD_GROUP_SNAPSHOT, sizeof(struct thread_group_snapshot_v2), num_thread_groups, &out_addr));
2443 thread_groups = (struct thread_group_snapshot_v2 *)out_addr;
5ba3f43e
A
2444 }
2445
f427ee49 2446 if (thread_group_iterate_stackshot(stackshot_thread_group_snapshot, thread_groups) != KERN_SUCCESS) {
5ba3f43e
A
2447 error = KERN_FAILURE;
2448 goto error_exit;
2449 }
f427ee49
A
2450
2451 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
5ba3f43e 2452 }
f427ee49 2453
cb323159 2454#if INTERRUPT_MASKED_DEBUG && MONOTONIC
f427ee49
A
2455 if (!panic_stackshot && (thread_group_begin_cpu_cycle_count != 0)) {
2456 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - thread_group_begin_cpu_cycle_count),
2457 "thread_groups_cpu_cycle_count"));
cb323159
A
2458 }
2459#endif
5ba3f43e 2460#else
5ba3f43e 2461 trace_flags &= ~(STACKSHOT_THREAD_GROUP);
f427ee49
A
2462#endif /* CONFIG_THREAD_GROUPS */
2463
5ba3f43e 2464
f427ee49
A
2465#if STACKSHOT_COLLECTS_LATENCY_INFO
2466 latency_info.setup_latency = mach_absolute_time() - latency_info.setup_latency;
2467 latency_info.total_task_iteration_latency = mach_absolute_time();
2468#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
d9a64523 2469
39037602 2470 /* Iterate over tasks */
d9a64523
A
2471 queue_iterate(&tasks, task, task_t, tasks)
2472 {
f427ee49
A
2473 if (collect_delta_stackshot) {
2474 uint64_t abstime;
2475 proc_starttime_kdp(task->bsd_info, NULL, NULL, &abstime);
2476
2477 if (abstime > last_task_start_time) {
2478 last_task_start_time = abstime;
2479 }
2480 }
2481
d9a64523 2482 error = kdp_stackshot_record_task(&ctx, task);
0a7de745 2483 if (error) {
fe8ab488 2484 goto error_exit;
0a7de745 2485 }
fe8ab488 2486 }
f427ee49
A
2487
2488
2489#if STACKSHOT_COLLECTS_LATENCY_INFO
2490 latency_info.total_task_iteration_latency = mach_absolute_time() - latency_info.total_task_iteration_latency;
2491#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2492
2493#if CONFIG_COALITIONS
2494 /* Don't collect jetsam coalition data in delta stakshots - these don't change */
2495 if (!collect_delta_stackshot || (last_task_start_time > stack_snapshot_delta_since_timestamp)) {
2496 int num_coalitions = 0;
2497 struct jetsam_coalition_snapshot *coalitions = NULL;
2498
2499#if INTERRUPT_MASKED_DEBUG && MONOTONIC
2500 uint64_t coalition_begin_cpu_cycle_count = 0;
2501
2502 if (!panic_stackshot && (trace_flags & STACKSHOT_SAVE_JETSAM_COALITIONS)) {
2503 coalition_begin_cpu_cycle_count = mt_cur_cpu_cycles();
2504 }
2505#endif
2506
2507 /* Iterate over coalitions */
2508 if (trace_flags & STACKSHOT_SAVE_JETSAM_COALITIONS) {
2509 if (coalition_iterate_stackshot(stackshot_coalition_jetsam_count, &num_coalitions, COALITION_TYPE_JETSAM) != KERN_SUCCESS) {
2510 trace_flags &= ~(STACKSHOT_SAVE_JETSAM_COALITIONS);
2511 }
2512 }
2513 if (trace_flags & STACKSHOT_SAVE_JETSAM_COALITIONS) {
2514 if (num_coalitions > 0) {
2515 /* Variable size array - better not have it on the stack. */
2516 kcdata_compression_window_open(stackshot_kcdata_p);
2517 kcd_exit_on_error(kcdata_get_memory_addr_for_array(stackshot_kcdata_p, STACKSHOT_KCTYPE_JETSAM_COALITION_SNAPSHOT, sizeof(struct jetsam_coalition_snapshot), num_coalitions, &out_addr));
2518 coalitions = (struct jetsam_coalition_snapshot*)out_addr;
2519
2520 if (coalition_iterate_stackshot(stackshot_coalition_jetsam_snapshot, coalitions, COALITION_TYPE_JETSAM) != KERN_SUCCESS) {
2521 error = KERN_FAILURE;
2522 goto error_exit;
2523 }
2524
2525 kcd_exit_on_error(kcdata_compression_window_close(stackshot_kcdata_p));
2526 }
2527 }
2528#if INTERRUPT_MASKED_DEBUG && MONOTONIC
2529 if (!panic_stackshot && (coalition_begin_cpu_cycle_count != 0)) {
2530 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - coalition_begin_cpu_cycle_count),
2531 "coalitions_cpu_cycle_count"));
2532 }
2533#endif
2534 }
2535#else
2536 trace_flags &= ~(STACKSHOT_SAVE_JETSAM_COALITIONS);
2537#endif /* CONFIG_COALITIONS */
2538
2539#if STACKSHOT_COLLECTS_LATENCY_INFO
2540 latency_info.total_terminated_task_iteration_latency = mach_absolute_time();
2541#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2542
d9a64523
A
2543 /*
2544 * Iterate over the tasks in the terminated tasks list. We only inspect
2545 * tasks that have a valid bsd_info pointer where P_LPEXIT is NOT set.
2546 * We're only interested in tasks that have remaining threads (which
2547 * could be involved in a deadlock, etc), and the last thread that tears
2548 * itself down during exit sets P_LPEXIT during proc_exit().
2549 */
2550 queue_iterate(&terminated_tasks, task, task_t, tasks)
2551 {
2552 if (task->bsd_info && !proc_in_teardown(task->bsd_info)) {
2553 error = kdp_stackshot_record_task(&ctx, task);
0a7de745 2554 if (error) {
d9a64523 2555 goto error_exit;
0a7de745 2556 }
d9a64523 2557 }
39037602
A
2558 }
2559
f427ee49
A
2560
2561#if STACKSHOT_COLLECTS_LATENCY_INFO
2562 latency_info.total_terminated_task_iteration_latency = mach_absolute_time() - latency_info.total_terminated_task_iteration_latency;
2563#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
2564
39037602 2565 if (use_fault_path) {
f427ee49
A
2566 kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_STACKSHOT_FAULT_STATS,
2567 sizeof(struct stackshot_fault_stats), &fault_stats);
2568 }
2569
2570#if STACKSHOT_COLLECTS_LATENCY_INFO
2571 if (collect_latency_info) {
2572 latency_info.latency_version = 1;
2573 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_LATENCY_INFO, sizeof(latency_info), &latency_info));
fe8ab488 2574 }
f427ee49 2575#endif /* STACKSHOT_COLLECTS_LATENCY_INFO */
fe8ab488 2576
39037602
A
2577 /* update timestamp of the stackshot */
2578 abs_time_end = mach_absolute_time();
2579#if DEVELOPMENT || DEBUG
f427ee49
A
2580 struct stackshot_duration stackshot_duration;
2581 stackshot_duration.stackshot_duration = (abs_time_end - abs_time);
2582 stackshot_duration.stackshot_duration_outer = 0;
2583
2584 if ((trace_flags & STACKSHOT_DO_COMPRESS) == 0) {
2585 kcd_exit_on_error(kcdata_get_memory_addr(stackshot_kcdata_p, STACKSHOT_KCTYPE_STACKSHOT_DURATION,
2586 sizeof(struct stackshot_duration), &out_addr));
2587 struct stackshot_duration *duration_p = (void *) out_addr;
2588 stackshot_memcpy(duration_p, &stackshot_duration, sizeof(*duration_p));
2589 stackshot_duration_outer = (unaligned_u64 *)&duration_p->stackshot_duration_outer;
2590 } else {
2591 kcd_exit_on_error(kcdata_push_data(stackshot_kcdata_p, STACKSHOT_KCTYPE_STACKSHOT_DURATION, sizeof(stackshot_duration), &stackshot_duration));
2592 stackshot_duration_outer = NULL;
2593 }
39037602 2594#endif
39037602 2595
cb323159
A
2596#if INTERRUPT_MASKED_DEBUG && MONOTONIC
2597 if (!panic_stackshot) {
2598 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, (mt_cur_cpu_cycles() - stackshot_begin_cpu_cycle_count),
2599 "stackshot_total_cpu_cycle_cnt"));
2600 }
2601#endif
2602
f427ee49
A
2603 kcd_finalize_compression(stackshot_kcdata_p);
2604 kcd_exit_on_error(kcdata_add_uint64_with_description(stackshot_kcdata_p, trace_flags, "stackshot_out_flags"));
2605
39037602
A
2606 kcd_exit_on_error(kcdata_write_buffer_end(stackshot_kcdata_p));
2607
2608 /* === END of populating stackshot data === */
2609
2610 *pBytesTraced = (uint32_t) kcdata_memory_get_used_bytes(stackshot_kcdata_p);
f427ee49
A
2611 *pBytesUncompressed = (uint32_t) kcdata_memory_get_uncompressed_bytes(stackshot_kcdata_p);
2612
fe8ab488 2613error_exit:
fe8ab488 2614
5ba3f43e 2615#if INTERRUPT_MASKED_DEBUG
f427ee49
A
2616 if (trace_flags & STACKSHOT_DO_COMPRESS) {
2617 ml_spin_debug_clear_self();
2618 }
2619#if defined(STACKSHOT_INTERRUPTS_MASKED_CHECK_DISABLED)
2620 ml_spin_debug_clear_self();
2621#endif
2622
2623 if (!panic_stackshot && interrupt_masked_debug) {
5ba3f43e
A
2624 /*
2625 * Try to catch instances where stackshot takes too long BEFORE returning from
2626 * the debugger
2627 */
f427ee49 2628 ml_check_stackshot_interrupt_disabled_duration(current_thread());
5ba3f43e
A
2629 }
2630#endif
2631
39037602 2632 stack_enable_faulting = FALSE;
fe8ab488
A
2633
2634 return error;
2635}
2636
fe8ab488
A
2637static uint64_t
2638proc_was_throttled_from_task(task_t task)
2639{
2640 uint64_t was_throttled = 0;
2641
0a7de745 2642 if (task->bsd_info) {
fe8ab488 2643 was_throttled = proc_was_throttled(task->bsd_info);
0a7de745
A
2644 }
2645
fe8ab488
A
2646 return was_throttled;
2647}
2648
2649static uint64_t
2650proc_did_throttle_from_task(task_t task)
2651{
2652 uint64_t did_throttle = 0;
2653
0a7de745 2654 if (task->bsd_info) {
fe8ab488 2655 did_throttle = proc_did_throttle(task->bsd_info);
0a7de745
A
2656 }
2657
fe8ab488
A
2658 return did_throttle;
2659}
2660
2661static void
2662kdp_mem_and_io_snapshot(struct mem_and_io_snapshot *memio_snap)
2663{
2664 unsigned int pages_reclaimed;
2665 unsigned int pages_wanted;
2666 kern_return_t kErr;
2667
f427ee49
A
2668 uint64_t compressions = 0;
2669 uint64_t decompressions = 0;
fe8ab488 2670
f427ee49
A
2671 percpu_foreach(stat, vm_stat) {
2672 compressions += stat->compressions;
2673 decompressions += stat->decompressions;
fe8ab488
A
2674 }
2675
2676 memio_snap->snapshot_magic = STACKSHOT_MEM_AND_IO_SNAPSHOT_MAGIC;
2677 memio_snap->free_pages = vm_page_free_count;
2678 memio_snap->active_pages = vm_page_active_count;
2679 memio_snap->inactive_pages = vm_page_inactive_count;
2680 memio_snap->purgeable_pages = vm_page_purgeable_count;
2681 memio_snap->wired_pages = vm_page_wire_count;
2682 memio_snap->speculative_pages = vm_page_speculative_count;
2683 memio_snap->throttled_pages = vm_page_throttled_count;
2684 memio_snap->busy_buffer_count = count_busy_buffers();
2685 memio_snap->filebacked_pages = vm_page_pageable_external_count;
f427ee49
A
2686 memio_snap->compressions = (uint32_t)compressions;
2687 memio_snap->decompressions = (uint32_t)decompressions;
fe8ab488
A
2688 memio_snap->compressor_size = VM_PAGE_COMPRESSOR_COUNT;
2689 kErr = mach_vm_pressure_monitor(FALSE, VM_PRESSURE_TIME_WINDOW, &pages_reclaimed, &pages_wanted);
2690
0a7de745 2691 if (!kErr) {
fe8ab488
A
2692 memio_snap->pages_wanted = (uint32_t)pages_wanted;
2693 memio_snap->pages_reclaimed = (uint32_t)pages_reclaimed;
2694 memio_snap->pages_wanted_reclaimed_valid = 1;
2695 } else {
2696 memio_snap->pages_wanted = 0;
2697 memio_snap->pages_reclaimed = 0;
2698 memio_snap->pages_wanted_reclaimed_valid = 0;
2699 }
2700}
2701
39037602
A
/*
 * Copy `len` bytes from `src` to `dst`.
 *
 * On arm/arm64, while a panic stackshot is in progress, the copy is done
 * with explicit single-byte stores instead of memcpy(); every other case
 * defers to memcpy().
 */
void
stackshot_memcpy(void *dst, const void *src, size_t len)
{
#if defined(__arm__) || defined(__arm64__)
	if (panic_stackshot) {
		const uint8_t *in = (const uint8_t *)src;
		uint8_t *out = (uint8_t *)dst;

		for (size_t left = len; left > 0; left--) {
			*out++ = *in++;
		}
		return;
	}
#endif
	memcpy(dst, src, len);
}
2716
/*
 * strlcpy()-style bounded string copy built on stackshot_memcpy().
 *
 * Copies at most maxlen - 1 characters of `src` into `dst` and always
 * NUL-terminates when maxlen is non-zero. With maxlen == 0 nothing is
 * written. Returns strlen(src), so a return value >= maxlen means the
 * copy was truncated.
 */
size_t
stackshot_strlcpy(char *dst, const char *src, size_t maxlen)
{
	const size_t src_chars = strlen(src);

	if (maxlen == 0) {
		/* No room for anything, not even the terminator. */
		return src_chars;
	}

	if (src_chars >= maxlen) {
		/* Truncate and terminate by hand. */
		stackshot_memcpy(dst, src, maxlen - 1);
		dst[maxlen - 1] = '\0';
	} else {
		/* Whole string fits; the terminator is copied along with it. */
		stackshot_memcpy(dst, src, src_chars + 1);
	}

	return src_chars;
}
2731
f427ee49
A
2732static inline void
2733kdp_extract_page_mask_and_size(vm_map_t map, int *effective_page_mask, int *effective_page_size)
2734{
2735 if (VM_MAP_PAGE_SHIFT(map) < PAGE_SHIFT) {
2736 *effective_page_mask = VM_MAP_PAGE_MASK(map);
2737 *effective_page_size = VM_MAP_PAGE_SIZE(map);
2738 } else {
2739 *effective_page_mask = PAGE_MASK;
2740 *effective_page_size = PAGE_SIZE;
2741 }
2742}
39037602
A
2743
2744/*
2745 * Returns the physical address of the specified map:target address,
2746 * using the kdp fault path if requested and the page is not resident.
2747 */
2748vm_offset_t
2749kdp_find_phys(vm_map_t map, vm_offset_t target_addr, boolean_t try_fault, uint32_t *kdp_fault_results)
2750{
2751 vm_offset_t cur_phys_addr;
2752 unsigned cur_wimg_bits;
2753 uint64_t fault_start_time = 0;
f427ee49 2754 int effective_page_mask, effective_page_size;
39037602
A
2755
2756 if (map == VM_MAP_NULL) {
2757 return 0;
2758 }
2759
f427ee49
A
2760 kdp_extract_page_mask_and_size(map, &effective_page_mask, &effective_page_size);
2761
39037602
A
2762 cur_phys_addr = kdp_vtophys(map->pmap, target_addr);
2763 if (!pmap_valid_page((ppnum_t) atop(cur_phys_addr))) {
2764 if (!try_fault || fault_stats.sfs_stopped_faulting) {
0a7de745 2765 if (kdp_fault_results) {
39037602 2766 *kdp_fault_results |= KDP_FAULT_RESULT_PAGED_OUT;
0a7de745 2767 }
39037602
A
2768
2769 return 0;
2770 }
2771
2772 /*
2773 * The pmap doesn't have a valid page so we start at the top level
2774 * vm map and try a lightweight fault. Update fault path usage stats.
2775 */
2776 fault_start_time = mach_absolute_time();
f427ee49 2777 cur_phys_addr = kdp_lightweight_fault(map, (target_addr & ~effective_page_mask));
39037602
A
2778 fault_stats.sfs_time_spent_faulting += (mach_absolute_time() - fault_start_time);
2779
2780 if ((fault_stats.sfs_time_spent_faulting >= fault_stats.sfs_system_max_fault_time) && !panic_stackshot) {
2781 fault_stats.sfs_stopped_faulting = (uint8_t) TRUE;
2782 }
2783
f427ee49 2784 cur_phys_addr += (target_addr & effective_page_mask);
39037602
A
2785
2786 if (!pmap_valid_page((ppnum_t) atop(cur_phys_addr))) {
0a7de745 2787 if (kdp_fault_results) {
39037602 2788 *kdp_fault_results |= (KDP_FAULT_RESULT_TRIED_FAULT | KDP_FAULT_RESULT_PAGED_OUT);
0a7de745 2789 }
39037602
A
2790
2791 return 0;
2792 }
2793
0a7de745 2794 if (kdp_fault_results) {
39037602 2795 *kdp_fault_results |= KDP_FAULT_RESULT_FAULTED_IN;
0a7de745 2796 }
39037602
A
2797
2798 fault_stats.sfs_pages_faulted_in++;
2799 } else {
2800 /*
2801 * This check is done in kdp_lightweight_fault for the fault path.
2802 */
2803 cur_wimg_bits = pmap_cache_attributes((ppnum_t) atop(cur_phys_addr));
2804
2805 if ((cur_wimg_bits & VM_WIMG_MASK) != VM_WIMG_DEFAULT) {
2806 return 0;
2807 }
2808 }
2809
2810 return cur_phys_addr;
2811}
2812
fe8ab488 2813boolean_t
39037602
A
2814kdp_copyin_word(
2815 task_t task, uint64_t addr, uint64_t *result, boolean_t try_fault, uint32_t *kdp_fault_results)
2816{
cb323159 2817 if (task_has_64Bit_addr(task)) {
39037602
A
2818 return kdp_copyin(task->map, addr, result, sizeof(uint64_t), try_fault, kdp_fault_results);
2819 } else {
2820 uint32_t buf;
2821 boolean_t r = kdp_copyin(task->map, addr, &buf, sizeof(uint32_t), try_fault, kdp_fault_results);
2822 *result = buf;
2823 return r;
2824 }
2825}
2826
f427ee49
A
2827static int
2828kdp_copyin_string_slowpath(
cb323159
A
2829 task_t task, uint64_t addr, char *buf, int buf_sz, boolean_t try_fault, uint32_t *kdp_fault_results)
2830{
2831 int i;
2832 uint64_t validated = 0, valid_from;
2833 uint64_t phys_src, phys_dest;
f427ee49
A
2834 int effective_page_mask, effective_page_size;
2835 vm_map_t map = task->map;
2836
2837 kdp_extract_page_mask_and_size(map, &effective_page_mask, &effective_page_size);
cb323159
A
2838
2839 for (i = 0; i < buf_sz; i++) {
2840 if (validated == 0) {
2841 valid_from = i;
f427ee49 2842 phys_src = kdp_find_phys(map, addr + i, try_fault, kdp_fault_results);
cb323159 2843 phys_dest = kvtophys((vm_offset_t)&buf[i]);
f427ee49 2844 uint64_t src_rem = effective_page_size - (phys_src & effective_page_mask);
cb323159
A
2845 uint64_t dst_rem = PAGE_SIZE - (phys_dest & PAGE_MASK);
2846 if (phys_src && phys_dest) {
2847 validated = MIN(src_rem, dst_rem);
2848 if (validated) {
2849 bcopy_phys(phys_src, phys_dest, 1);
2850 validated--;
2851 } else {
2852 return 0;
2853 }
2854 } else {
2855 return 0;
2856 }
2857 } else {
2858 bcopy_phys(phys_src + (i - valid_from), phys_dest + (i - valid_from), 1);
2859 validated--;
2860 }
2861
2862 if (buf[i] == '\0') {
2863 return i + 1;
2864 }
2865 }
2866
2867 /* ran out of space */
2868 return -1;
2869}
2870
f427ee49
A
2871int
2872kdp_copyin_string(
2873 task_t task, uint64_t addr, char *buf, int buf_sz, boolean_t try_fault, uint32_t *kdp_fault_results)
2874{
2875 /* try to opportunistically copyin 32 bytes, most strings should fit */
2876 char optbuffer[32];
2877 boolean_t res;
2878
2879 bzero(optbuffer, sizeof(optbuffer));
2880 res = kdp_copyin(task->map, addr, optbuffer, sizeof(optbuffer), try_fault, kdp_fault_results);
2881 if (res == FALSE || strnlen(optbuffer, sizeof(optbuffer)) == sizeof(optbuffer)) {
2882 /* try the slowpath */
2883 return kdp_copyin_string_slowpath(task, addr, buf, buf_sz, try_fault, kdp_fault_results);
2884 }
2885
2886 /* success */
2887 return (int) strlcpy(buf, optbuffer, buf_sz) + 1;
2888}
2889
39037602
A
2890boolean_t
2891kdp_copyin(vm_map_t map, uint64_t uaddr, void *dest, size_t size, boolean_t try_fault, uint32_t *kdp_fault_results)
fe8ab488
A
2892{
2893 size_t rem = size;
2894 char *kvaddr = dest;
f427ee49
A
2895 int effective_page_mask, effective_page_size;
2896
2897 kdp_extract_page_mask_and_size(map, &effective_page_mask, &effective_page_size);
fe8ab488 2898
f427ee49 2899#if defined(__arm__) || defined(__arm64__)
3e170ce0 2900 /* Identify if destination buffer is in panic storage area */
5ba3f43e
A
2901 if (panic_stackshot && ((vm_offset_t)dest >= gPanicBase) && ((vm_offset_t)dest < (gPanicBase + gPanicSize))) {
2902 if (((vm_offset_t)dest + size) > (gPanicBase + gPanicSize)) {
3e170ce0
A
2903 return FALSE;
2904 }
3e170ce0
A
2905 }
2906#endif
2907
fe8ab488 2908 while (rem) {
39037602 2909 uint64_t phys_src = kdp_find_phys(map, uaddr, try_fault, kdp_fault_results);
fe8ab488 2910 uint64_t phys_dest = kvtophys((vm_offset_t)kvaddr);
f427ee49 2911 uint64_t src_rem = effective_page_size - (phys_src & effective_page_mask);
fe8ab488
A
2912 uint64_t dst_rem = PAGE_SIZE - (phys_dest & PAGE_MASK);
2913 size_t cur_size = (uint32_t) MIN(src_rem, dst_rem);
2914 cur_size = MIN(cur_size, rem);
2915
39037602 2916 if (phys_src && phys_dest) {
f427ee49 2917#if defined(__arm__) || defined(__arm64__)
5ba3f43e 2918 /*
f427ee49 2919 * On arm devices the panic buffer is mapped as device memory and doesn't allow
5ba3f43e
A
2920 * unaligned accesses. To prevent these, we copy over bytes individually here.
2921 */
0a7de745 2922 if (panic_stackshot) {
5ba3f43e 2923 stackshot_memcpy(kvaddr, (const void *)phystokv(phys_src), cur_size);
0a7de745 2924 } else
f427ee49 2925#endif /* defined(__arm__) || defined(__arm64__) */
0a7de745 2926 bcopy_phys(phys_src, phys_dest, cur_size);
39037602 2927 } else {
fe8ab488 2928 break;
39037602
A
2929 }
2930
fe8ab488
A
2931 uaddr += cur_size;
2932 kvaddr += cur_size;
3e170ce0 2933 rem -= cur_size;
fe8ab488 2934 }
39037602 2935
0a7de745 2936 return rem == 0;
fe8ab488
A
2937}
2938
39037602
A
2939kern_return_t
2940do_stackshot(void *context)
fe8ab488 2941{
39037602
A
2942#pragma unused(context)
2943 kdp_snapshot++;
2944
2945 stack_snapshot_ret = kdp_stackshot_kcdata_format(stack_snapshot_pid,
3e170ce0 2946 stack_snapshot_flags,
f427ee49
A
2947 &stack_snapshot_bytes_traced,
2948 &stack_snapshot_bytes_uncompressed);
2949
2950 if (stack_snapshot_ret == KERN_SUCCESS && stack_snapshot_flags & STACKSHOT_DO_COMPRESS) {
2951 kcdata_finish_compression(stackshot_kcdata_p);
2952 }
39037602
A
2953
2954 kdp_snapshot--;
2955 return stack_snapshot_ret;
fe8ab488
A
2956}
2957
2958/*
2959 * A fantastical routine that tries to be fast about returning
2960 * translations. Caches the last page we found a translation
2961 * for, so that we can be quick about multiple queries to the
2962 * same page. It turns out this is exactly the workflow
2963 * machine_trace_thread and its relatives tend to throw at us.
2964 *
2965 * Please zero the nasty global this uses after a bulk lookup;
39037602 2966 * this isn't safe across a switch of the map or changes
fe8ab488
A
2967 * to a pmap.
2968 *
2969 * This also means that if zero is a valid KVA, we are
2970 * screwed. Sucks to be us. Fortunately, this should never
2971 * happen.
2972 */
2973vm_offset_t
3e170ce0 2974machine_trace_thread_get_kva(vm_offset_t cur_target_addr, vm_map_t map, uint32_t *thread_trace_flags)
fe8ab488 2975{
fe8ab488
A
2976 vm_offset_t cur_target_page;
2977 vm_offset_t cur_phys_addr;
2978 vm_offset_t kern_virt_target_addr;
39037602 2979 uint32_t kdp_fault_results = 0;
fe8ab488
A
2980
2981 cur_target_page = atop(cur_target_addr);
2982
2983 if ((cur_target_page != prev_target_page) || validate_next_addr) {
2984 /*
2985 * Alright; it wasn't our previous page. So
2986 * we must validate that there is a page
2987 * table entry for this address under the
39037602 2988 * current pmap, and that it has default
fe8ab488
A
2989 * cache attributes (otherwise it may not be
2990 * safe to access it).
2991 */
39037602
A
2992 cur_phys_addr = kdp_find_phys(map, cur_target_addr, stack_enable_faulting, &kdp_fault_results);
2993 if (thread_trace_flags) {
2994 if (kdp_fault_results & KDP_FAULT_RESULT_PAGED_OUT) {
2995 *thread_trace_flags |= kThreadTruncatedBT;
3e170ce0 2996 }
fe8ab488 2997
39037602
A
2998 if (kdp_fault_results & KDP_FAULT_RESULT_TRIED_FAULT) {
2999 *thread_trace_flags |= kThreadTriedFaultBT;
3000 }
3e170ce0 3001
39037602
A
3002 if (kdp_fault_results & KDP_FAULT_RESULT_FAULTED_IN) {
3003 *thread_trace_flags |= kThreadFaultedBT;
3e170ce0 3004 }
fe8ab488
A
3005 }
3006
39037602
A
3007 if (cur_phys_addr == 0) {
3008 return 0;
3009 }
5ba3f43e 3010 kern_virt_target_addr = phystokv(cur_phys_addr);
fe8ab488
A
3011 prev_target_page = cur_target_page;
3012 prev_target_kva = (kern_virt_target_addr & ~PAGE_MASK);
3013 validate_next_addr = FALSE;
fe8ab488
A
3014 } else {
3015 /* We found a translation, so stash this page */
3016 kern_virt_target_addr = prev_target_kva + (cur_target_addr & PAGE_MASK);
fe8ab488 3017 }
5ba3f43e
A
3018
3019#if KASAN
3020 kasan_notify_address(kern_virt_target_addr, sizeof(uint64_t));
3021#endif
3022 return kern_virt_target_addr;
fe8ab488
A
3023}
3024
3025void
3026machine_trace_thread_clear_validation_cache(void)
3027{
3028 validate_next_addr = TRUE;
3029}
3030
39037602
A
3031boolean_t
3032stackshot_thread_is_idle_worker_unsafe(thread_t thread)
3033{
813fb2f6
A
3034 /* When the pthread kext puts a worker thread to sleep, it will
3035 * set kThreadWaitParkedWorkQueue in the block_hint of the thread
3036 * struct. See parkit() in kern/kern_support.c in libpthread.
39037602 3037 */
813fb2f6 3038 return (thread->state & TH_WAIT) &&
0a7de745 3039 (thread->block_hint == kThreadWaitParkedWorkQueue);
813fb2f6
A
3040}
3041
5ba3f43e
A
3042#if CONFIG_COALITIONS
3043static void
3044stackshot_coalition_jetsam_count(void *arg, int i, coalition_t coal)
3045{
3046#pragma unused(i, coal)
3047 unsigned int *coalition_count = (unsigned int*)arg;
3048 (*coalition_count)++;
3049}
3050
3051static void
3052stackshot_coalition_jetsam_snapshot(void *arg, int i, coalition_t coal)
3053{
0a7de745 3054 if (coalition_type(coal) != COALITION_TYPE_JETSAM) {
5ba3f43e 3055 return;
0a7de745 3056 }
5ba3f43e
A
3057
3058 struct jetsam_coalition_snapshot *coalitions = (struct jetsam_coalition_snapshot*)arg;
3059 struct jetsam_coalition_snapshot *jcs = &coalitions[i];
3060 task_t leader = TASK_NULL;
3061 jcs->jcs_id = coalition_id(coal);
3062 jcs->jcs_flags = 0;
4ba76501 3063 jcs->jcs_thread_group = 0;
5ba3f43e 3064
0a7de745 3065 if (coalition_term_requested(coal)) {
5ba3f43e 3066 jcs->jcs_flags |= kCoalitionTermRequested;
0a7de745
A
3067 }
3068 if (coalition_is_terminated(coal)) {
5ba3f43e 3069 jcs->jcs_flags |= kCoalitionTerminated;
0a7de745
A
3070 }
3071 if (coalition_is_reaped(coal)) {
5ba3f43e 3072 jcs->jcs_flags |= kCoalitionReaped;
0a7de745
A
3073 }
3074 if (coalition_is_privileged(coal)) {
5ba3f43e 3075 jcs->jcs_flags |= kCoalitionPrivileged;
0a7de745 3076 }
5ba3f43e 3077
f427ee49
A
3078#if CONFIG_THREAD_GROUPS
3079 struct thread_group *thread_group = kdp_coalition_get_thread_group(coal);
3080 if (thread_group) {
3081 jcs->jcs_thread_group = thread_group_get_id(thread_group);
3082 }
3083#endif /* CONFIG_THREAD_GROUPS */
5ba3f43e
A
3084
3085 leader = kdp_coalition_get_leader(coal);
0a7de745 3086 if (leader) {
5ba3f43e 3087 jcs->jcs_leader_task_uniqueid = get_task_uniqueid(leader);
0a7de745 3088 } else {
5ba3f43e 3089 jcs->jcs_leader_task_uniqueid = 0;
0a7de745 3090 }
5ba3f43e
A
3091}
3092#endif /* CONFIG_COALITIONS */
3093
f427ee49
A
3094#if CONFIG_THREAD_GROUPS
/*
 * Thread group iteration callback: bumps the unsigned int counter that
 * `arg` points to once per invocation.  The index and thread group are
 * ignored.
 */
static void
stackshot_thread_group_count(void *arg, int i, struct thread_group *tg)
{
#pragma unused(i, tg)
	unsigned int *counter = (unsigned int *)arg;

	*counter += 1;
}
3102
3103static void
3104stackshot_thread_group_snapshot(void *arg, int i, struct thread_group *tg)
3105{
3106 struct thread_group_snapshot_v2 *thread_groups = (struct thread_group_snapshot_v2 *)arg;
3107 struct thread_group_snapshot_v2 *tgs = &thread_groups[i];
3108 uint64_t flags = kdp_thread_group_get_flags(tg);
3109 tgs->tgs_id = thread_group_get_id(tg);
3110 stackshot_memcpy(tgs->tgs_name, thread_group_get_name(tg), THREAD_GROUP_MAXNAME);
3111 tgs->tgs_flags = ((flags & THREAD_GROUP_FLAGS_EFFICIENT) ? kThreadGroupEfficient : 0) |
3112 ((flags & THREAD_GROUP_FLAGS_UI_APP) ? kThreadGroupUIApp : 0);
3113}
3114#endif /* CONFIG_THREAD_GROUPS */
5ba3f43e 3115
813fb2f6
A
3116/* Determine if a thread has waitinfo that stackshot can provide */
3117static int
3118stackshot_thread_has_valid_waitinfo(thread_t thread)
3119{
0a7de745 3120 if (!(thread->state & TH_WAIT)) {
813fb2f6 3121 return 0;
0a7de745 3122 }
813fb2f6
A
3123
3124 switch (thread->block_hint) {
0a7de745
A
3125 // If set to None or is a parked work queue, ignore it
3126 case kThreadWaitParkedWorkQueue:
3127 case kThreadWaitNone:
3128 return 0;
3129 // There is a short window where the pthread kext removes a thread
3130 // from its ksyn wait queue before waking the thread up
3131 case kThreadWaitPThreadMutex:
3132 case kThreadWaitPThreadRWLockRead:
3133 case kThreadWaitPThreadRWLockWrite:
3134 case kThreadWaitPThreadCondVar:
3135 return kdp_pthread_get_thread_kwq(thread) != NULL;
3136 // All other cases are valid block hints if in a wait state
3137 default:
3138 return 1;
813fb2f6
A
3139 }
3140}
3141
cb323159
A
3142/* Determine if a thread has turnstileinfo that stackshot can provide */
3143static int
3144stackshot_thread_has_valid_turnstileinfo(thread_t thread)
3145{
3146 struct turnstile *ts = thread_get_waiting_turnstile(thread);
3147
3148 return stackshot_thread_has_valid_waitinfo(thread) &&
3149 ts != TURNSTILE_NULL;
3150}
3151
3152static void
3153stackshot_thread_turnstileinfo(thread_t thread, thread_turnstileinfo_t *tsinfo)
3154{
3155 struct turnstile *ts;
3156
3157 /* acquire turnstile information and store it in the stackshot */
3158 ts = thread_get_waiting_turnstile(thread);
3159 tsinfo->waiter = thread_tid(thread);
3160 kdp_turnstile_fill_tsinfo(ts, tsinfo);
3161}
3162
813fb2f6
A
3163static void
3164stackshot_thread_wait_owner_info(thread_t thread, thread_waitinfo_t *waitinfo)
3165{
cb323159
A
3166 waitinfo->waiter = thread_tid(thread);
3167 waitinfo->wait_type = thread->block_hint;
3168
813fb2f6 3169 switch (waitinfo->wait_type) {
0a7de745
A
3170 case kThreadWaitKernelMutex:
3171 kdp_lck_mtx_find_owner(thread->waitq, thread->wait_event, waitinfo);
3172 break;
3173 case kThreadWaitPortReceive:
3174 kdp_mqueue_recv_find_owner(thread->waitq, thread->wait_event, waitinfo);
3175 break;
3176 case kThreadWaitPortSend:
3177 kdp_mqueue_send_find_owner(thread->waitq, thread->wait_event, waitinfo);
3178 break;
3179 case kThreadWaitSemaphore:
3180 kdp_sema_find_owner(thread->waitq, thread->wait_event, waitinfo);
3181 break;
3182 case kThreadWaitUserLock:
3183 kdp_ulock_find_owner(thread->waitq, thread->wait_event, waitinfo);
3184 break;
3185 case kThreadWaitKernelRWLockRead:
3186 case kThreadWaitKernelRWLockWrite:
3187 case kThreadWaitKernelRWLockUpgrade:
3188 kdp_rwlck_find_owner(thread->waitq, thread->wait_event, waitinfo);
3189 break;
3190 case kThreadWaitPThreadMutex:
3191 case kThreadWaitPThreadRWLockRead:
3192 case kThreadWaitPThreadRWLockWrite:
3193 case kThreadWaitPThreadCondVar:
3194 kdp_pthread_find_owner(thread, waitinfo);
3195 break;
3196 case kThreadWaitWorkloopSyncWait:
3197 kdp_workloop_sync_wait_find_owner(thread, thread->wait_event, waitinfo);
3198 break;
3199 case kThreadWaitOnProcess:
3200 kdp_wait4_find_process(thread, thread->wait_event, waitinfo);
3201 break;
cb323159
A
3202 case kThreadWaitSleepWithInheritor:
3203 kdp_sleep_with_inheritor_find_owner(thread->waitq, thread->wait_event, waitinfo);
3204 break;
f427ee49
A
3205 case kThreadWaitEventlink:
3206 kdp_eventlink_find_owner(thread->waitq, thread->wait_event, waitinfo);
3207 break;
ea3f0419
A
3208 case kThreadWaitCompressor:
3209 kdp_compressor_busy_find_owner(thread->wait_event, waitinfo);
3210 break;
0a7de745
A
3211 default:
3212 waitinfo->owner = 0;
3213 waitinfo->context = 0;
3214 break;
813fb2f6 3215 }
39037602 3216}