9 #include <spawn_private.h>
11 #include <sys/sysctl.h>
12 #include <sys/spawn_internal.h>
13 #include <sys/kern_memorystatus.h>
14 #include <mach-o/dyld.h>
16 #include <darwintest.h>
17 #include <darwintest_utils.h>
20 T_META_NAMESPACE("xnu.vm"),
21 T_META_CHECK_LEAKS(false)
24 extern char **environ
;
27 * This test file contains two sub-tests which attempt to verify
28 * the allowing or not allowing of a corpse for crashreporter when
29 * a task exceeds its memory allocation limit. vm_map_fork() is the
30 * kernel routine used to generate a corpse task.
32 * A corpse is allowed to be taken if a task's memory resource limit that
33 * is exceeded is less than 1/4 of the system wide task limit.
34 * If the amount exceeds 1/4 the sytem wide limit, then the corpse is disallowed.
36 * If the device under test is already under pressure, the test
37 * could fail due to jetsam cutting in and killing the parent, child or
38 * other necessary testing processes.
42 #define TEST_ALLOWED 0x1
43 #define TEST_NOT_ALLOWED 0x2
46 * Values which the kernel OR's into the PID when a corpse
47 * is either allowed or disallowed for the
48 * kern.memorystatus_vm_map_fork_pidwatch sysctl.
50 #define MEMORYSTATUS_VM_MAP_FORK_ALLOWED 0x100000000ul
51 #define MEMORYSTATUS_VM_MAP_FORK_NOT_ALLOWED 0x200000000ul
54 * The memory allocation happens in a child process, this
55 * is stuff to deal with creating and managing the child.
56 * The child will only execute the T_HELPER_DECL.
58 static char testpath
[PATH_MAX
];
59 static uint32_t testpath_size
= sizeof(testpath
);
60 #define LIMIT_DELTA_MB 5 /* an arbitrary limit delta */
61 #define MEGABYTE (1024 * 1024)
64 * The child process communicates back to parent via an exit() code.
73 static char *child_exit_why
[] = {
75 "no memsize argument to child",
76 "invalid memsize argument to child",
81 * Corpse collection only happens in development kernels.
82 * So we need this to detect if the test is relevant.
85 is_development_kernel(void)
89 size_t dev_size
= sizeof(dev
);
91 ret
= sysctlbyname("kern.development", &dev
, &dev_size
, NULL
, 0);
100 * Set/Get the sysctl used to determine if corpse collection occurs.
101 * This is done by the kernel checking for a specific PID.
104 set_memorystatus_vm_map_fork_pidwatch(pid_t pid
)
106 uint64_t new_value
= (uint64_t)pid
;
107 size_t new_len
= sizeof(new_value
);
110 err
= sysctlbyname("kern.memorystatus_vm_map_fork_pidwatch", NULL
, NULL
, &new_value
, new_len
);
112 T_ASSERT_POSIX_SUCCESS(err
, "set sysctlbyname(kern.memorystatus_vm_map_fork_pidwatch...) failed");
117 get_memorystatus_vm_map_fork_pidwatch()
120 size_t val_len
= sizeof(value
);
123 err
= sysctlbyname("kern.memorystatus_vm_map_fork_pidwatch", &value
, &val_len
, NULL
, 0);
125 T_ASSERT_POSIX_SUCCESS(err
, "get sysctlbyname(kern.memorystatus_vm_map_fork_pidwatch...) failed");
131 * We want to avoid jetsam giving us bad results, if possible. So check if there's
132 * enough memory for the test to run, waiting briefly for some to free up.
135 wait_for_free_mem(int need_mb
)
138 int memorystatus_level
;
145 * get amount of memory in the machine
147 size
= sizeof(memsize
);
148 err
= sysctlbyname("hw.memsize", &memsize
, &size
, NULL
, 0);
149 T_QUIET
; T_ASSERT_POSIX_SUCCESS(err
, "sysctlbyname(hw.memsize...) failed");
152 * Use a loop to briefly sleep and recheck if short on memory.
158 * memorystatus_level is a percentage of memory available. For example 20 means 1/5 of memory.
159 * It currently doesn't exist on macOS but neither does jetsam, so pass the test there.
161 size
= sizeof(memorystatus_level
);
162 if (sysctlbyname("kern.memorystatus_level", &memorystatus_level
, &size
, NULL
, 0) != 0)
164 T_QUIET
; T_ASSERT_LE(memorystatus_level
, 100, "memorystatus_level too high");
165 T_QUIET
; T_ASSERT_GT(memorystatus_level
, 0, "memorystatus_level negative");
168 * jetsam kicks in at memory status level of 15%, so subtract that much out of what's available.
170 avail
= MAX(0, (memsize
* (memorystatus_level
- 15)) / 100);
173 * We're good to go if there's more than enough available.
175 if ((int64_t)need_mb
* MEGABYTE
< avail
)
179 * issue a message to log and sleep briefly to see if we can get more memory
183 T_LOG("Need %d MB, only %d MB available. sleeping 5 seconds for more to free. memorystatus_level %d",
184 need_mb
, (int)(avail
/ MEGABYTE
), memorystatus_level
);
187 T_SKIP("Needed %d MB, but only %d MB available. Skipping test to avoid jetsam issues.",
188 need_mb
, (int)(avail
/ MEGABYTE
));
193 * The main test calls this to spawn child process which will run and
194 * exceed some memory limit. The child is initially suspended so that
195 * we can do the sysctl calls before it runs.
196 * Since this is a libdarwintest, the "-n" names the T_HELPER_DECL() that
197 * we want to run. The arguments specific to the test follow a "--".
201 char * const executable
,
202 char * const memlimit
,
206 int inactive_limit_mb
)
208 posix_spawnattr_t spawn_attrs
;
211 char * const argv_child
[] = { executable
, "-n", "child_process", "--", memlimit
, NULL
};
213 err
= posix_spawnattr_init(&spawn_attrs
);
214 T_QUIET
; T_ASSERT_POSIX_SUCCESS(err
, " posix_spawnattr_init() failed");
216 err
= posix_spawnattr_setflags(&spawn_attrs
, POSIX_SPAWN_START_SUSPENDED
);
217 T_QUIET
; T_ASSERT_POSIX_SUCCESS(err
, " posix_spawnattr_setflags() failed");
219 err
= posix_spawnattr_setjetsam_ext(&spawn_attrs
, flags
, priority
, active_limit_mb
, inactive_limit_mb
);
220 T_QUIET
; T_ASSERT_POSIX_SUCCESS(err
, " posix_spawnattr_setjetsam_ext() failed");
222 err
= posix_spawn(&child_pid
, executable
, NULL
, &spawn_attrs
, argv_child
, environ
);
223 T_QUIET
; T_ASSERT_POSIX_SUCCESS(err
, " posix_spawn() failed");
230 * The parent calls this to continue the suspended child, then wait for its result.
231 * We collect its resource usage to vefiry the expected amount allocated.
234 test_child_process(pid_t child_pid
, int *status
, struct rusage
*ru
)
239 T_LOG(" continuing child[%d]\n", child_pid
);
241 err
= kill(child_pid
, SIGCONT
);
242 T_QUIET
; T_ASSERT_POSIX_SUCCESS(err
, " kill(%d, SIGCONT) failed", child_pid
);
244 T_LOG(" waiting for child[%d] to exit", child_pid
);
246 got_pid
= wait4(child_pid
, status
, 0, ru
);
247 T_QUIET
; T_ASSERT_EQ(child_pid
, got_pid
, " wait4(%d, ...) returned %d", child_pid
, got_pid
);
251 * The child process executes this code. The easiest way, with given darwintest infrastructure,
252 * it has to return information is via exit status.
254 T_HELPER_DECL(child_process
, "child allocates memory to failure")
256 #define BYTESPERALLOC MEGABYTE
257 #define BYTESINEXCESS (2 * MEGABYTE) /* 2 MB - arbitrary */
260 long max_bytes_to_munch
, bytes_remaining
, bytes_this_munch
;
264 * This helper is run in a child process. The helper sees one argument
265 * as a string which is the amount of memory in megabytes to allocate.
268 exit(NO_MEMSIZE_ARG
);
272 limit_mb
= strtol(limit
, NULL
, 10);
273 if (errno
!= 0 || limit_mb
<= 0)
274 exit(INVALID_MEMSIZE
);
276 /* Compute in excess of assigned limit */
277 max_bytes_to_munch
= limit_mb
* MEGABYTE
;
278 max_bytes_to_munch
+= BYTESINEXCESS
;
280 for (bytes_remaining
= max_bytes_to_munch
; bytes_remaining
> 0; bytes_remaining
-= bytes_this_munch
) {
281 bytes_this_munch
= MIN(bytes_remaining
, BYTESPERALLOC
);
283 mem
= malloc((size_t)bytes_this_munch
);
286 arc4random_buf(mem
, (size_t)bytes_this_munch
);
289 /* We chewed up all the memory we were asked to. */
298 memorystatus_vm_map_fork_parent(int test_variant
)
300 int max_task_pmem
= 0; /* MB */
302 int active_limit_mb
= 0;
303 int inactive_limit_mb
= 0;
305 char memlimit_str
[16];
308 uint64_t kernel_pidwatch_val
;
309 uint64_t expected_pidwatch_val
;
312 enum child_exits exit_val
;
315 * The code to set/get the pidwatch sysctl is only in
316 * development kernels. Skip the test if not on one.
318 if (!is_development_kernel()) {
319 T_SKIP("Can't test on release kernel");
323 * Determine a memory limit based on system having one or not.
325 size
= sizeof(max_task_pmem
);
326 (void)sysctlbyname("kern.max_task_pmem", &max_task_pmem
, &size
, NULL
, 0);
327 if (max_task_pmem
<= 0)
330 if (test_variant
== TEST_ALLOWED
) {
333 * Tell the child to allocate less than 1/4 the system wide limit.
335 if (max_task_pmem
/ 4 - LIMIT_DELTA_MB
<= 0) {
336 active_limit_mb
= LIMIT_DELTA_MB
;
338 active_limit_mb
= max_task_pmem
/ 4 - LIMIT_DELTA_MB
;
340 expected_pidwatch_val
= MEMORYSTATUS_VM_MAP_FORK_ALLOWED
;
342 } else { /* TEST_NOT_ALLOWED */
345 * Tell the child to allocate more than 1/4 the system wide limit.
347 active_limit_mb
= (max_task_pmem
/ 4) + LIMIT_DELTA_MB
;
348 if (max_task_pmem
== 0) {
349 expected_pidwatch_val
= MEMORYSTATUS_VM_MAP_FORK_ALLOWED
;
351 expected_pidwatch_val
= MEMORYSTATUS_VM_MAP_FORK_NOT_ALLOWED
;
355 inactive_limit_mb
= active_limit_mb
;
356 T_LOG("using limit of %d Meg", active_limit_mb
);
359 * When run as part of a larger suite, a previous test
360 * may have left the system temporarily with too little
361 * memory to run this test. We try to detect if there is
362 * enough free memory to proceed, waiting a little bit
363 * for memory to free up.
365 wait_for_free_mem(active_limit_mb
);
367 #if defined(__x86_64__)
369 * vm_map_fork() is always allowed on desktop.
371 expected_pidwatch_val
= MEMORYSTATUS_VM_MAP_FORK_ALLOWED
;
375 * Prepare the arguments needed to spawn the child process.
377 memset (memlimit_str
, 0, sizeof(memlimit_str
));
378 (void)sprintf(memlimit_str
, "%d", active_limit_mb
);
380 ret
= _NSGetExecutablePath(testpath
, &testpath_size
);
381 T_QUIET
; T_ASSERT_POSIX_SUCCESS(ret
, "_NSGetExecutablePath(%s, ...)", testpath
);
384 * We put the child process in FOREGROUND to try and keep jetsam's hands off it.
386 child_pid
= spawn_child_process(testpath
, memlimit_str
, flags
,
387 JETSAM_PRIORITY_FOREGROUND
, active_limit_mb
, inactive_limit_mb
);
389 expected_pidwatch_val
|= (uint64_t)child_pid
;
392 * We only reach here if parent successfully spawned child process.
394 T_LOG(" spawned child_pid[%d] with memlimit %s (%d)MB\n",
395 child_pid
, memlimit_str
, active_limit_mb
);
398 * Set the kernel's pidwatch to look for the child.
400 (void)set_memorystatus_vm_map_fork_pidwatch((pid_t
)0);
401 (void)set_memorystatus_vm_map_fork_pidwatch(child_pid
);
404 * Let the child run and wait for it to finish.
406 test_child_process(child_pid
, &child_status
, &ru
);
407 T_LOG("Child exited with max_rss of %ld", ru
.ru_maxrss
);
410 * Retrieve the kernel's pidwatch value. This should now indicate
411 * if the corpse was allowed or not.
413 kernel_pidwatch_val
= get_memorystatus_vm_map_fork_pidwatch();
414 (void)set_memorystatus_vm_map_fork_pidwatch((pid_t
)0);
417 * If the child died abnormally, the test is invalid.
419 if (!WIFEXITED(child_status
)) {
420 if (WIFSIGNALED(child_status
)) {
421 /* jetsam kills a process with SIGKILL */
422 if (WTERMSIG(child_status
) == SIGKILL
)
423 T_LOG("Child appears to have been a jetsam victim");
424 T_SKIP("Child terminated by signal %d test result invalid", WTERMSIG(child_status
));
426 T_SKIP("child did not exit normally (status=%d) test result invalid", child_status
);
430 * We don't expect the child to exit for any other reason than success
432 exit_val
= (enum child_exits
)WEXITSTATUS(child_status
);
433 T_QUIET
; T_ASSERT_EQ(exit_val
, NORMAL_EXIT
, "child exit due to: %s",
434 (0 < exit_val
&& exit_val
< NUM_CHILD_EXIT
) ? child_exit_why
[exit_val
] : "unknown");
437 * If the kernel aborted generating a corpse for other reasons, the test is invalid.
439 if (kernel_pidwatch_val
== -1ull) {
440 T_SKIP("corpse generation was aborted by kernel");
444 * We should always have made it through the vm_map_fork() checks in the kernel for this test.
446 T_QUIET
; T_ASSERT_NE_ULLONG(kernel_pidwatch_val
, (uint64_t)child_pid
, "child didn't trigger corpse generation");
448 T_EXPECT_EQ(kernel_pidwatch_val
, expected_pidwatch_val
, "kernel value 0x%llx - expected 0x%llx",
449 kernel_pidwatch_val
, expected_pidwatch_val
);
453 * The order of these 2 test functions is important. They will be executed by the test framwork in order.
455 * We test "not allowed first", then "allowed". If it were the other way around, the corpse from the "allowed"
456 * test would likely cause memory pressure and jetsam would likely kill the "not allowed" test.
458 T_DECL(memorystatus_vm_map_fork_test_not_allowed
, "test that corpse generation was not allowed")
460 memorystatus_vm_map_fork_parent(TEST_NOT_ALLOWED
);
463 T_DECL(memorystatus_vm_map_fork_test_allowed
, "test corpse generation allowed")
466 memorystatus_vm_map_fork_parent(TEST_ALLOWED
);