]> git.saurik.com Git - apple/xnu.git/blame - tests/memorystatus_vm_map_fork.c
xnu-7195.81.3.tar.gz
[apple/xnu.git] / tests / memorystatus_vm_map_fork.c
CommitLineData
a39ff7e2
A
1#include <stdio.h>
2#include <unistd.h>
3#include <stdlib.h>
4#include <errno.h>
5#include <string.h>
6#include <assert.h>
7#include <signal.h>
8#include <spawn.h>
9#include <spawn_private.h>
10#include <stdint.h>
11#include <sys/sysctl.h>
12#include <sys/spawn_internal.h>
13#include <sys/kern_memorystatus.h>
14#include <mach-o/dyld.h>
15
16#include <darwintest.h>
17#include <darwintest_utils.h>
18
19T_GLOBAL_META(
20 T_META_NAMESPACE("xnu.vm"),
21 T_META_CHECK_LEAKS(false)
0a7de745 22 );
a39ff7e2
A
23
24extern char **environ;
25
26/*
27 * This test file contains two sub-tests which attempt to verify
28 * the allowing or not allowing of a corpse for crashreporter when
29 * a task exceeds its memory allocation limit. vm_map_fork() is the
30 * kernel routine used to generate a corpse task.
31 *
32 * A corpse is allowed to be taken if a task's memory resource limit that
d9a64523
A
33 * is exceeded is less than 1/4 of the system wide task limit.
34 * If the amount exceeds 1/4 the sytem wide limit, then the corpse is disallowed.
a39ff7e2
A
35 *
36 * If the device under test is already under pressure, the test
37 * could fail due to jetsam cutting in and killing the parent, child or
38 * other necessary testing processes.
39 */
40
41/* Test variants */
0a7de745 42#define TEST_ALLOWED 0x1
a39ff7e2
A
43#define TEST_NOT_ALLOWED 0x2
44
45/*
46 * Values which the kernel OR's into the PID when a corpse
47 * is either allowed or disallowed for the
48 * kern.memorystatus_vm_map_fork_pidwatch sysctl.
49 */
0a7de745 50#define MEMORYSTATUS_VM_MAP_FORK_ALLOWED 0x100000000ul
a39ff7e2
A
51#define MEMORYSTATUS_VM_MAP_FORK_NOT_ALLOWED 0x200000000ul
52
53/*
54 * The memory allocation happens in a child process, this
55 * is stuff to deal with creating and managing the child.
56 * The child will only execute the T_HELPER_DECL.
57 */
58static char testpath[PATH_MAX];
59static uint32_t testpath_size = sizeof(testpath);
60#define LIMIT_DELTA_MB 5 /* an arbitrary limit delta */
0a7de745 61#define MEGABYTE (1024 * 1024)
a39ff7e2
A
62
63/*
64 * The child process communicates back to parent via an exit() code.
65 */
66enum child_exits {
67 NORMAL_EXIT = 0,
68 NO_MEMSIZE_ARG,
69 INVALID_MEMSIZE,
70 MALLOC_FAILED,
71 NUM_CHILD_EXIT
72};
73static char *child_exit_why[] = {
74 "normal exit",
75 "no memsize argument to child",
76 "invalid memsize argument to child",
77 "malloc() failed",
78};
79
80/*
81 * Corpse collection only happens in development kernels.
82 * So we need this to detect if the test is relevant.
83 */
84static boolean_t
85is_development_kernel(void)
86{
87 int ret;
88 int dev = 0;
89 size_t dev_size = sizeof(dev);
90
91 ret = sysctlbyname("kern.development", &dev, &dev_size, NULL, 0);
92 if (ret != 0) {
93 return FALSE;
94 }
95
0a7de745 96 return dev != 0;
a39ff7e2
A
97}
98
99/*
100 * Set/Get the sysctl used to determine if corpse collection occurs.
101 * This is done by the kernel checking for a specific PID.
102 */
103static void
104set_memorystatus_vm_map_fork_pidwatch(pid_t pid)
105{
106 uint64_t new_value = (uint64_t)pid;
107 size_t new_len = sizeof(new_value);
108 int err;
109
110 err = sysctlbyname("kern.memorystatus_vm_map_fork_pidwatch", NULL, NULL, &new_value, new_len);
111 T_QUIET;
112 T_ASSERT_POSIX_SUCCESS(err, "set sysctlbyname(kern.memorystatus_vm_map_fork_pidwatch...) failed");
113 return;
114}
115
116static uint64_t
117get_memorystatus_vm_map_fork_pidwatch()
118{
119 uint64_t value = 0;
120 size_t val_len = sizeof(value);
121 int err;
122
123 err = sysctlbyname("kern.memorystatus_vm_map_fork_pidwatch", &value, &val_len, NULL, 0);
124 T_QUIET;
125 T_ASSERT_POSIX_SUCCESS(err, "get sysctlbyname(kern.memorystatus_vm_map_fork_pidwatch...) failed");
126
127 return value;
128}
129
130/*
131 * We want to avoid jetsam giving us bad results, if possible. So check if there's
132 * enough memory for the test to run, waiting briefly for some to free up.
133 */
134static void
135wait_for_free_mem(int need_mb)
136{
0a7de745
A
137 int64_t memsize;
138 int memorystatus_level;
139 size_t size;
140 int64_t avail;
141 int err;
142 int try;
a39ff7e2
A
143
144 /*
145 * get amount of memory in the machine
146 */
147 size = sizeof(memsize);
148 err = sysctlbyname("hw.memsize", &memsize, &size, NULL, 0);
149 T_QUIET; T_ASSERT_POSIX_SUCCESS(err, "sysctlbyname(hw.memsize...) failed");
150
151 /*
152 * Use a loop to briefly sleep and recheck if short on memory.
153 */
154 try = 1;
155 for (;;) {
a39ff7e2
A
156 /*
157 * memorystatus_level is a percentage of memory available. For example 20 means 1/5 of memory.
158 * It currently doesn't exist on macOS but neither does jetsam, so pass the test there.
159 */
160 size = sizeof(memorystatus_level);
0a7de745 161 if (sysctlbyname("kern.memorystatus_level", &memorystatus_level, &size, NULL, 0) != 0) {
a39ff7e2 162 return;
0a7de745 163 }
a39ff7e2
A
164 T_QUIET; T_ASSERT_LE(memorystatus_level, 100, "memorystatus_level too high");
165 T_QUIET; T_ASSERT_GT(memorystatus_level, 0, "memorystatus_level negative");
166
167 /*
168 * jetsam kicks in at memory status level of 15%, so subtract that much out of what's available.
169 */
170 avail = MAX(0, (memsize * (memorystatus_level - 15)) / 100);
171
172 /*
173 * We're good to go if there's more than enough available.
174 */
0a7de745 175 if ((int64_t)need_mb * MEGABYTE < avail) {
a39ff7e2 176 return;
0a7de745 177 }
a39ff7e2
A
178
179 /*
180 * issue a message to log and sleep briefly to see if we can get more memory
181 */
0a7de745 182 if (try-- == 0) {
a39ff7e2 183 break;
0a7de745 184 }
a39ff7e2
A
185 T_LOG("Need %d MB, only %d MB available. sleeping 5 seconds for more to free. memorystatus_level %d",
186 need_mb, (int)(avail / MEGABYTE), memorystatus_level);
187 sleep(5);
188 }
189 T_SKIP("Needed %d MB, but only %d MB available. Skipping test to avoid jetsam issues.",
190 need_mb, (int)(avail / MEGABYTE));
191}
192
193
194/*
195 * The main test calls this to spawn child process which will run and
196 * exceed some memory limit. The child is initially suspended so that
197 * we can do the sysctl calls before it runs.
198 * Since this is a libdarwintest, the "-n" names the T_HELPER_DECL() that
199 * we want to run. The arguments specific to the test follow a "--".
200 */
201static pid_t
202spawn_child_process(
203 char * const executable,
204 char * const memlimit,
205 short flags,
206 int priority,
207 int active_limit_mb,
208 int inactive_limit_mb)
209{
210 posix_spawnattr_t spawn_attrs;
211 int err;
212 pid_t child_pid;
213 char * const argv_child[] = { executable, "-n", "child_process", "--", memlimit, NULL };
214
215 err = posix_spawnattr_init(&spawn_attrs);
216 T_QUIET; T_ASSERT_POSIX_SUCCESS(err, " posix_spawnattr_init() failed");
217
218 err = posix_spawnattr_setflags(&spawn_attrs, POSIX_SPAWN_START_SUSPENDED);
219 T_QUIET; T_ASSERT_POSIX_SUCCESS(err, " posix_spawnattr_setflags() failed");
220
221 err = posix_spawnattr_setjetsam_ext(&spawn_attrs, flags, priority, active_limit_mb, inactive_limit_mb);
222 T_QUIET; T_ASSERT_POSIX_SUCCESS(err, " posix_spawnattr_setjetsam_ext() failed");
223
224 err = posix_spawn(&child_pid, executable, NULL, &spawn_attrs, argv_child, environ);
225 T_QUIET; T_ASSERT_POSIX_SUCCESS(err, " posix_spawn() failed");
226
227 return child_pid;
228}
229
230
231/*
232 * The parent calls this to continue the suspended child, then wait for its result.
233 * We collect its resource usage to vefiry the expected amount allocated.
234 */
235static void
236test_child_process(pid_t child_pid, int *status, struct rusage *ru)
237{
238 int err = 0;
239 pid_t got_pid;
240
241 T_LOG(" continuing child[%d]\n", child_pid);
242
243 err = kill(child_pid, SIGCONT);
244 T_QUIET; T_ASSERT_POSIX_SUCCESS(err, " kill(%d, SIGCONT) failed", child_pid);
245
246 T_LOG(" waiting for child[%d] to exit", child_pid);
247
248 got_pid = wait4(child_pid, status, 0, ru);
249 T_QUIET; T_ASSERT_EQ(child_pid, got_pid, " wait4(%d, ...) returned %d", child_pid, got_pid);
250}
251
252/*
253 * The child process executes this code. The easiest way, with given darwintest infrastructure,
254 * it has to return information is via exit status.
255 */
256T_HELPER_DECL(child_process, "child allocates memory to failure")
257{
0a7de745
A
258#define BYTESPERALLOC MEGABYTE
259#define BYTESINEXCESS (2 * MEGABYTE) /* 2 MB - arbitrary */
a39ff7e2
A
260 char *limit;
261 long limit_mb = 0;
262 long max_bytes_to_munch, bytes_remaining, bytes_this_munch;
263 void *mem = NULL;
264
265 /*
266 * This helper is run in a child process. The helper sees one argument
267 * as a string which is the amount of memory in megabytes to allocate.
268 */
0a7de745 269 if (argc != 1) {
a39ff7e2 270 exit(NO_MEMSIZE_ARG);
0a7de745 271 }
a39ff7e2
A
272
273 limit = argv[0];
274 errno = 0;
275 limit_mb = strtol(limit, NULL, 10);
0a7de745 276 if (errno != 0 || limit_mb <= 0) {
a39ff7e2 277 exit(INVALID_MEMSIZE);
0a7de745 278 }
a39ff7e2
A
279
280 /* Compute in excess of assigned limit */
281 max_bytes_to_munch = limit_mb * MEGABYTE;
282 max_bytes_to_munch += BYTESINEXCESS;
283
284 for (bytes_remaining = max_bytes_to_munch; bytes_remaining > 0; bytes_remaining -= bytes_this_munch) {
285 bytes_this_munch = MIN(bytes_remaining, BYTESPERALLOC);
286
287 mem = malloc((size_t)bytes_this_munch);
0a7de745 288 if (mem == NULL) {
a39ff7e2 289 exit(MALLOC_FAILED);
0a7de745 290 }
a39ff7e2
A
291 arc4random_buf(mem, (size_t)bytes_this_munch);
292 }
293
294 /* We chewed up all the memory we were asked to. */
295 exit(NORMAL_EXIT);
296}
297
298
299/*
300 * Actual test body.
301 */
302static void
303memorystatus_vm_map_fork_parent(int test_variant)
304{
0a7de745
A
305 int max_task_pmem = 0; /* MB */
306 size_t size = 0;
307 int active_limit_mb = 0;
308 int inactive_limit_mb = 0;
309 short flags = 0;
310 char memlimit_str[16];
311 pid_t child_pid;
312 int child_status;
313 uint64_t kernel_pidwatch_val;
314 uint64_t expected_pidwatch_val;
315 int ret;
316 struct rusage ru;
a39ff7e2
A
317 enum child_exits exit_val;
318
319 /*
320 * The code to set/get the pidwatch sysctl is only in
321 * development kernels. Skip the test if not on one.
322 */
323 if (!is_development_kernel()) {
324 T_SKIP("Can't test on release kernel");
325 }
326
327 /*
328 * Determine a memory limit based on system having one or not.
329 */
330 size = sizeof(max_task_pmem);
331 (void)sysctlbyname("kern.max_task_pmem", &max_task_pmem, &size, NULL, 0);
0a7de745 332 if (max_task_pmem <= 0) {
a39ff7e2 333 max_task_pmem = 0;
0a7de745 334 }
a39ff7e2
A
335
336 if (test_variant == TEST_ALLOWED) {
a39ff7e2 337 /*
d9a64523 338 * Tell the child to allocate less than 1/4 the system wide limit.
a39ff7e2 339 */
d9a64523 340 if (max_task_pmem / 4 - LIMIT_DELTA_MB <= 0) {
a39ff7e2
A
341 active_limit_mb = LIMIT_DELTA_MB;
342 } else {
d9a64523 343 active_limit_mb = max_task_pmem / 4 - LIMIT_DELTA_MB;
a39ff7e2
A
344 }
345 expected_pidwatch_val = MEMORYSTATUS_VM_MAP_FORK_ALLOWED;
a39ff7e2 346 } else { /* TEST_NOT_ALLOWED */
a39ff7e2 347 /*
d9a64523 348 * Tell the child to allocate more than 1/4 the system wide limit.
a39ff7e2 349 */
d9a64523 350 active_limit_mb = (max_task_pmem / 4) + LIMIT_DELTA_MB;
a39ff7e2
A
351 if (max_task_pmem == 0) {
352 expected_pidwatch_val = MEMORYSTATUS_VM_MAP_FORK_ALLOWED;
353 } else {
354 expected_pidwatch_val = MEMORYSTATUS_VM_MAP_FORK_NOT_ALLOWED;
355 }
a39ff7e2
A
356 }
357 inactive_limit_mb = active_limit_mb;
358 T_LOG("using limit of %d Meg", active_limit_mb);
359
360 /*
361 * When run as part of a larger suite, a previous test
362 * may have left the system temporarily with too little
363 * memory to run this test. We try to detect if there is
364 * enough free memory to proceed, waiting a little bit
365 * for memory to free up.
366 */
367 wait_for_free_mem(active_limit_mb);
368
f427ee49 369#if TARGET_OS_OSX
a39ff7e2
A
370 /*
371 * vm_map_fork() is always allowed on desktop.
372 */
373 expected_pidwatch_val = MEMORYSTATUS_VM_MAP_FORK_ALLOWED;
374#endif
375
376 /*
377 * Prepare the arguments needed to spawn the child process.
378 */
0a7de745 379 memset(memlimit_str, 0, sizeof(memlimit_str));
a39ff7e2
A
380 (void)sprintf(memlimit_str, "%d", active_limit_mb);
381
382 ret = _NSGetExecutablePath(testpath, &testpath_size);
383 T_QUIET; T_ASSERT_POSIX_SUCCESS(ret, "_NSGetExecutablePath(%s, ...)", testpath);
384
385 /*
386 * We put the child process in FOREGROUND to try and keep jetsam's hands off it.
387 */
388 child_pid = spawn_child_process(testpath, memlimit_str, flags,
389 JETSAM_PRIORITY_FOREGROUND, active_limit_mb, inactive_limit_mb);
390
391 expected_pidwatch_val |= (uint64_t)child_pid;
392
393 /*
394 * We only reach here if parent successfully spawned child process.
395 */
396 T_LOG(" spawned child_pid[%d] with memlimit %s (%d)MB\n",
397 child_pid, memlimit_str, active_limit_mb);
398
399 /*
400 * Set the kernel's pidwatch to look for the child.
401 */
402 (void)set_memorystatus_vm_map_fork_pidwatch((pid_t)0);
403 (void)set_memorystatus_vm_map_fork_pidwatch(child_pid);
404
405 /*
406 * Let the child run and wait for it to finish.
407 */
408 test_child_process(child_pid, &child_status, &ru);
409 T_LOG("Child exited with max_rss of %ld", ru.ru_maxrss);
410
411 /*
412 * Retrieve the kernel's pidwatch value. This should now indicate
413 * if the corpse was allowed or not.
414 */
415 kernel_pidwatch_val = get_memorystatus_vm_map_fork_pidwatch();
416 (void)set_memorystatus_vm_map_fork_pidwatch((pid_t)0);
417
418 /*
419 * If the child died abnormally, the test is invalid.
420 */
421 if (!WIFEXITED(child_status)) {
422 if (WIFSIGNALED(child_status)) {
423 /* jetsam kills a process with SIGKILL */
0a7de745 424 if (WTERMSIG(child_status) == SIGKILL) {
a39ff7e2 425 T_LOG("Child appears to have been a jetsam victim");
0a7de745 426 }
a39ff7e2
A
427 T_SKIP("Child terminated by signal %d test result invalid", WTERMSIG(child_status));
428 }
429 T_SKIP("child did not exit normally (status=%d) test result invalid", child_status);
430 }
431
432 /*
433 * We don't expect the child to exit for any other reason than success
434 */
435 exit_val = (enum child_exits)WEXITSTATUS(child_status);
0a7de745 436 T_QUIET; T_ASSERT_EQ(exit_val, NORMAL_EXIT, "child exit due to: %s",
a39ff7e2
A
437 (0 < exit_val && exit_val < NUM_CHILD_EXIT) ? child_exit_why[exit_val] : "unknown");
438
439 /*
440 * If the kernel aborted generating a corpse for other reasons, the test is invalid.
441 */
442 if (kernel_pidwatch_val == -1ull) {
443 T_SKIP("corpse generation was aborted by kernel");
444 }
445
446 /*
447 * We should always have made it through the vm_map_fork() checks in the kernel for this test.
448 */
449 T_QUIET; T_ASSERT_NE_ULLONG(kernel_pidwatch_val, (uint64_t)child_pid, "child didn't trigger corpse generation");
450
451 T_EXPECT_EQ(kernel_pidwatch_val, expected_pidwatch_val, "kernel value 0x%llx - expected 0x%llx",
452 kernel_pidwatch_val, expected_pidwatch_val);
453}
454
455/*
456 * The order of these 2 test functions is important. They will be executed by the test framwork in order.
457 *
458 * We test "not allowed first", then "allowed". If it were the other way around, the corpse from the "allowed"
459 * test would likely cause memory pressure and jetsam would likely kill the "not allowed" test.
460 */
f427ee49 461T_DECL(memorystatus_vm_map_fork_test_not_allowed, "test that corpse generation was not allowed", T_META_ASROOT(true))
a39ff7e2
A
462{
463 memorystatus_vm_map_fork_parent(TEST_NOT_ALLOWED);
464}
465
f427ee49 466T_DECL(memorystatus_vm_map_fork_test_allowed, "test corpse generation allowed", T_META_ASROOT(true))
a39ff7e2 467{
a39ff7e2
A
468 memorystatus_vm_map_fork_parent(TEST_ALLOWED);
469}