14 #include <sys/sysctl.h>
15 #include <mach/mach_time.h>
16 #include <mach/mach.h>
17 #include <mach/semaphore.h>
18 #include <TargetConditionals.h>
24 #include <darwintest.h>
25 #include <stdatomic.h>
27 #define MAX_THREADS 32
29 #define THR_SPINNER_PRI 63
30 #define THR_MANAGER_PRI 62
31 #define WARMUP_ITERATIONS 100
32 #define FILE_SIZE (16384 * 4096)
36 static mach_timebase_info_data_t timebase_info
;
37 static semaphore_t semaphore
;
38 static semaphore_t worker_sem
;
39 static uint32_t g_numcpus
;
40 static _Atomic
uint32_t keep_going
= 1;
42 char *data_buf
= NULL
;
43 extern char **environ
;
47 } threads
[MAX_THREADS
];
50 nanos_to_abs(uint64_t nanos
)
52 return nanos
* timebase_info
.denom
/ timebase_info
.numer
;
56 io_perf_test_io_init(void)
59 char *const mount_args
[] = {"/usr/local/sbin/mount_nand.sh", NULL
};
60 spawn_ret
= posix_spawn(&pid
, mount_args
[0], NULL
, NULL
, mount_args
, environ
);
62 T_SKIP("NAND mounting in LTE not possible on this device. Skipping test!");
64 waitpid(pid
, &spawn_ret
, 0);
65 if (WIFEXITED(spawn_ret
) && !WEXITSTATUS(spawn_ret
)) {
66 T_PASS("NAND mounted successfully");
68 T_SKIP("Unable to mount NAND. Skipping test!");
71 /* Mark the main thread as fixed priority */
72 struct sched_param param
= {.sched_priority
= THR_MANAGER_PRI
};
73 T_ASSERT_POSIX_ZERO(pthread_setschedparam(pthread_self(), SCHED_FIFO
, ¶m
),
74 "pthread_setschedparam");
76 /* Set I/O Policy to Tier 0 */
77 T_ASSERT_POSIX_ZERO(setiopolicy_np(IOPOL_TYPE_DISK
, IOPOL_SCOPE_PROCESS
,
78 IOPOL_IMPORTANT
), "setiopolicy");
80 /* Create data buffer */
81 data_buf
= malloc(IO_SIZE
* 16);
82 T_ASSERT_NOTNULL(data_buf
, "Data buffer allocation");
84 int rndfd
= open("/dev/urandom", O_RDONLY
, S_IRUSR
);
85 T_ASSERT_POSIX_SUCCESS(rndfd
, "Open /dev/urandom");
86 T_ASSERT_GE_INT((int)read(rndfd
, data_buf
, IO_SIZE
* 16), 0, "read /dev/urandom");
89 /* Create test file */
90 int fd
= open("/mnt2/test", O_CREAT
| O_WRONLY
, S_IRUSR
);
91 T_ASSERT_POSIX_SUCCESS(fd
, 0, "Open /mnt2/test for writing!");
93 T_ASSERT_POSIX_ZERO(fcntl(fd
, F_NOCACHE
, 1), "fcntl F_NOCACHE enable");
94 for (int size
= 0; size
< FILE_SIZE
;) {
96 T_ASSERT_GE_INT((int)write(fd
, data_buf
, IO_SIZE
* 16), 0, "write test file");
97 size
+= (IO_SIZE
* 16);
105 create_thread(uint32_t thread_id
, uint32_t priority
, bool fixpri
,
106 void *(*start_routine
)(void *))
109 pthread_t new_thread
;
110 struct sched_param param
= { .sched_priority
= (int)priority
};
113 T_ASSERT_POSIX_ZERO(pthread_attr_init(&attr
), "pthread_attr_init");
115 T_ASSERT_POSIX_ZERO(pthread_attr_setschedparam(&attr
, ¶m
),
116 "pthread_attr_setschedparam");
119 T_ASSERT_POSIX_ZERO(pthread_attr_setschedpolicy(&attr
, SCHED_RR
),
120 "pthread_attr_setschedpolicy");
123 T_ASSERT_POSIX_ZERO(pthread_create(&new_thread
, &attr
, start_routine
,
124 (void*)(uintptr_t)thread_id
), "pthread_create");
126 T_ASSERT_POSIX_ZERO(pthread_attr_destroy(&attr
), "pthread_attr_destroy");
128 threads
[thread_id
].thread
= new_thread
;
133 /* Spin until a specified number of seconds elapses */
135 spin_for_duration(uint32_t seconds
)
137 uint64_t duration
= nanos_to_abs((uint64_t)seconds
* NSEC_PER_SEC
);
138 uint64_t current_time
= mach_absolute_time();
139 uint64_t timeout
= duration
+ current_time
;
141 uint64_t spin_count
= 0;
143 while (mach_absolute_time() < timeout
&& atomic_load_explicit(&keep_going
,
144 memory_order_relaxed
)) {
150 spin_thread(void *arg
)
152 uint32_t thread_id
= (uint32_t) arg
;
155 snprintf(name
, sizeof(name
), "spin thread %2d", thread_id
);
156 pthread_setname_np(name
);
157 T_ASSERT_MACH_SUCCESS(semaphore_wait_signal(semaphore
, worker_sem
),
158 "semaphore_wait_signal");
159 spin_for_duration(SPIN_SECS
);
164 perform_io(dt_stat_time_t stat
)
166 /* Open the test data file */
167 int test_file_fd
= open("/mnt2/test", O_RDONLY
);
169 T_ASSERT_POSIX_SUCCESS(test_file_fd
, "Open test data file");
171 /* Disable caching and read-ahead for the file */
172 T_ASSERT_POSIX_ZERO(fcntl(test_file_fd
, F_NOCACHE
, 1), "fcntl F_NOCACHE enable");
173 T_ASSERT_POSIX_ZERO(fcntl(test_file_fd
, F_RDAHEAD
, 0), "fcntl F_RDAHEAD disable");
178 for (int i
=0; i
< WARMUP_ITERATIONS
; i
++) {
180 read(test_file_fd
, data_buf
, IO_SIZE
);
184 T_STAT_MEASURE(stat
) {
185 ret
= read(test_file_fd
, data_buf
, IO_SIZE
);
189 T_ASSERT_POSIX_SUCCESS(lseek(test_file_fd
, 0, SEEK_SET
), "lseek begin");
190 } else if (ret
< 0) {
191 T_FAIL("read failure");
195 } while(count
< IO_COUNT
);
/* File-wide test metadata: the "xnu.io" namespace plus the perf tag. */
199 T_GLOBAL_META(T_META_NAMESPACE("xnu.io"), T_META_TAG_PERF
);
/*
 * read_perf: measures read latency on /mnt2/test twice through perform_io().
 * The first pass runs before any spinner thread exists; the second runs while
 * g_numcpus - 1 spinner threads created at THR_SPINNER_PRI are spinning.
 *
 * NOTE(review): this definition is garbled in this copy - the opening brace,
 * the #if matching the #endif below, the tail of the create_thread() call and
 * the closing braces are not visible. The code is left untouched here.
 */
201 /* Disable the test on MacOS for now */
202 T_DECL(read_perf
, "Sequential Uncached Read Performance", T_META_TYPE_PERF
, T_META_CHECK_LEAKS(NO
), T_META_ASROOT(YES
), T_META_LTEPHASE(LTE_POSTINIT
))
206 T_SKIP("Not supported on MacOS");
207 #endif /* !CONFIG_EMBEDDED */
/* Mount the device, create the test file and raise the main thread's priority. */
209 io_perf_test_io_init();
210 pthread_setname_np("main thread");
/* timebase_info must be valid before any spinner calls nanos_to_abs(). */
212 T_ASSERT_MACH_SUCCESS(mach_timebase_info(&timebase_info
), "mach_timebase_info");
/* First pass: no spinner threads have been created yet. */
214 dt_stat_time_t seq_noload
= dt_stat_time_create("sequential read latency (CPU idle)");
215 perform_io(seq_noload
);
216 dt_stat_finalize(seq_noload
);
/*
 * NOTE(review): the next three lines read like the interior of a block
 * comment whose opening and closing delimiters are missing from this copy.
 */
219 * We create spinner threads for this test so that all other cores are
220 * busy. That way the I/O issue thread has to context switch to the
221 * IOWorkLoop thread and back for the I/O.
/* Both semaphores start at 0, so the first wait on either one blocks. */
223 T_ASSERT_MACH_SUCCESS(semaphore_create(mach_task_self(), &semaphore
,
224 SYNC_POLICY_FIFO
, 0), "semaphore_create");
226 T_ASSERT_MACH_SUCCESS(semaphore_create(mach_task_self(), &worker_sem
,
227 SYNC_POLICY_FIFO
, 0), "semaphore_create");
229 size_t ncpu_size
= sizeof(g_numcpus
);
230 T_ASSERT_POSIX_SUCCESS(sysctlbyname("hw.ncpu", &g_numcpus
, &ncpu_size
, NULL
, 0),
231 "sysctlbyname(hw.ncpu)");
/* NOTE(review): g_numcpus is a uint32_t but is printed with %d. */
233 T_LOG("hw.ncpu: %d\n", g_numcpus
);
/*
 * One spinner per CPU except one.
 * NOTE(review): n_spinners is not checked against MAX_THREADS, the capacity
 * of threads[], and g_numcpus - 1 wraps around if hw.ncpu ever reads as 0.
 */
234 uint32_t n_spinners
= g_numcpus
- 1;
/*
 * NOTE(review): create_thread() already stores the handle in
 * threads[thread_id].thread, so this assignment repeats that store.
 */
236 for (uint32_t thread_id
= 0; thread_id
< n_spinners
; thread_id
++) {
237 threads
[thread_id
].thread
= create_thread(thread_id
, THR_SPINNER_PRI
,
/* Wait for one worker_sem signal per spinner before releasing them. */
241 for (uint32_t thread_id
= 0; thread_id
< n_spinners
; thread_id
++) {
242 T_ASSERT_MACH_SUCCESS(semaphore_wait(worker_sem
), "semaphore_wait");
/* Release every spinner blocked on semaphore at once. */
245 T_ASSERT_MACH_SUCCESS(semaphore_signal_all(semaphore
), "semaphore_signal");
/* Second pass: same measurement while the spinners are running. */
247 dt_stat_time_t seq_load
= dt_stat_time_create("sequential read latency (Single CPU)");
248 perform_io(seq_load
);
249 dt_stat_finalize(seq_load
);
/* Tell the spinners to stop early, then join each of them. */
251 atomic_store_explicit(&keep_going
, 0, memory_order_relaxed
);
252 for (uint32_t thread_id
= 0; thread_id
< n_spinners
; thread_id
++) {
253 T_ASSERT_POSIX_ZERO(pthread_join(threads
[thread_id
].thread
, NULL
),
254 "pthread_join %d", thread_id
);