git.saurik.com Git - apple/xnu.git/blob - tools/tests/zero-to-n/zero-to-n.c

1 /*

3 *

4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@

5 *

6 * This file contains Original Code and/or Modifications of Original Code

7 * as defined in and that are subject to the Apple Public Source License

8 * Version 2.0 (the 'License'). You may not use this file except in

9 * compliance with the License. The rights granted to you under the License

10 * may not be used to create, or enable the creation or redistribution of,

11 * unlawful or unlicensed copies of an Apple operating system, or to

12 * circumvent, violate, or enable the circumvention or violation of, any

13 * terms of an Apple operating system software license agreement.

14 *

15 * Please obtain a copy of the License at

16 * http://www.opensource.apple.com/apsl/ and read it before using this file.

17 *

18 * The Original Code and all software distributed under the License are

19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER

20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,

21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,

22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.

23 * Please see the License for the specific language governing rights and

24 * limitations under the License.

25 *

26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@

27 */

28 #include <unistd.h>

29 #include <stdio.h>

30 #include <math.h>

31 #include <sys/kdebug.h>

32 #include <stdlib.h>

33 #include <pthread.h>

34 #include <errno.h>

35 #include <err.h>

36 #include <string.h>

37 #include <assert.h>

38 #include <sysexits.h>

39 #include <sys/sysctl.h>

40 #include <getopt.h>

41 #include <libproc.h>

43 #include <spawn.h>

44 #include <spawn_private.h>

45 #include <sys/spawn_internal.h>

46 #include <mach-o/dyld.h>

48 #include <mach/mach_time.h>

49 #include <mach/mach.h>

50 #include <mach/task.h>

51 #include <mach/semaphore.h>

53 #include <pthread/qos_private.h>

55 #include <sys/resource.h>

57 #include <stdatomic.h>

59 #include <os/tsd.h>

60 #include <os/lock.h>

61 #include <TargetConditionals.h>

 /*
 * How the worker threads are woken at the start of each iteration.
 * The quoted names are the strings accepted by parse_wakeup_pattern().
 */
typedef enum wake_type {
	WAKE_BROADCAST_ONESEM,          /* "broadcast-single-sem": leader does semaphore_signal_all() on one semaphore */
	WAKE_BROADCAST_PERTHREAD,       /* "broadcast-per-thread": leader signals each thread's own semaphore */
	WAKE_CHAIN,                     /* "chain": every thread signals the next thread's semaphore */
	WAKE_HOP                        /* "hop": every thread signals the next one, then waits on the done semaphore */
} wake_type_t;

 /*
 * Scheduling policy applied to each worker thread by thread_setup().
 * The quoted names are the strings accepted by parse_thread_policy().
 */
typedef enum my_policy_type {
	MY_POLICY_REALTIME,             /* "realtime" */
	MY_POLICY_TIMESHARE,            /* "timeshare" */
	MY_POLICY_TIMESHARE_NO_SMT,     /* "timeshare_no_smt" */
	MY_POLICY_FIXEDPRI              /* "fixed" */
} my_policy_type_t;

 /*
 * Assertion helpers: report a non-zero error code on stderr, then assert.
 *
 * mach_assert_zero(error)         - Mach error code, decoded with mach_error_string()
 * mach_assert_zero_t(tid, error)  - same, tagged with a thread id
 * assert_zero_t(tid, error)       - plain integer value, tagged with a thread id
 *
 * The `error` argument is evaluated exactly once and captured in a local, so
 * the value that is tested, printed and asserted on is always the same one,
 * even when the argument is a function call or an atomic load.
 * `tid` is only evaluated on the failure path.
 */
#define mach_assert_zero(error) \
	do { \
		__typeof__(error) _maz_err = (error); \
		if (_maz_err != 0) { \
			fprintf(stderr, "[FAIL] error %d (%s) ", _maz_err, mach_error_string(_maz_err)); \
			assert(_maz_err == 0); \
		} \
	} while (0)

#define mach_assert_zero_t(tid, error) \
	do { \
		__typeof__(error) _mazt_err = (error); \
		if (_mazt_err != 0) { \
			fprintf(stderr, "[FAIL] Thread %d error %d (%s) ", (tid), _mazt_err, mach_error_string(_mazt_err)); \
			assert(_mazt_err == 0); \
		} \
	} while (0)

#define assert_zero_t(tid, error) \
	do { \
		__typeof__(error) _azt_err = (error); \
		if (_azt_err != 0) { \
			fprintf(stderr, "[FAIL] Thread %d error %d ", (tid), _azt_err); \
			assert(_azt_err == 0); \
		} \
	} while (0)

/*
 * Time constants, all in nanoseconds (type long long).
 * CONSTRAINT/COMPUTATION feed the realtime policy in thread_setup();
 * the LL_ variants are used when low-latency realtime is requested.
 */
#define CONSTRAINT_NANOS        (20 * 1000 * 1000ll)    /* 20 ms */
#define COMPUTATION_NANOS       (10 * 1000 * 1000ll)    /* 10 ms */
#define LL_CONSTRAINT_NANOS     (2 * 1000 * 1000ll)     /*  2 ms */
#define LL_COMPUTATION_NANOS    (1 * 1000 * 1000ll)     /*  1 ms */
#define RT_CHURN_COMP_NANOS     (1 * 1000 * 1000ll)     /*  1 ms */
#define TRACEWORTHY_NANOS       (10 * 1000 * 1000ll)    /* 10 ms */
#define TRACEWORTHY_NANOS_TEST  (2 * 1000 * 1000ll)     /*  2 ms */

/*
 * debug_log(): printf-style tracing. Expands to printf() when DEBUG is
 * non-zero and to an empty statement (arguments not evaluated) otherwise.
 */
#if DEBUG
#define debug_log(...) printf(__VA_ARGS__)
#else
#define debug_log(...) do { } while (0)
#endif

/* Forward declarations for functions used before (or defined after) their first use */
static void *worker_thread(void *arg);
static void usage();
static int thread_setup(uint32_t my_id);
static my_policy_type_t parse_thread_policy(const char *str);
static void selfexec_with_apptype(int argc, char *argv[]);
static void parse_args(int argc, char *argv[]);

 /*
 * State shared between threads through C11 atomics. Each variable is
 * aligned to 128 bytes (presumably so they do not share a cache line).
 *
 * g_done_threads      - bumped by every worker once it has run in an iteration
 * g_churn_stop        - set to TRUE by join_churn_threads() to end the churn spin
 * g_churn_stopped_at  - sum of the spin counts of churn threads that have exited
 */
static _Atomic uint32_t  g_done_threads     __attribute__((aligned(128)));
static _Atomic boolean_t g_churn_stop       __attribute__((aligned(128))) = FALSE;
static _Atomic uint64_t  g_churn_stopped_at __attribute__((aligned(128))) = 0;

96 /* Global variables (general) */

97 static uint32_t g_numcpus;

98 static uint32_t g_nphysicalcpu;

99 static uint32_t g_nlogicalcpu;

100 static uint32_t g_numthreads;

101 static wake_type_t g_waketype;

102 static policy_t g_policy;

103 static uint32_t g_iterations;

104 static struct mach_timebase_info g_mti;

105 static semaphore_t g_main_sem;

106 static uint64_t *g_thread_endtimes_abs;

107 static boolean_t g_verbose = FALSE;

108 static boolean_t g_do_affinity = FALSE;

109 static uint64_t g_starttime_abs;

110 static uint32_t g_iteration_sleeptime_us = 0;

111 static uint32_t g_priority = 0;

112 static uint32_t g_churn_pri = 0;

113 static uint32_t g_churn_count = 0;

114 static uint32_t g_rt_churn_count = 0;

115

116 static pthread_t* g_churn_threads = NULL;

117 static pthread_t* g_rt_churn_threads = NULL;

118

119 /* should we skip test if run on non-intel */

120 static boolean_t g_run_on_intel_only = FALSE;

121

122 /* Threshold for dropping a 'bad run' tracepoint */

123 static uint64_t g_traceworthy_latency_ns = TRACEWORTHY_NANOS;

124

125 /* Have we re-execed to set apptype? */

126 static boolean_t g_seen_apptype = FALSE;

127

128 /* usleep in betweeen iterations */

129 static boolean_t g_do_sleep = TRUE;

130

131 /* Every thread spins until all threads have checked in */

132 static boolean_t g_do_all_spin = FALSE;

133

134 /* Every thread backgrounds temporarily before parking */

135 static boolean_t g_drop_priority = FALSE;

136

137 /* Use low-latency (sub 4ms deadline) realtime threads */

138 static boolean_t g_rt_ll = FALSE;

139

140 /* Test whether realtime threads are scheduled on the separate CPUs */

141 static boolean_t g_test_rt = FALSE;

142

143 static boolean_t g_rt_churn = FALSE;

144

145 /* On SMT machines, test whether realtime threads are scheduled on the correct CPUs */

146 static boolean_t g_test_rt_smt = FALSE;

147

148 /* Test whether realtime threads are successfully avoiding CPU 0 on Intel */

149 static boolean_t g_test_rt_avoid0 = FALSE;

150

151 /* Print a histgram showing how many threads ran on each CPU */

152 static boolean_t g_histogram = FALSE;

153

154 /* One randomly chosen thread holds up the train for a certain duration. */

155 static boolean_t g_do_one_long_spin = FALSE;

156 static uint32_t g_one_long_spin_id = 0;

157 static uint64_t g_one_long_spin_length_abs = 0;

158 static uint64_t g_one_long_spin_length_ns = 0;

159

160 /* Each thread spins for a certain duration after waking up before blocking again. */

161 static boolean_t g_do_each_spin = FALSE;

162 static uint64_t g_each_spin_duration_abs = 0;

163 static uint64_t g_each_spin_duration_ns = 0;

164

165 /* Global variables (broadcast) */

166 static semaphore_t g_broadcastsem;

167 static semaphore_t g_leadersem;

168 static semaphore_t g_readysem;

169 static semaphore_t g_donesem;

170 static semaphore_t g_rt_churn_sem;

171 static semaphore_t g_rt_churn_start_sem;

172

173 /* Global variables (chain) */

174 static semaphore_t *g_semarr;

175

/*
 * Per-CPU bookkeeping, one entry per CPU, each entry aligned to 128 bytes.
 *
 *   current - set to 1 by a worker that woke up on this CPU during the
 *             current iteration; cleared by the leader once recorded
 *   accum   - running count of wakeups observed on this CPU
 */
typedef struct {
	uint32_t current __attribute__((aligned(128)));
	uint32_t accum;
} histogram_t;

/* Array of g_numcpus entries, indexed by CPU number */
static histogram_t      *g_cpu_histogram;

/* One bitmask per iteration; bit N is set when a worker ran on CPU N */
static _Atomic uint64_t *g_cpu_map;

183

184 static uint64_t

185 abs_to_nanos(uint64_t abstime)

186 {

         return (uint64_t)(abstime * (((double)g_mti.numer) / ((double)g_mti.denom)));

188 }

189

190 static uint64_t

191 nanos_to_abs(uint64_t ns)

192 {

         return (uint64_t)(ns * (((double)g_mti.denom) / ((double)g_mti.numer)));

194 }

195

/*
 * Issue the architecture's spin-wait hint instruction ("yield" on ARM,
 * "pause" on x86). Used inside busy-wait loops.
 *
 * __asm__ is used instead of asm so the file also builds in strict ISO C
 * modes, and __aarch64__ is accepted alongside __arm64__.
 */
static inline void
yield(void)
{
#if defined(__arm__) || defined(__arm64__) || defined(__aarch64__)
	__asm__ volatile ("yield");
#elif defined(__x86_64__) || defined(__i386__)
	__asm__ volatile ("pause");
#else
#error Unrecognized architecture
#endif
}

207

208 static void *

 churn_thread(__unused void *arg)

210 {

211 uint64_t spin_count = 0;

212

213 /*

214 * As a safety measure to avoid wedging, we will bail on the spin if

215 * it's been more than 1s after the most recent run start

216 */

217

218 while (g_churn_stop == FALSE &&

219 mach_absolute_time() < (g_starttime_abs + NSEC_PER_SEC)) {

220 spin_count++;

221 yield();

222 }

223

224 /* This is totally racy, but only here to detect if anyone stops early */

         atomic_fetch_add_explicit(&g_churn_stopped_at, spin_count, memory_order_relaxed);

226

227 return NULL;

228 }

229

230 static void

231 create_churn_threads()

232 {

         if (g_churn_count == 0) {

                 g_churn_count = g_test_rt_smt ? g_numcpus : g_numcpus - 1;

235 }

236

237 errno_t err;

238

         struct sched_param param = { .sched_priority = (int)g_churn_pri };

240 pthread_attr_t attr;

241

242 /* Array for churn threads */

         g_churn_threads = (pthread_t*) valloc(sizeof(pthread_t) * g_churn_count);

244 assert(g_churn_threads);

245

         if ((err = pthread_attr_init(&attr))) {

                 errc(EX_OSERR, err, "pthread_attr_init");

248 }

249

         if ((err = pthread_attr_setschedparam(&attr, &param))) {

                 errc(EX_OSERR, err, "pthread_attr_setschedparam");

252 }

253

         if ((err = pthread_attr_setschedpolicy(&attr, SCHED_RR))) {

                 errc(EX_OSERR, err, "pthread_attr_setschedpolicy");

256 }

257

         for (uint32_t i = 0; i < g_churn_count; i++) {

259 pthread_t new_thread;

260

                 if ((err = pthread_create(&new_thread, &attr, churn_thread, NULL))) {

                         errc(EX_OSERR, err, "pthread_create");

263 }

264 g_churn_threads[i] = new_thread;

265 }

266

         if ((err = pthread_attr_destroy(&attr))) {

                 errc(EX_OSERR, err, "pthread_attr_destroy");

269 }

270 }

271

272 static void

273 join_churn_threads(void)

274 {

         if (atomic_load_explicit(&g_churn_stopped_at, memory_order_seq_cst) != 0) {

                 printf("Warning: Some of the churn threads may have stopped early: %lld\n",

277 g_churn_stopped_at);

278 }

279

         atomic_store_explicit(&g_churn_stop, TRUE, memory_order_seq_cst);

281

282 /* Rejoin churn threads */

         for (uint32_t i = 0; i < g_churn_count; i++) {

                 errno_t err = pthread_join(g_churn_threads[i], NULL);

285 if (err) {

                         errc(EX_OSERR, err, "pthread_join %d", i);

287 }

288 }

289 }

290

291 /*

292 * Set policy

293 */

294 static int

295 rt_churn_thread_setup(void)

296 {

297 kern_return_t kr;

298 thread_time_constraint_policy_data_t pol;

299

300 /* Hard-coded realtime parameters (similar to what Digi uses) */

301 pol.period = 100000;

         pol.constraint  = (uint32_t) nanos_to_abs(CONSTRAINT_NANOS * 2);

         pol.computation = (uint32_t) nanos_to_abs(RT_CHURN_COMP_NANOS * 2);

         pol.preemptible = 0;         /* Ignored by OS */

305

         kr = thread_policy_set(mach_thread_self(), THREAD_TIME_CONSTRAINT_POLICY,

307 (thread_policy_t) &pol, THREAD_TIME_CONSTRAINT_POLICY_COUNT);

         mach_assert_zero_t(0, kr);

309

310 return 0;

311 }

312

313 static void *

 rt_churn_thread(__unused void *arg)

315 {

316 rt_churn_thread_setup();

317

         for (uint32_t i = 0; i < g_iterations; i++) {

                 kern_return_t kr = semaphore_wait_signal(g_rt_churn_start_sem, g_rt_churn_sem);

                 mach_assert_zero_t(0, kr);

321

                 volatile double x = 0.0;

                 volatile double y = 0.0;

324

                 uint64_t endspin = mach_absolute_time() + nanos_to_abs(RT_CHURN_COMP_NANOS);

                 while (mach_absolute_time() < endspin) {

                         y = y + 1.5 + x;

328 x = sqrt(y);

329 }

330 }

331

332 kern_return_t kr = semaphore_signal(g_rt_churn_sem);

         mach_assert_zero_t(0, kr);

334

335 return NULL;

336 }

337

338 static void

339 wait_for_rt_churn_threads(void)

340 {

         for (uint32_t i = 0; i < g_rt_churn_count; i++) {

342 kern_return_t kr = semaphore_wait(g_rt_churn_sem);

                 mach_assert_zero_t(0, kr);

344 }

345 }

346

347 static void

348 start_rt_churn_threads(void)

349 {

         for (uint32_t i = 0; i < g_rt_churn_count; i++) {

351 kern_return_t kr = semaphore_signal(g_rt_churn_start_sem);

                 mach_assert_zero_t(0, kr);

353 }

354 }

355

356 static void

357 create_rt_churn_threads(void)

358 {

         if (g_rt_churn_count == 0) {

360 /* Leave 1 CPU to ensure that the main thread can make progress */

361 g_rt_churn_count = g_numcpus - 1;

362 }

363

364 errno_t err;

365

         struct sched_param param = { .sched_priority = (int)g_churn_pri };

367 pthread_attr_t attr;

368

369 /* Array for churn threads */

         g_rt_churn_threads = (pthread_t*) valloc(sizeof(pthread_t) * g_rt_churn_count);

371 assert(g_rt_churn_threads);

372

         if ((err = pthread_attr_init(&attr))) {

                 errc(EX_OSERR, err, "pthread_attr_init");

375 }

376

         if ((err = pthread_attr_setschedparam(&attr, &param))) {

                 errc(EX_OSERR, err, "pthread_attr_setschedparam");

379 }

380

         if ((err = pthread_attr_setschedpolicy(&attr, SCHED_RR))) {

                 errc(EX_OSERR, err, "pthread_attr_setschedpolicy");

383 }

384

         for (uint32_t i = 0; i < g_rt_churn_count; i++) {

386 pthread_t new_thread;

387

                 if ((err = pthread_create(&new_thread, &attr, rt_churn_thread, NULL))) {

                         errc(EX_OSERR, err, "pthread_create");

390 }

391 g_rt_churn_threads[i] = new_thread;

392 }

393

         if ((err = pthread_attr_destroy(&attr))) {

                 errc(EX_OSERR, err, "pthread_attr_destroy");

396 }

397

398 /* Wait until all threads have checked in */

399 wait_for_rt_churn_threads();

400 }

401

402 static void

403 join_rt_churn_threads(void)

404 {

405 /* Rejoin rt churn threads */

         for (uint32_t i = 0; i < g_rt_churn_count; i++) {

                 errno_t err = pthread_join(g_rt_churn_threads[i], NULL);

408 if (err) {

                         errc(EX_OSERR, err, "pthread_join %d", i);

410 }

411 }

412 }

413

414 /*

415 * Figure out what thread policy to use

416 */

417 static my_policy_type_t

 parse_thread_policy(const char *str)

419 {

         if (strcmp(str, "timeshare") == 0) {

421 return MY_POLICY_TIMESHARE;

         } else if (strcmp(str, "timeshare_no_smt") == 0) {

423 return MY_POLICY_TIMESHARE_NO_SMT;

         } else if (strcmp(str, "realtime") == 0) {

425 return MY_POLICY_REALTIME;

         } else if (strcmp(str, "fixed") == 0) {

427 return MY_POLICY_FIXEDPRI;

428 } else {

                 errx(EX_USAGE, "Invalid thread policy \"%s\"", str);

430 }

431 }

432

433 /*

434 * Figure out what wakeup pattern to use

435 */

436 static wake_type_t

 parse_wakeup_pattern(const char *str)

438 {

         if (strcmp(str, "chain") == 0) {

440 return WAKE_CHAIN;

         } else if (strcmp(str, "hop") == 0) {

442 return WAKE_HOP;

         } else if (strcmp(str, "broadcast-single-sem") == 0) {

444 return WAKE_BROADCAST_ONESEM;

         } else if (strcmp(str, "broadcast-per-thread") == 0) {

446 return WAKE_BROADCAST_PERTHREAD;

447 } else {

                 errx(EX_USAGE, "Invalid wakeup pattern \"%s\"", str);

449 }

450 }

451

452 /*

453 * Set policy

454 */

455 static int

456 thread_setup(uint32_t my_id)

457 {

458 kern_return_t kr;

459 errno_t ret;

460 thread_time_constraint_policy_data_t pol;

461

462 if (g_priority) {

463 int policy = SCHED_OTHER;

464 if (g_policy == MY_POLICY_FIXEDPRI) {

465 policy = SCHED_RR;

466 }

467

                 struct sched_param param = {.sched_priority = (int)g_priority};

                 if ((ret = pthread_setschedparam(pthread_self(), policy, &param))) {

                         errc(EX_OSERR, ret, "pthread_setschedparam: %d", my_id);

471 }

472 }

473

474 switch (g_policy) {

475 case MY_POLICY_TIMESHARE:

476 break;

477 case MY_POLICY_TIMESHARE_NO_SMT:

478 proc_setthread_no_smt();

479 break;

480 case MY_POLICY_REALTIME:

481 /* Hard-coded realtime parameters (similar to what Digi uses) */

482 pol.period = 100000;

483 if (g_rt_ll) {

                         pol.constraint  = (uint32_t) nanos_to_abs(LL_CONSTRAINT_NANOS);

                         pol.computation = (uint32_t) nanos_to_abs(LL_COMPUTATION_NANOS);

486 } else {

                         pol.constraint  = (uint32_t) nanos_to_abs(CONSTRAINT_NANOS);

                         pol.computation = (uint32_t) nanos_to_abs(COMPUTATION_NANOS);

489 }

                 pol.preemptible = 0;         /* Ignored by OS */

491

                 kr = thread_policy_set(mach_thread_self(), THREAD_TIME_CONSTRAINT_POLICY,

493 (thread_policy_t) &pol, THREAD_TIME_CONSTRAINT_POLICY_COUNT);

494 mach_assert_zero_t(my_id, kr);

495 break;

496 case MY_POLICY_FIXEDPRI:

497 ret = pthread_set_fixedpriority_self();

498 if (ret) {

                         errc(EX_OSERR, ret, "pthread_set_fixedpriority_self");

500 }

501 break;

502 default:

                 errx(EX_USAGE, "invalid policy type %d", g_policy);

504 }

505

506 if (g_do_affinity) {

507 thread_affinity_policy_data_t affinity;

508

                 affinity.affinity_tag = my_id % 2;

510

                 kr = thread_policy_set(mach_thread_self(), THREAD_AFFINITY_POLICY,

512 (thread_policy_t)&affinity, THREAD_AFFINITY_POLICY_COUNT);

513 mach_assert_zero_t(my_id, kr);

514 }

515

516 return 0;

517 }

518

519 time_value_t

520 get_thread_runtime(void)

521 {

522 thread_basic_info_data_t info;

523 mach_msg_type_number_t info_count = THREAD_BASIC_INFO_COUNT;

         thread_info(pthread_mach_thread_np(pthread_self()), THREAD_BASIC_INFO, (thread_info_t)&info, &info_count);

525

         time_value_add(&info.user_time, &info.system_time);

527

528 return info.user_time;

529 }

530

531 time_value_t worker_threads_total_runtime = {};

532

533 /*

534 * Wait for a wakeup, potentially wake up another of the "0-N" threads,

535 * and notify the main thread when done.

536 */

537 static void*

 worker_thread(void *arg)

539 {

540 static os_unfair_lock runtime_lock = OS_UNFAIR_LOCK_INIT;

541

         uint32_t my_id = (uint32_t)(uintptr_t)arg;

543 kern_return_t kr;

544

         volatile double x = 0.0;

         volatile double y = 0.0;

547

548 /* Set policy and so forth */

549 thread_setup(my_id);

550

         for (uint32_t i = 0; i < g_iterations; i++) {

                 if (my_id == 0) {

553 /*

554 * Leader thread either wakes everyone up or starts the chain going.

555 */

556

557 /* Give the worker threads undisturbed time to finish before waiting on them */

558 if (g_do_sleep) {

559 usleep(g_iteration_sleeptime_us);

560 }

561

                         debug_log("%d Leader thread wait for ready\n", i);

563

564 /*

565 * Wait for everyone else to declare ready

566 * Is there a better way to do this that won't interfere with the rest of the chain?

567 * TODO: Invent 'semaphore wait for N signals'

568 */

569

                         for (uint32_t j = 0; j < g_numthreads - 1; j++) {

571 kr = semaphore_wait(g_readysem);

572 mach_assert_zero_t(my_id, kr);

573 }

574

                         debug_log("%d Leader thread wait\n", i);

576

                         if (i > 0) {

                                 for (int cpuid = 0; cpuid < g_numcpus; cpuid++) {

                                         if (g_cpu_histogram[cpuid].current == 1) {

                                                 atomic_fetch_or_explicit(&g_cpu_map[i - 1], (1UL << cpuid), memory_order_relaxed);

                                                 g_cpu_histogram[cpuid].current = 0;

582 }

583 }

584 }

585

586 /* Signal main thread and wait for start of iteration */

587

                         kr = semaphore_wait_signal(g_leadersem, g_main_sem);

589 mach_assert_zero_t(my_id, kr);

590

591 g_thread_endtimes_abs[my_id] = mach_absolute_time();

592

                         debug_log("%d Leader thread go\n", i);

594

                         assert_zero_t(my_id, atomic_load_explicit(&g_done_threads, memory_order_relaxed));

596

597 switch (g_waketype) {

598 case WAKE_BROADCAST_ONESEM:

599 kr = semaphore_signal_all(g_broadcastsem);

600 mach_assert_zero_t(my_id, kr);

601 break;

602 case WAKE_BROADCAST_PERTHREAD:

                                 for (uint32_t j = 1; j < g_numthreads; j++) {

                                         kr = semaphore_signal(g_semarr[j]);

605 mach_assert_zero_t(my_id, kr);

606 }

607 break;

608 case WAKE_CHAIN:

                                 kr = semaphore_signal(g_semarr[my_id + 1]);

610 mach_assert_zero_t(my_id, kr);

611 break;

612 case WAKE_HOP:

                                 kr = semaphore_wait_signal(g_donesem, g_semarr[my_id + 1]);

614 mach_assert_zero_t(my_id, kr);

615 break;

616 }

617 } else {

618 /*

619 * Everyone else waits to be woken up,

620 * records when she wakes up, and possibly

621 * wakes up a friend.

622 */

623 switch (g_waketype) {

624 case WAKE_BROADCAST_ONESEM:

                                 kr = semaphore_wait_signal(g_broadcastsem, g_readysem);

626 mach_assert_zero_t(my_id, kr);

627

628 g_thread_endtimes_abs[my_id] = mach_absolute_time();

629 break;

630

631 case WAKE_BROADCAST_PERTHREAD:

                                 kr = semaphore_wait_signal(g_semarr[my_id], g_readysem);

633 mach_assert_zero_t(my_id, kr);

634

635 g_thread_endtimes_abs[my_id] = mach_absolute_time();

636 break;

637

638 case WAKE_CHAIN:

                                 kr = semaphore_wait_signal(g_semarr[my_id], g_readysem);

640 mach_assert_zero_t(my_id, kr);

641

642 /* Signal the next thread *after* recording wake time */

643

644 g_thread_endtimes_abs[my_id] = mach_absolute_time();

645

                                 if (my_id < (g_numthreads - 1)) {

                                         kr = semaphore_signal(g_semarr[my_id + 1]);

648 mach_assert_zero_t(my_id, kr);

649 }

650

651 break;

652

653 case WAKE_HOP:

                                 kr = semaphore_wait_signal(g_semarr[my_id], g_readysem);

655 mach_assert_zero_t(my_id, kr);

656

657 /* Signal the next thread *after* recording wake time */

658

659 g_thread_endtimes_abs[my_id] = mach_absolute_time();

660

                                 if (my_id < (g_numthreads - 1)) {

                                         kr = semaphore_wait_signal(g_donesem, g_semarr[my_id + 1]);

663 mach_assert_zero_t(my_id, kr);

664 } else {

665 kr = semaphore_signal_all(g_donesem);

666 mach_assert_zero_t(my_id, kr);

667 }

668

669 break;

670 }

671 }

672

673 unsigned int cpuid = _os_cpu_number();

674 assert(cpuid < g_numcpus);

                 debug_log("Thread %p woke up on CPU %d for iteration %d.\n", pthread_self(), cpuid, i);

                 g_cpu_histogram[cpuid].current = 1;

677 g_cpu_histogram[cpuid].accum++;

678

                 if (g_do_one_long_spin && g_one_long_spin_id == my_id) {

680 /* One randomly chosen thread holds up the train for a while. */

681

682 uint64_t endspin = g_starttime_abs + g_one_long_spin_length_abs;

                         while (mach_absolute_time() < endspin) {

                                 y = y + 1.5 + x;

685 x = sqrt(y);

686 }

687 }

688

689 if (g_do_each_spin) {

690 /* Each thread spins for a certain duration after waking up before blocking again. */

691

                         uint64_t endspin = mach_absolute_time() + g_each_spin_duration_abs;

                         while (mach_absolute_time() < endspin) {

                                 y = y + 1.5 + x;

695 x = sqrt(y);

696 }

697 }

698

699 uint32_t done_threads;

                 done_threads = atomic_fetch_add_explicit(&g_done_threads, 1, memory_order_relaxed) + 1;

701

                 debug_log("Thread %p new value is %d, iteration %d\n", pthread_self(), done_threads, i);

703

704 if (g_drop_priority) {

705 /* Drop priority to BG momentarily */

                         errno_t ret = setpriority(PRIO_DARWIN_THREAD, 0, PRIO_DARWIN_BG);

707 if (ret) {

                                 errc(EX_OSERR, ret, "setpriority PRIO_DARWIN_BG");

709 }

710 }

711

712 if (g_do_all_spin) {

713 /* Everyone spins until the last thread checks in. */

714

                         while (atomic_load_explicit(&g_done_threads, memory_order_relaxed) < g_numthreads) {

                                 y = y + 1.5 + x;

717 x = sqrt(y);

718 }

719 }

720

721 if (g_drop_priority) {

722 /* Restore normal priority */

                         errno_t ret = setpriority(PRIO_DARWIN_THREAD, 0, 0);

724 if (ret) {

                                 errc(EX_OSERR, ret, "setpriority 0");

726 }

727 }

728

                 debug_log("Thread %p done spinning, iteration %d\n", pthread_self(), i);

730 }

731

         if (my_id == 0) {

733 /* Give the worker threads undisturbed time to finish before waiting on them */

734 if (g_do_sleep) {

735 usleep(g_iteration_sleeptime_us);

736 }

737

738 /* Wait for the worker threads to finish */

                 for (uint32_t i = 0; i < g_numthreads - 1; i++) {

740 kr = semaphore_wait(g_readysem);

741 mach_assert_zero_t(my_id, kr);

742 }

743

744 /* Tell everyone and the main thread that the last iteration is done */

                 debug_log("%d Leader thread done\n", g_iterations - 1);

746

                 for (int cpuid = 0; cpuid < g_numcpus; cpuid++) {

                         if (g_cpu_histogram[cpuid].current == 1) {

                                 atomic_fetch_or_explicit(&g_cpu_map[g_iterations - 1], (1UL << cpuid), memory_order_relaxed);

                                 g_cpu_histogram[cpuid].current = 0;

751 }

752 }

753

754 kr = semaphore_signal_all(g_main_sem);

755 mach_assert_zero_t(my_id, kr);

756 } else {

757 /* Hold up thread teardown so it doesn't affect the last iteration */

                 kr = semaphore_wait_signal(g_main_sem, g_readysem);

759 mach_assert_zero_t(my_id, kr);

760 }

761

762 time_value_t runtime = get_thread_runtime();

763 os_unfair_lock_lock(&runtime_lock);

764 time_value_add(&worker_threads_total_runtime, &runtime);

765 os_unfair_lock_unlock(&runtime_lock);

766

767 return 0;

768 }

769

770 /*

771 * Given an array of uint64_t values, compute average, max, min, and standard deviation

772 */

773 static void

 compute_stats(uint64_t *values, uint64_t count, float *averagep, uint64_t *maxp, uint64_t *minp, float *stddevp)

775 {

776 uint32_t i;

777 uint64_t _sum = 0;

778 uint64_t _max = 0;

779 uint64_t _min = UINT64_MAX;

780 float _avg = 0;

781 float _dev = 0;

782

         for (i = 0; i < count; i++) {

784 _sum += values[i];

                 _max = values[i] > _max ? values[i] : _max;

                 _min = values[i] < _min ? values[i] : _min;

787 }

788

         _avg = ((float)_sum) / ((float)count);

790

791 _dev = 0;

         for (i = 0; i < count; i++) {

                 _dev += powf((((float)values[i]) - _avg), 2);

794 }

795

796 _dev /= count;

797 _dev = sqrtf(_dev);

798

799 *averagep = _avg;

800 *maxp = _max;

801 *minp = _min;

802 *stddevp = _dev;

803 }

804

805 typedef struct {

806 natural_t sys;

807 natural_t user;

808 natural_t idle;

809 } cpu_time_t;

810

811 void

812 record_cpu_time(cpu_time_t *cpu_time)

813 {

814 host_cpu_load_info_data_t load;

815 mach_msg_type_number_t count = HOST_CPU_LOAD_INFO_COUNT;

         kern_return_t kr = host_statistics(mach_host_self(), HOST_CPU_LOAD_INFO, (int *)&load, &count);

         mach_assert_zero_t(0, kr);

818

819 natural_t total_system_time = load.cpu_ticks[CPU_STATE_SYSTEM];

         natural_t total_user_time = load.cpu_ticks[CPU_STATE_USER] + load.cpu_ticks[CPU_STATE_NICE];

821 natural_t total_idle_time = load.cpu_ticks[CPU_STATE_IDLE];

822

823 cpu_time->sys = total_system_time;

824 cpu_time->user = total_user_time;

825 cpu_time->idle = total_idle_time;

826 }

827

828 int

 main(int argc, char **argv)

830 {

831 errno_t ret;

832 kern_return_t kr;

833

834 pthread_t *threads;

835 uint64_t *worst_latencies_ns;

836 uint64_t *worst_latencies_from_first_ns;

837 uint64_t max, min;

838 float avg, stddev;

839

840 bool test_fail = false;

841 bool test_warn = false;

842

         for (int i = 0; i < argc; i++) {

                 if (strcmp(argv[i], "--switched_apptype") == 0) {

845 g_seen_apptype = TRUE;

846 }

847 }

848

849 if (!g_seen_apptype) {

850 selfexec_with_apptype(argc, argv);

851 }

852

853 parse_args(argc, argv);

854

         srand((unsigned int)time(NULL));

856

857 mach_timebase_info(&g_mti);

858

859 #if TARGET_OS_OSX

860 /* SKIP test if running on arm platform */

861 if (g_run_on_intel_only) {

862 int is_arm = 0;

                 size_t is_arm_size = sizeof(is_arm);

                 ret = sysctlbyname("hw.optional.arm64", &is_arm, &is_arm_size, NULL, 0);

                 if (ret == 0 && is_arm) {

                         printf("Unsupported platform. Skipping test.\n");

867 exit(0);

868 }

869 }

870 #endif /* TARGET_OS_OSX */

871

         size_t ncpu_size = sizeof(g_numcpus);

         ret = sysctlbyname("hw.ncpu", &g_numcpus, &ncpu_size, NULL, 0);

874 if (ret) {

                 err(EX_OSERR, "Failed sysctlbyname(hw.ncpu)");

876 }

         assert(g_numcpus <= 64); /* g_cpu_map needs to be extended for > 64 cpus */

878

         size_t physicalcpu_size = sizeof(g_nphysicalcpu);

         ret = sysctlbyname("hw.physicalcpu", &g_nphysicalcpu, &physicalcpu_size, NULL, 0);

881 if (ret) {

                 err(EX_OSERR, "Failed sysctlbyname(hw.physicalcpu)");

883 }

884

         size_t logicalcpu_size = sizeof(g_nlogicalcpu);

         ret = sysctlbyname("hw.logicalcpu", &g_nlogicalcpu, &logicalcpu_size, NULL, 0);

887 if (ret) {

                 err(EX_OSERR, "Failed sysctlbyname(hw.logicalcpu)");

889 }

890

891 if (g_test_rt) {

                 if (g_numthreads == 0) {

893 g_numthreads = g_numcpus;

894 }

895 g_policy = MY_POLICY_REALTIME;

896 g_do_all_spin = TRUE;

897 g_histogram = true;

898 /* Don't change g_traceworthy_latency_ns if it's explicity been set to something other than the default */

899 if (g_traceworthy_latency_ns == TRACEWORTHY_NANOS) {

900 g_traceworthy_latency_ns = TRACEWORTHY_NANOS_TEST;

901 }

902 } else if (g_test_rt_smt) {

                 if (g_nlogicalcpu != 2 * g_nphysicalcpu) {

904 /* Not SMT */

                         printf("Attempt to run --test-rt-smt on a non-SMT device\n");

906 exit(0);

907 }

908

                 if (g_numthreads == 0) {

910 g_numthreads = g_nphysicalcpu;

911 }

912 g_policy = MY_POLICY_REALTIME;

913 g_do_all_spin = TRUE;

914 g_histogram = true;

915 } else if (g_test_rt_avoid0) {

916 #if defined(__x86_64__) || defined(__i386__)

                 if (g_numthreads == 0) {

918 g_numthreads = g_nphysicalcpu - 1;

919 }

                 if (g_numthreads == 0) {

                         printf("Attempt to run --test-rt-avoid0 on a uniprocessor\n");

922 exit(0);

923 }

924 g_policy = MY_POLICY_REALTIME;

925 g_do_all_spin = TRUE;

926 g_histogram = true;

927 #else

                 printf("Attempt to run --test-rt-avoid0 on a non-Intel device\n");

929 exit(0);

930 #endif

         } else if (g_numthreads == 0) {

932 g_numthreads = g_numcpus;

933 }

934

935 if (g_do_each_spin) {

936 g_each_spin_duration_abs = nanos_to_abs(g_each_spin_duration_ns);

937 }

938

939 /* Configure the long-spin thread to take up half of its computation */

940 if (g_do_one_long_spin) {

941 g_one_long_spin_length_ns = COMPUTATION_NANOS / 2;

942 g_one_long_spin_length_abs = nanos_to_abs(g_one_long_spin_length_ns);

943 }

944

945 /* Estimate the amount of time the cleanup phase needs to back off */

946 g_iteration_sleeptime_us = g_numthreads * 20;

947

         uint32_t threads_per_core = (g_numthreads / g_numcpus) + 1;

949 if (g_do_each_spin) {

950 g_iteration_sleeptime_us += threads_per_core * (g_each_spin_duration_ns / NSEC_PER_USEC);

951 }

952 if (g_do_one_long_spin) {

953 g_iteration_sleeptime_us += g_one_long_spin_length_ns / NSEC_PER_USEC;

954 }

955

956 /* Arrays for threads and their wakeup times */

         threads = (pthread_t*) valloc(sizeof(pthread_t) * g_numthreads);

958 assert(threads);

959

         size_t endtimes_size = sizeof(uint64_t) * g_numthreads;

961

         g_thread_endtimes_abs = (uint64_t*) valloc(endtimes_size);

963 assert(g_thread_endtimes_abs);

964

965 /* Ensure the allocation is pre-faulted */

         ret = memset_s(g_thread_endtimes_abs, endtimes_size, 0, endtimes_size);

967 if (ret) {

                 errc(EX_OSERR, ret, "memset_s endtimes");

969 }

970

         size_t latencies_size = sizeof(uint64_t) * g_iterations;

972

         worst_latencies_ns = (uint64_t*) valloc(latencies_size);

974 assert(worst_latencies_ns);

975

976 /* Ensure the allocation is pre-faulted */

         ret = memset_s(worst_latencies_ns, latencies_size, 0, latencies_size);

978 if (ret) {

                 errc(EX_OSERR, ret, "memset_s latencies");

980 }

981

         worst_latencies_from_first_ns = (uint64_t*) valloc(latencies_size);

983 assert(worst_latencies_from_first_ns);

984

985 /* Ensure the allocation is pre-faulted */

         ret = memset_s(worst_latencies_from_first_ns, latencies_size, 0, latencies_size);

987 if (ret) {

                 errc(EX_OSERR, ret, "memset_s latencies_from_first");

989 }

990

         size_t histogram_size = sizeof(histogram_t) * g_numcpus;

         g_cpu_histogram = (histogram_t *)valloc(histogram_size);

993 assert(g_cpu_histogram);

994 /* Ensure the allocation is pre-faulted */

         ret = memset_s(g_cpu_histogram, histogram_size, 0, histogram_size);

996 if (ret) {

                 errc(EX_OSERR, ret, "memset_s g_cpu_histogram");

998 }

999

         size_t map_size = sizeof(uint64_t) * g_iterations;

         g_cpu_map = (_Atomic uint64_t *)valloc(map_size);

1002 assert(g_cpu_map);

1003 /* Ensure the allocation is pre-faulted */

         ret = memset_s(g_cpu_map, map_size, 0, map_size);

1005 if (ret) {

                 errc(EX_OSERR, ret, "memset_s g_cpu_map");

1007 }

1008

         kr = semaphore_create(mach_task_self(), &g_main_sem, SYNC_POLICY_FIFO, 0);

1010 mach_assert_zero(kr);

1011

1012 /* Either one big semaphore or one per thread */

1013 if (g_waketype == WAKE_CHAIN ||

1014 g_waketype == WAKE_BROADCAST_PERTHREAD ||

1015 g_waketype == WAKE_HOP) {

                 g_semarr = valloc(sizeof(semaphore_t) * g_numthreads);

1017 assert(g_semarr);

1018

                 for (uint32_t i = 0; i < g_numthreads; i++) {

                         kr = semaphore_create(mach_task_self(), &g_semarr[i], SYNC_POLICY_FIFO, 0);

1021 mach_assert_zero(kr);

1022 }

1023

1024 g_leadersem = g_semarr[0];

1025 } else {

                 kr = semaphore_create(mach_task_self(), &g_broadcastsem, SYNC_POLICY_FIFO, 0);

1027 mach_assert_zero(kr);

                 kr = semaphore_create(mach_task_self(), &g_leadersem, SYNC_POLICY_FIFO, 0);

1029 mach_assert_zero(kr);

1030 }

1031

1032 if (g_waketype == WAKE_HOP) {

                 kr = semaphore_create(mach_task_self(), &g_donesem, SYNC_POLICY_FIFO, 0);

1034 mach_assert_zero(kr);

1035 }

1036

         kr = semaphore_create(mach_task_self(), &g_readysem, SYNC_POLICY_FIFO, 0);

1038 mach_assert_zero(kr);

1039

         kr = semaphore_create(mach_task_self(), &g_rt_churn_sem, SYNC_POLICY_FIFO, 0);

1041 mach_assert_zero(kr);

1042

         kr = semaphore_create(mach_task_self(), &g_rt_churn_start_sem, SYNC_POLICY_FIFO, 0);

1044 mach_assert_zero(kr);

1045

         atomic_store_explicit(&g_done_threads, 0, memory_order_relaxed);

1047

1048 /* Create the threads */

         for (uint32_t i = 0; i < g_numthreads; i++) {

                 ret = pthread_create(&threads[i], NULL, worker_thread, (void*)(uintptr_t)i);

1051 if (ret) {

                         errc(EX_OSERR, ret, "pthread_create %d", i);

1053 }

1054 }

1055

         ret = setpriority(PRIO_DARWIN_ROLE, 0, PRIO_DARWIN_ROLE_UI_FOCAL);

1057 if (ret) {

                 errc(EX_OSERR, ret, "setpriority");

1059 }

1060

1061 thread_setup(0);

1062

1063 g_starttime_abs = mach_absolute_time();

1064

1065 if (g_churn_pri) {

1066 create_churn_threads();

1067 }

1068 if (g_rt_churn) {

1069 create_rt_churn_threads();

1070 }

1071

1072 /* Let everyone get settled */

1073 kr = semaphore_wait(g_main_sem);

1074 mach_assert_zero(kr);

1075

1076 /* Give the system a bit more time to settle */

1077 if (g_do_sleep) {

1078 usleep(g_iteration_sleeptime_us);

1079 }

1080

1081 cpu_time_t start_time;

1082 cpu_time_t finish_time;

1083

1084 record_cpu_time(&start_time);

1085

1086 /* Go! */

         for (uint32_t i = 0; i < g_iterations; i++) {

1088 uint32_t j;

                 uint64_t worst_abs = 0, best_abs = UINT64_MAX;

1090

1091 if (g_do_one_long_spin) {

                         g_one_long_spin_id = (uint32_t)rand() % g_numthreads;

1093 }

1094

1095 if (g_rt_churn) {

1096 start_rt_churn_threads();

1097 usleep(100);

1098 }

1099

                 debug_log("%d Main thread reset\n", i);

1101

                 atomic_store_explicit(&g_done_threads, 0, memory_order_seq_cst);

1103

1104 g_starttime_abs = mach_absolute_time();

1105

1106 /* Fire them off and wait for worker threads to finish */

                 kr = semaphore_wait_signal(g_main_sem, g_leadersem);

1108 mach_assert_zero(kr);

1109

                 debug_log("%d Main thread return\n", i);

1111

                 assert(atomic_load_explicit(&g_done_threads, memory_order_relaxed) == g_numthreads);

1113

1114 if (g_rt_churn) {

1115 wait_for_rt_churn_threads();

1116 }

1117

1118 /*

1119 * We report the worst latencies relative to start time

1120 * and relative to the lead worker thread.

1121 */

                 for (j = 0; j < g_numthreads; j++) {

1123 uint64_t latency_abs;

1124

1125 latency_abs = g_thread_endtimes_abs[j] - g_starttime_abs;

                         worst_abs = worst_abs < latency_abs ? latency_abs : worst_abs;

1127 }

1128

                 worst_latencies_ns[i] = abs_to_nanos(worst_abs);

1130

1131 worst_abs = 0;

                 for (j = 1; j < g_numthreads; j++) {

1133 uint64_t latency_abs;

1134

                         latency_abs = g_thread_endtimes_abs[j] - g_thread_endtimes_abs[0];

                         worst_abs = worst_abs < latency_abs ? latency_abs : worst_abs;

                         best_abs = best_abs > latency_abs ? latency_abs : best_abs;

1138 }

1139

                 worst_latencies_from_first_ns[i] = abs_to_nanos(worst_abs);

1141

1142 /*

1143 * In the event of a bad run, cut a trace point.

1144 */

                 if (worst_latencies_from_first_ns[i] > g_traceworthy_latency_ns) {

1146 /* Ariadne's ad-hoc test signpost */

                         kdebug_trace(ARIADNEDBG_CODE(0, 0), worst_latencies_from_first_ns[i], g_traceworthy_latency_ns, 0, 0);

1148

1149 if (g_verbose) {

                                 printf("Worst on this round was %.2f us.\n", ((float)worst_latencies_from_first_ns[i]) / 1000.0);

1151 }

1152 }

1153

1154 /* Give the system a bit more time to settle */

1155 if (g_do_sleep) {

1156 usleep(g_iteration_sleeptime_us);

1157 }

1158 }

1159

1160 record_cpu_time(&finish_time);

1161

1162 /* Rejoin threads */

         for (uint32_t i = 0; i < g_numthreads; i++) {

                 ret = pthread_join(threads[i], NULL);

1165 if (ret) {

                         errc(EX_OSERR, ret, "pthread_join %d", i);

1167 }

1168 }

1169

1170 if (g_rt_churn) {

1171 join_rt_churn_threads();

1172 }

1173

1174 if (g_churn_pri) {

1175 join_churn_threads();

1176 }

1177

         uint32_t cpu_idle_time = (finish_time.idle - start_time.idle) * 10;

         uint32_t worker_threads_runtime = worker_threads_total_runtime.seconds * 1000 + worker_threads_total_runtime.microseconds / 1000;

1180

         compute_stats(worst_latencies_ns, g_iterations, &avg, &max, &min, &stddev);

         printf("Results (from a stop):\n");

         printf("Max:\t\t%.2f us\n", ((float)max) / 1000.0);

         printf("Min:\t\t%.2f us\n", ((float)min) / 1000.0);

         printf("Avg:\t\t%.2f us\n", avg / 1000.0);

         printf("Stddev:\t\t%.2f us\n", stddev / 1000.0);

1187

         putchar('\n');

1189

         compute_stats(worst_latencies_from_first_ns, g_iterations, &avg, &max, &min, &stddev);

         printf("Results (relative to first thread):\n");

         printf("Max:\t\t%.2f us\n", ((float)max) / 1000.0);

         printf("Min:\t\t%.2f us\n", ((float)min) / 1000.0);

         printf("Avg:\t\t%.2f us\n", avg / 1000.0);

         printf("Stddev:\t\t%.2f us\n", stddev / 1000.0);

1196

1197 #if 0

         for (uint32_t i = 0; i < g_iterations; i++) {

                 printf("Iteration %d: %f us\n", i, worst_latencies_ns[i] / 1000.0);

1200 }

1201 #endif

1202

1203 if (g_histogram) {

                 putchar('\n');

1205

                 for (uint32_t i = 0; i < g_numcpus; i++) {

                         printf("%d\t%d\n", i, g_cpu_histogram[i].accum);

1208 }

1209 }

1210

         if (g_test_rt || g_test_rt_smt || g_test_rt_avoid0) {

1212 #define PRIMARY 0x5555555555555555ULL

1213 #define SECONDARY 0xaaaaaaaaaaaaaaaaULL

1214

1215 int fail_count = 0;

1216

                 for (uint32_t i = 0; i < g_iterations; i++) {

1218 bool secondary = false;

1219 bool fail = false;

1220 uint64_t map = g_cpu_map[i];

1221 if (g_test_rt_smt) {

1222 /* Test for one or more threads running on secondary cores unexpectedly (WARNING) */

1223 secondary = (map & SECONDARY);

1224 /* Test for threads running on both primary and secondary cpus of the same core (FAIL) */

                                 fail = ((map & PRIMARY) & ((map & SECONDARY) >> 1));

1226 } else if (g_test_rt) {

                                 fail = (__builtin_popcountll(map) != g_numthreads) && (worst_latencies_ns[i] > g_traceworthy_latency_ns);

1228 } else if (g_test_rt_avoid0) {

                                 fail = ((map & 0x1) == 0x1);

1230 }

1231 if (secondary || fail) {

                                 printf("Iteration %d: 0x%llx%s%s\n", i, map,

                                     secondary ? " SECONDARY" : "",

                                     fail ? " FAIL" : "");

1235 }

1236 test_warn |= (secondary || fail);

1237 test_fail |= fail;

1238 fail_count += fail;

1239 }

1240

                 if (test_fail && (g_iterations >= 100) && (fail_count <= g_iterations / 100)) {

                         printf("99%% or better success rate\n");

1243 test_fail = 0;

1244 }

1245 }

1246

         if (g_test_rt_smt && (g_each_spin_duration_ns >= 200000) && !test_warn) {

                 printf("cpu_idle_time=%dms worker_threads_runtime=%dms\n", cpu_idle_time, worker_threads_runtime);

                 if (cpu_idle_time < worker_threads_runtime / 4) {

                         printf("FAIL cpu_idle_time unexpectedly small\n");

1251 test_fail = 1;

                 } else if (cpu_idle_time > worker_threads_runtime * 2) {

                         printf("FAIL cpu_idle_time unexpectedly large\n");

1254 test_fail = 1;

1255 }

1256 }

1257

1258 free(threads);

1259 free(g_thread_endtimes_abs);

1260 free(worst_latencies_ns);

1261 free(worst_latencies_from_first_ns);

1262 free(g_cpu_histogram);

1263 free(g_cpu_map);

1264

1265 return test_fail;

1266 }

1267

1268 /*

1269 * WARNING: This is SPI specifically intended for use by launchd to start UI

1270 * apps. We use it here for a test tool only to opt into QoS using the same

1271 * policies. Do not use this outside xnu or libxpc/launchd.

1272 */

1273 static void

 selfexec_with_apptype(int argc, char *argv[])

1275 {

1276 int ret;

1277 posix_spawnattr_t attr;

1278 extern char **environ;

         char *new_argv[argc + 1 + 1 /* NULL */];

1280 int i;

1281 char prog[PATH_MAX];

1282 uint32_t prog_size = PATH_MAX;

1283

         ret = _NSGetExecutablePath(prog, &prog_size);

1285 if (ret) {

                 err(EX_OSERR, "_NSGetExecutablePath");

1287 }

1288

         for (i = 0; i < argc; i++) {

1290 new_argv[i] = argv[i];

1291 }

1292

1293 new_argv[i] = "--switched_apptype";

         new_argv[i + 1] = NULL;

1295

1296 ret = posix_spawnattr_init(&attr);

1297 if (ret) {

                 errc(EX_OSERR, ret, "posix_spawnattr_init");

1299 }

1300

         ret = posix_spawnattr_setflags(&attr, POSIX_SPAWN_SETEXEC);

1302 if (ret) {

                 errc(EX_OSERR, ret, "posix_spawnattr_setflags");

1304 }

1305

         ret = posix_spawnattr_setprocesstype_np(&attr, POSIX_SPAWN_PROC_TYPE_APP_DEFAULT);

1307 if (ret) {

                 errc(EX_OSERR, ret, "posix_spawnattr_setprocesstype_np");

1309 }

1310

         ret = posix_spawn(NULL, prog, NULL, &attr, new_argv, environ);

1312 if (ret) {

                 errc(EX_OSERR, ret, "posix_spawn");

1314 }

1315 }

1316

/*
 * Print the command-line synopsis through errx() and exit with EX_USAGE.
 * Never returns.
 *
 * The option list is kept in step with the longopts table in parse_args();
 * "--switched_apptype" is deliberately not advertised because it is appended
 * internally by selfexec_with_apptype().
 */
static void __attribute__((noreturn))
usage(void)
{
	errx(EX_USAGE, "Usage: %s <threads> <chain | hop | broadcast-single-sem | broadcast-per-thread> "
	    "<realtime | timeshare | timeshare_no_smt | fixed> <iterations>\n\t\t"
	    "[--trace <traceworthy latency in ns>] "
	    "[--verbose] [--spin-one] [--spin-all] [--spin-time <nanos>] [--affinity]\n\t\t"
	    "[--no-sleep] [--drop-priority] [--priority <pri>] [--churn-pri <pri>] [--churn-count <n>]\n\t\t"
	    "[--rt-churn] [--rt-churn-count <n>] [--rt-ll] [--test-rt] [--test-rt-smt] [--test-rt-avoid0]\n\t\t"
	    "[--histogram] [--intel-only] [--help]",
	    getprogname());
}

1331

/* Long-option table in use; parse_args() points this at its table before calling getopt_long(). */
static struct option *g_longopts;
/* Index into g_longopts filled in by getopt_long() for the option just matched. */
static int option_index;

/*
 * Parse the current option argument (the getopt global `optarg`) as an
 * unsigned decimal number.
 *
 * Returns the value as a uint32_t.
 *
 * Exits with EX_USAGE, naming the offending long option, when the argument is
 * empty, has trailing non-digit characters, is negative, or does not fit in
 * 32 bits. Out-of-range and negative values used to be silently truncated by
 * the cast of strtoull()'s result.
 */
static uint32_t
read_dec_arg(void)
{
	char *cp;
	/* char* optarg is a magic global */

	errno = 0;
	unsigned long long arg_val = strtoull(optarg, &cp, 10);

	/*
	 * strtoull() accepts a leading '-' and negates the result, so a minus
	 * sign has to be rejected explicitly.
	 */
	if (cp == optarg || *cp || strchr(optarg, '-') != NULL) {
		errx(EX_USAGE, "arg --%s requires a decimal number, found \"%s\"",
		    g_longopts[option_index].name, optarg);
	}

	if (errno == ERANGE || arg_val > UINT32_MAX) {
		errx(EX_USAGE, "arg --%s value \"%s\" is out of range (maximum %u)",
		    g_longopts[option_index].name, optarg, (unsigned int)UINT32_MAX);
	}

	return (uint32_t)arg_val;
}

1350

1351 static void

 parse_args(int argc, char *argv[])

1353 {

1354 enum {

1355 OPT_GETOPT = 0,

1356 OPT_SPIN_TIME,

1357 OPT_TRACE,

1358 OPT_PRIORITY,

1359 OPT_CHURN_PRI,

1360 OPT_CHURN_COUNT,

1361 OPT_RT_CHURN_COUNT,

1362 };

1363

1364 static struct option longopts[] = {

1365 /* BEGIN IGNORE CODESTYLE */

                 { "spin-time",          required_argument,      NULL,                           OPT_SPIN_TIME },

                 { "trace",              required_argument,      NULL,                           OPT_TRACE     },

                 { "priority",           required_argument,      NULL,                           OPT_PRIORITY  },

                 { "churn-pri",          required_argument,      NULL,                           OPT_CHURN_PRI },

                 { "churn-count",        required_argument,      NULL,                           OPT_CHURN_COUNT },

                 { "rt-churn-count",     required_argument,      NULL,                           OPT_RT_CHURN_COUNT },

                 { "switched_apptype",   no_argument,            (int*)&g_seen_apptype,          TRUE },

                 { "spin-one",           no_argument,            (int*)&g_do_one_long_spin,      TRUE },

                 { "intel-only",         no_argument,            (int*)&g_run_on_intel_only,     TRUE },

                 { "spin-all",           no_argument,            (int*)&g_do_all_spin,           TRUE },

                 { "affinity",           no_argument,            (int*)&g_do_affinity,           TRUE },

                 { "no-sleep",           no_argument,            (int*)&g_do_sleep,              FALSE },

                 { "drop-priority",      no_argument,            (int*)&g_drop_priority,         TRUE },

                 { "test-rt",            no_argument,            (int*)&g_test_rt,               TRUE },

                 { "test-rt-smt",        no_argument,            (int*)&g_test_rt_smt,           TRUE },

                 { "test-rt-avoid0",     no_argument,            (int*)&g_test_rt_avoid0,        TRUE },

                 { "rt-churn",           no_argument,            (int*)&g_rt_churn,              TRUE },

                 { "rt-ll",              no_argument,            (int*)&g_rt_ll,                 TRUE },

                 { "histogram",          no_argument,            (int*)&g_histogram,             TRUE },

                 { "verbose",            no_argument,            (int*)&g_verbose,               TRUE },

                 { "help",               no_argument,            NULL,                           'h' },

                 { NULL,                 0,                      NULL,                           0 }

1388 /* END IGNORE CODESTYLE */

1389 };

1390

1391 g_longopts = longopts;

1392 int ch = 0;

1393

         while ((ch = getopt_long(argc, argv, "h", longopts, &option_index)) != -1) {

1395 switch (ch) {

1396 case OPT_GETOPT:

1397 /* getopt_long set a variable */

1398 break;

1399 case OPT_SPIN_TIME:

1400 g_do_each_spin = TRUE;

1401 g_each_spin_duration_ns = read_dec_arg();

1402 break;

1403 case OPT_TRACE:

1404 g_traceworthy_latency_ns = read_dec_arg();

1405 break;

1406 case OPT_PRIORITY:

1407 g_priority = read_dec_arg();

1408 break;

1409 case OPT_CHURN_PRI:

1410 g_churn_pri = read_dec_arg();

1411 break;

1412 case OPT_CHURN_COUNT:

1413 g_churn_count = read_dec_arg();

1414 break;

1415 case OPT_RT_CHURN_COUNT:

1416 g_rt_churn_count = read_dec_arg();

1417 break;

1418 case '?':

1419 case 'h':

1420 default:

1421 usage();

1422 /* NORETURN */

1423 }

1424 }

1425

1426 /*

1427 * getopt_long reorders all the options to the beginning of the argv array.

1428 * Jump past them to the non-option arguments.

1429 */

1430

1431 argc -= optind;

1432 argv += optind;

1433

         if (argc > 4) {

1435 warnx("Too many non-option arguments passed");

1436 usage();

1437 }

1438

         if (argc != 4) {

1440 warnx("Missing required <threads> <waketype> <policy> <iterations> arguments");

1441 usage();

1442 }

1443

1444 char *cp;

1445

1446 /* How many threads? */

         g_numthreads = (uint32_t)strtoull(argv[0], &cp, 10);

1448

         if (cp == argv[0] || *cp) {

                 errx(EX_USAGE, "numthreads requires a decimal number, found \"%s\"", argv[0]);

1451 }

1452

1453 /* What wakeup pattern? */

         g_waketype = parse_wakeup_pattern(argv[1]);

1455

1456 /* Policy */

         g_policy = parse_thread_policy(argv[2]);

1458

1459 /* Iterations */

         g_iterations = (uint32_t)strtoull(argv[3], &cp, 10);

1461

         if (cp == argv[3] || *cp) {

                 errx(EX_USAGE, "numthreads requires a decimal number, found \"%s\"", argv[3]);

1464 }

1465

         if (g_iterations < 1) {

                 errx(EX_USAGE, "Must have at least one iteration");

1468 }

1469

         if (g_numthreads == 1 && g_waketype == WAKE_CHAIN) {

                 errx(EX_USAGE, "chain mode requires more than one thread");

1472 }

1473

         if (g_numthreads == 1 && g_waketype == WAKE_HOP) {

                 errx(EX_USAGE, "hop mode requires more than one thread");

1476 }

1477 }