]> git.saurik.com Git - apple/xnu.git/blob - tools/tests/MPMMTest/MPMMtest.c
xnu-6153.141.1.tar.gz
[apple/xnu.git] / tools / tests / MPMMTest / MPMMtest.c
#include <AvailabilityMacros.h>
#include <mach/thread_policy.h>

#include <pthread.h>
#include <stdio.h>
#include <stdlib.h>
#include <libgen.h>
#include <limits.h>
#include <string.h>
#include <err.h>
#include <unistd.h>

#include <pthread.h>
#include <mach/mach.h>
#include <mach/mach_error.h>
#include <mach/mach_time.h>
#include <mach/notify.h>
#include <servers/bootstrap.h>
#include <sys/types.h>
#include <sys/time.h>
#include <sys/signal.h>
#include <errno.h>
#include "../unit_tests/tests_common.h" /* for record_perf_data() */

#include <libkern/OSAtomic.h>
25
/* Larger of A and B.  Each argument may be evaluated more than once. */
#define MAX(A, B) ((B) > (A) ? (B) : (A))
27
28
29 typedef struct {
30 mach_msg_header_t header;
31 mach_msg_trailer_t trailer; // subtract this when sending
32 } ipc_trivial_message;
33
34 typedef struct {
35 mach_msg_header_t header;
36 u_int32_t numbers[0];
37 mach_msg_trailer_t trailer; // subtract this when sending
38 } ipc_inline_message;
39
40 typedef struct {
41 mach_msg_header_t header;
42 mach_msg_body_t body;
43 mach_msg_ool_descriptor_t descriptor;
44 mach_msg_trailer_t trailer; // subtract this when sending
45 } ipc_complex_message;
46
/* Values stored in the global `msg_type` (selected with -type). */
enum {
	msg_type_trivial,       /* 0 */
	msg_type_inline,        /* 1 */
	msg_type_complex        /* 2 */
};
52
53 struct port_args {
54 int server_num;
55 int req_size;
56 mach_msg_header_t *req_msg;
57 int reply_size;
58 mach_msg_header_t *reply_msg;
59 mach_port_t port;
60 mach_port_t rcv_set;
61
62 mach_port_t *set;
63 mach_port_t *port_list;
64 };
65
/*
 * Handle for a spawned worker: a pid when workers are forked processes,
 * a pthread_t when they are threads (see thread_spawn/thread_join).
 */
typedef union {
	pid_t           pid;
	pthread_t       tid;
} thread_id_t;
70
71 /* Global options */
72 static int verbose = 0;
73 static boolean_t affinity = FALSE;
74 static boolean_t timeshare = FALSE;
75 static boolean_t threaded = FALSE;
76 static boolean_t oneway = FALSE;
77 static boolean_t useset = FALSE;
78 static boolean_t save_perfdata = FALSE;
79 int msg_type;
80 int num_ints;
81 int num_msgs;
82 int num_clients;
83 int num_servers;
84 int client_delay;
85 int client_spin;
86 int client_pages;
87 int portcount = 1;
88 int setcount = 0;
89 boolean_t stress_prepost = FALSE;
90 char **server_port_name;
91
92 struct port_args *server_port_args;
93
94 /* global data */
95 mach_timebase_info_data_t g_timebase;
96 int64_t g_client_send_time = 0;
97
98 static inline uint64_t
99 ns_to_abs(uint64_t ns)
100 {
101 return ns * g_timebase.denom / g_timebase.numer;
102 }
103
104 static inline uint64_t
105 abs_to_ns(uint64_t abs)
106 {
107 return abs * g_timebase.numer / g_timebase.denom;
108 }
109
110
/* Signal handler that intentionally does nothing (installed for SIGINT in main). */
void
signal_handler(int sig)
{
	(void)sig;
}
115
/*
 * Print the command-line help to stderr and terminate the process with
 * exit status 1.  Never returns.
 *
 * progname: program name shown on the usage line.
 *
 * The option list and the defaults below are kept in step with
 * parse_args(): the spin option is spelled "-spin", the default message
 * type is trivial, and the default server count is avail_cpus / 2 with a
 * minimum of one.
 */
void
usage(const char *progname)
{
	fprintf(stderr, "usage: %s [options]\n", progname);
	fprintf(stderr, "where options are:\n");
	fprintf(stderr, " -affinity\t\tthreads use affinity\n");
	fprintf(stderr, " -timeshare\t\tthreads use timeshare\n");
	fprintf(stderr, " -threaded\t\tuse (p)threads\n");
	fprintf(stderr, " -verbose\t\tbe verbose (use multiple times to increase verbosity)\n");
	fprintf(stderr, " -oneway\t\tdo not request return reply\n");
	fprintf(stderr, " -count num\t\tnumber of messages to send\n");
	fprintf(stderr, " -perf \t\tCreate perfdata files for metrics.\n");
	fprintf(stderr, " -type trivial|inline|complex\ttype of messages to send\n");
	fprintf(stderr, " -numints num\tnumber of 32-bit ints to send in messages\n");
	fprintf(stderr, " -servers num\tnumber of server threads to run\n");
	fprintf(stderr, " -clients num\tnumber of clients per server\n");
	fprintf(stderr, " -delay num\t\tmicroseconds to sleep clients between messages\n");
	fprintf(stderr, " -spin num\t\tmicroseconds of client work\n");
	fprintf(stderr, " -pages num\t\tpages of memory touched by client work\n");
	fprintf(stderr, " -set nset num\tcreate [nset] portsets and [num] ports in each server.\n");
	fprintf(stderr, " \tEach port is connected to each set.\n");
	fprintf(stderr, " -prepost\t\tstress the prepost system (implies -threaded, requires -set X Y)\n");
	fprintf(stderr, "default values are:\n");
	fprintf(stderr, " . no affinity\n");
	fprintf(stderr, " . not timeshare\n");
	fprintf(stderr, " . not threaded\n");
	fprintf(stderr, " . not verbose\n");
	fprintf(stderr, " . not oneway\n");
	fprintf(stderr, " . client sends 100000 messages\n");
	fprintf(stderr, " . trivial message type\n");
	fprintf(stderr, " . 64 32-bit integers in inline/complex messages\n");
	fprintf(stderr, " . num_available_processors/2 servers (at least 1)\n");
	fprintf(stderr, " . 4 clients per server\n");
	fprintf(stderr, " . no delay\n");
	fprintf(stderr, " . no sets / extra ports\n");
	fprintf(stderr, " . no prepost stress\n");
	exit(1);
}
154
155 void
156 parse_args(int argc, char *argv[])
157 {
158 host_basic_info_data_t info;
159 mach_msg_type_number_t count;
160 kern_return_t result;
161
162 /* Initialize defaults */
163 msg_type = msg_type_trivial;
164 num_ints = 64;
165 num_msgs = 100000;
166 client_delay = 0;
167 num_clients = 4;
168
169 count = HOST_BASIC_INFO_COUNT;
170 result = host_info(mach_host_self(), HOST_BASIC_INFO,
171 (host_info_t)&info, &count);
172 if (result == KERN_SUCCESS && info.avail_cpus > 1) {
173 num_servers = info.avail_cpus / 2;
174 } else {
175 num_servers = 1;
176 }
177
178 const char *progname = argv[0];
179 argc--; argv++;
180 while (0 < argc) {
181 if (0 == strcmp("-verbose", argv[0])) {
182 verbose++;
183 argc--; argv++;
184 } else if (0 == strcmp("-affinity", argv[0])) {
185 affinity = TRUE;
186 argc--; argv++;
187 } else if (0 == strcmp("-timeshare", argv[0])) {
188 timeshare = TRUE;
189 argc--; argv++;
190 } else if (0 == strcmp("-threaded", argv[0])) {
191 threaded = TRUE;
192 argc--; argv++;
193 } else if (0 == strcmp("-oneway", argv[0])) {
194 oneway = TRUE;
195 argc--; argv++;
196 } else if (0 == strcmp("-perf", argv[0])) {
197 save_perfdata = TRUE;
198 argc--; argv++;
199 } else if (0 == strcmp("-type", argv[0])) {
200 if (argc < 2) {
201 usage(progname);
202 }
203 if (0 == strcmp("trivial", argv[1])) {
204 msg_type = msg_type_trivial;
205 } else if (0 == strcmp("inline", argv[1])) {
206 msg_type = msg_type_inline;
207 } else if (0 == strcmp("complex", argv[1])) {
208 msg_type = msg_type_complex;
209 } else {
210 usage(progname);
211 }
212 argc -= 2; argv += 2;
213 } else if (0 == strcmp("-numints", argv[0])) {
214 if (argc < 2) {
215 usage(progname);
216 }
217 num_ints = strtoul(argv[1], NULL, 0);
218 argc -= 2; argv += 2;
219 } else if (0 == strcmp("-count", argv[0])) {
220 if (argc < 2) {
221 usage(progname);
222 }
223 num_msgs = strtoul(argv[1], NULL, 0);
224 argc -= 2; argv += 2;
225 } else if (0 == strcmp("-clients", argv[0])) {
226 if (argc < 2) {
227 usage(progname);
228 }
229 num_clients = strtoul(argv[1], NULL, 0);
230 argc -= 2; argv += 2;
231 } else if (0 == strcmp("-servers", argv[0])) {
232 if (argc < 2) {
233 usage(progname);
234 }
235 num_servers = strtoul(argv[1], NULL, 0);
236 argc -= 2; argv += 2;
237 } else if (0 == strcmp("-delay", argv[0])) {
238 if (argc < 2) {
239 usage(progname);
240 }
241 client_delay = strtoul(argv[1], NULL, 0);
242 argc -= 2; argv += 2;
243 } else if (0 == strcmp("-spin", argv[0])) {
244 if (argc < 2) {
245 usage(progname);
246 }
247 client_spin = strtoul(argv[1], NULL, 0);
248 argc -= 2; argv += 2;
249 } else if (0 == strcmp("-pages", argv[0])) {
250 if (argc < 2) {
251 usage(progname);
252 }
253 client_pages = strtoul(argv[1], NULL, 0);
254 argc -= 2; argv += 2;
255 } else if (0 == strcmp("-set", argv[0])) {
256 if (argc < 3) {
257 usage(progname);
258 }
259 setcount = strtoul(argv[1], NULL, 0);
260 portcount = strtoul(argv[2], NULL, 0);
261 if (setcount <= 0 || portcount <= 0) {
262 usage(progname);
263 }
264 useset = TRUE;
265 argc -= 3; argv += 3;
266 } else if (0 == strcmp("-prepost", argv[0])) {
267 stress_prepost = TRUE;
268 threaded = TRUE;
269 argc--; argv++;
270 } else {
271 fprintf(stderr, "unknown option '%s'\n", argv[0]);
272 usage(progname);
273 }
274 }
275
276 if (stress_prepost) {
277 if (!threaded) {
278 fprintf(stderr, "Prepost stress test _must_ be threaded\n");
279 exit(1);
280 }
281 if (portcount < 1 || setcount < 1) {
282 fprintf(stderr, "Prepost stress test requires >= 1 port in >= 1 set.\n");
283 exit(1);
284 }
285 }
286 }
287
288 void
289 setup_server_ports(struct port_args *ports)
290 {
291 kern_return_t ret = 0;
292 mach_port_t bsport;
293 mach_port_t port;
294
295 ports->req_size = MAX(sizeof(ipc_inline_message) +
296 sizeof(u_int32_t) * num_ints,
297 sizeof(ipc_complex_message));
298 ports->reply_size = sizeof(ipc_trivial_message) -
299 sizeof(mach_msg_trailer_t);
300 ports->req_msg = malloc(ports->req_size);
301 ports->reply_msg = malloc(ports->reply_size);
302 if (setcount > 0) {
303 ports->set = (mach_port_t *)calloc(sizeof(mach_port_t), setcount);
304 if (!ports->set) {
305 fprintf(stderr, "calloc(%lu, %d) failed!\n", sizeof(mach_port_t), setcount);
306 exit(1);
307 }
308 }
309 if (stress_prepost) {
310 ports->port_list = (mach_port_t *)calloc(sizeof(mach_port_t), portcount);
311 if (!ports->port_list) {
312 fprintf(stderr, "calloc(%lu, %d) failed!\n", sizeof(mach_port_t), portcount);
313 exit(1);
314 }
315 }
316
317 if (useset) {
318 mach_port_t set;
319 if (setcount < 1) {
320 fprintf(stderr, "Can't use sets with a setcount of %d\n", setcount);
321 exit(1);
322 }
323
324 for (int ns = 0; ns < setcount; ns++) {
325 ret = mach_port_allocate(mach_task_self(),
326 MACH_PORT_RIGHT_PORT_SET,
327 &ports->set[ns]);
328 if (KERN_SUCCESS != ret) {
329 mach_error("mach_port_allocate(SET): ", ret);
330 exit(1);
331 }
332 if (verbose > 1) {
333 printf("SVR[%d] allocated set[%d] %#x\n",
334 ports->server_num, ns, ports->set[ns]);
335 }
336
337 set = ports->set[ns];
338 }
339
340 /* receive on a port set (always use the first in the chain) */
341 ports->rcv_set = ports->set[0];
342 }
343
344 /* stuff the portset(s) with ports */
345 for (int i = 0; i < portcount; i++) {
346 ret = mach_port_allocate(mach_task_self(),
347 MACH_PORT_RIGHT_RECEIVE,
348 &port);
349 if (KERN_SUCCESS != ret) {
350 mach_error("mach_port_allocate(PORT): ", ret);
351 exit(1);
352 }
353
354 if (stress_prepost) {
355 ports->port_list[i] = port;
356 }
357
358 if (useset) {
359 /* insert the port into _all_ allocated lowest-level sets */
360 for (int ns = 0; ns < setcount; ns++) {
361 if (verbose > 1) {
362 printf("SVR[%d] moving port %#x into set %#x...\n",
363 ports->server_num, port, ports->set[ns]);
364 }
365 ret = mach_port_insert_member(mach_task_self(),
366 port, ports->set[ns]);
367 if (KERN_SUCCESS != ret) {
368 mach_error("mach_port_insert_member(): ", ret);
369 exit(1);
370 }
371 }
372 }
373 }
374
375 /* use the last one as the server's bootstrap port */
376 ports->port = port;
377
378 if (stress_prepost) {
379 /* insert a send right for _each_ port */
380 for (int i = 0; i < portcount; i++) {
381 ret = mach_port_insert_right(mach_task_self(),
382 ports->port_list[i],
383 ports->port_list[i],
384 MACH_MSG_TYPE_MAKE_SEND);
385 if (KERN_SUCCESS != ret) {
386 mach_error("mach_port_insert_right(): ", ret);
387 exit(1);
388 }
389 }
390 } else {
391 ret = mach_port_insert_right(mach_task_self(),
392 ports->port,
393 ports->port,
394 MACH_MSG_TYPE_MAKE_SEND);
395 if (KERN_SUCCESS != ret) {
396 mach_error("mach_port_insert_right(): ", ret);
397 exit(1);
398 }
399 }
400
401 ret = task_get_bootstrap_port(mach_task_self(), &bsport);
402 if (KERN_SUCCESS != ret) {
403 mach_error("task_get_bootstrap_port(): ", ret);
404 exit(1);
405 }
406
407 if (verbose) {
408 printf("server waiting for IPC messages from client on port '%s' (%#x).\n",
409 server_port_name[ports->server_num], ports->port);
410 }
411 ret = bootstrap_register(bsport,
412 server_port_name[ports->server_num],
413 ports->port);
414 if (KERN_SUCCESS != ret) {
415 mach_error("bootstrap_register(): ", ret);
416 exit(1);
417 }
418 }
419
420 void
421 setup_client_ports(struct port_args *ports)
422 {
423 kern_return_t ret = 0;
424 switch (msg_type) {
425 case msg_type_trivial:
426 ports->req_size = sizeof(ipc_trivial_message);
427 break;
428 case msg_type_inline:
429 ports->req_size = sizeof(ipc_inline_message) +
430 sizeof(u_int32_t) * num_ints;
431 break;
432 case msg_type_complex:
433 ports->req_size = sizeof(ipc_complex_message);
434 break;
435 }
436 ports->req_size -= sizeof(mach_msg_trailer_t);
437 ports->reply_size = sizeof(ipc_trivial_message);
438 ports->req_msg = malloc(ports->req_size);
439 ports->reply_msg = malloc(ports->reply_size);
440
441 ret = mach_port_allocate(mach_task_self(),
442 MACH_PORT_RIGHT_RECEIVE,
443 &(ports->port));
444 if (KERN_SUCCESS != ret) {
445 mach_error("mach_port_allocate(): ", ret);
446 exit(1);
447 }
448 if (verbose) {
449 printf("Client sending %d %s IPC messages to port '%s' in %s mode\n",
450 num_msgs, (msg_type == msg_type_inline) ?
451 "inline" : ((msg_type == msg_type_complex) ?
452 "complex" : "trivial"),
453 server_port_name[ports->server_num],
454 (oneway ? "oneway" : "rpc"));
455 }
456 }
457
458
459 static void
460 thread_setup(int tag)
461 {
462 kern_return_t ret;
463 thread_extended_policy_data_t epolicy;
464 thread_affinity_policy_data_t policy;
465
466 if (!timeshare) {
467 epolicy.timeshare = FALSE;
468 ret = thread_policy_set(
469 mach_thread_self(), THREAD_EXTENDED_POLICY,
470 (thread_policy_t) &epolicy,
471 THREAD_EXTENDED_POLICY_COUNT);
472 if (ret != KERN_SUCCESS) {
473 printf("thread_policy_set(THREAD_EXTENDED_POLICY) returned %d\n", ret);
474 }
475 }
476
477 if (affinity) {
478 policy.affinity_tag = tag;
479 ret = thread_policy_set(
480 mach_thread_self(), THREAD_AFFINITY_POLICY,
481 (thread_policy_t) &policy,
482 THREAD_AFFINITY_POLICY_COUNT);
483 if (ret != KERN_SUCCESS) {
484 printf("thread_policy_set(THREAD_AFFINITY_POLICY) returned %d\n", ret);
485 }
486 }
487 }
488
489 void *
490 server(void *serverarg)
491 {
492 int idx;
493 kern_return_t ret;
494 int totalmsg = num_msgs * num_clients;
495 mach_port_t recv_port;
496 uint64_t starttm, endtm;
497
498 int svr_num = (int)(uintptr_t)serverarg;
499 struct port_args *args = &server_port_args[svr_num];
500
501 args->server_num = svr_num;
502 setup_server_ports(args);
503
504 thread_setup(args->server_num + 1);
505
506 recv_port = (useset) ? args->rcv_set : args->port;
507
508 for (idx = 0; idx < totalmsg; idx++) {
509 if (verbose > 2) {
510 printf("server awaiting message %d\n", idx);
511 }
512 ret = mach_msg(args->req_msg,
513 MACH_RCV_MSG | MACH_RCV_INTERRUPT | MACH_RCV_LARGE,
514 0,
515 args->req_size,
516 recv_port,
517 MACH_MSG_TIMEOUT_NONE,
518 MACH_PORT_NULL);
519 if (MACH_RCV_INTERRUPTED == ret) {
520 break;
521 }
522 if (MACH_MSG_SUCCESS != ret) {
523 if (verbose) {
524 printf("mach_msg() ret=%d", ret);
525 }
526 mach_error("mach_msg (receive): ", ret);
527 exit(1);
528 }
529 if (verbose > 2) {
530 printf("server received message %d\n", idx);
531 }
532 if (args->req_msg->msgh_bits & MACH_MSGH_BITS_COMPLEX) {
533 ret = vm_deallocate(mach_task_self(),
534 (vm_address_t)((ipc_complex_message *)args->req_msg)->descriptor.address,
535 ((ipc_complex_message *)args->req_msg)->descriptor.size);
536 }
537
538 if (1 == args->req_msg->msgh_id) {
539 if (verbose > 2) {
540 printf("server sending reply %d\n", idx);
541 }
542 args->reply_msg->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_MOVE_SEND_ONCE, 0);
543 args->reply_msg->msgh_size = args->reply_size;
544 args->reply_msg->msgh_remote_port = args->req_msg->msgh_remote_port;
545 args->reply_msg->msgh_local_port = MACH_PORT_NULL;
546 args->reply_msg->msgh_id = 2;
547 ret = mach_msg(args->reply_msg,
548 MACH_SEND_MSG,
549 args->reply_size,
550 0,
551 MACH_PORT_NULL,
552 MACH_MSG_TIMEOUT_NONE,
553 MACH_PORT_NULL);
554 if (MACH_MSG_SUCCESS != ret) {
555 mach_error("mach_msg (send): ", ret);
556 exit(1);
557 }
558 }
559 }
560
561 if (!useset) {
562 return NULL;
563 }
564
565 if (verbose < 1) {
566 return NULL;
567 }
568
569 uint64_t deltans = 0;
570 /*
571 * If we're using multiple sets, explicitly tear them all down
572 * and measure the time.
573 */
574 for (int ns = 0; ns < setcount; ns++) {
575 if (verbose > 1) {
576 printf("\tTearing down set[%d] %#x...\n", ns, args->set[ns]);
577 }
578 starttm = mach_absolute_time();
579 ret = mach_port_mod_refs(mach_task_self(), args->set[ns], MACH_PORT_RIGHT_PORT_SET, -1);
580 endtm = mach_absolute_time();
581 deltans += abs_to_ns(endtm - starttm);
582 if (ret != KERN_SUCCESS) {
583 mach_error("mach_port_mod_refs(): ", ret);
584 exit(1);
585 }
586 }
587
588 uint64_t nlinks = (uint64_t)setcount * (uint64_t)portcount;
589
590 printf("\tteardown of %llu links took %llu ns\n", nlinks, deltans);
591 printf("\t%lluns per set\n", deltans / (uint64_t)setcount);
592
593 return NULL;
594 }
595
/* Invoke fn exactly `count` times. */
static inline void
client_spin_loop(unsigned count, void(fn)(void))
{
	for (; count != 0; count--) {
		fn();
	}
}
603
604 static long dummy_memory;
605 static long *client_memory = &dummy_memory;
606 static void
607 client_work_atom(void)
608 {
609 static int i;
610
611 if (++i > client_pages * PAGE_SIZE / sizeof(long)) {
612 i = 0;
613 }
614 client_memory[i] = 0;
615 }
616
617 static int calibration_count = 10000;
618 static int calibration_usec;
619 static void *
620 calibrate_client_work(void)
621 {
622 long dummy;
623 struct timeval nowtv;
624 struct timeval warmuptv = { 0, 100 * 1000 }; /* 100ms */
625 struct timeval starttv;
626 struct timeval endtv;
627
628 if (client_spin) {
629 /* Warm-up the stepper first... */
630 gettimeofday(&nowtv, NULL);
631 timeradd(&nowtv, &warmuptv, &endtv);
632 do {
633 client_spin_loop(calibration_count, client_work_atom);
634 gettimeofday(&nowtv, NULL);
635 } while (timercmp(&nowtv, &endtv, < ));
636
637 /* Now do the calibration */
638 while (TRUE) {
639 gettimeofday(&starttv, NULL);
640 client_spin_loop(calibration_count, client_work_atom);
641 gettimeofday(&endtv, NULL);
642 if (endtv.tv_sec - starttv.tv_sec > 1) {
643 calibration_count /= 10;
644 continue;
645 }
646 calibration_usec = endtv.tv_usec - starttv.tv_usec;
647 if (endtv.tv_usec < starttv.tv_usec) {
648 calibration_usec += 1000000;
649 }
650 if (calibration_usec < 1000) {
651 calibration_count *= 10;
652 continue;
653 }
654 calibration_count /= calibration_usec;
655 break;
656 }
657 if (verbose > 1) {
658 printf("calibration_count=%d calibration_usec=%d\n",
659 calibration_count, calibration_usec);
660 }
661 }
662 return NULL;
663 }
664
665 static void *
666 client_work(void)
667 {
668 if (client_spin) {
669 client_spin_loop(calibration_count * client_spin,
670 client_work_atom);
671 }
672
673 if (client_delay) {
674 usleep(client_delay);
675 }
676 return NULL;
677 }
678
679 void *
680 client(void *threadarg)
681 {
682 struct port_args args;
683 struct port_args *svr_args = NULL;
684 int idx;
685 mach_msg_header_t *req, *reply;
686 mach_port_t bsport, servport;
687 kern_return_t ret;
688 int server_num = (int)(uintptr_t)threadarg;
689 void *ints = malloc(sizeof(u_int32_t) * num_ints);
690
691 if (verbose) {
692 printf("client(%d) started, server port name %s\n",
693 server_num, server_port_name[server_num]);
694 }
695
696 args.server_num = server_num;
697 thread_setup(server_num + 1);
698
699 if (stress_prepost) {
700 svr_args = &server_port_args[server_num];
701 }
702
703 /* find server port */
704 ret = task_get_bootstrap_port(mach_task_self(), &bsport);
705 if (KERN_SUCCESS != ret) {
706 mach_error("task_get_bootstrap_port(): ", ret);
707 exit(1);
708 }
709 ret = bootstrap_look_up(bsport,
710 server_port_name[server_num],
711 &servport);
712 if (KERN_SUCCESS != ret) {
713 mach_error("bootstrap_look_up(): ", ret);
714 exit(1);
715 }
716
717 setup_client_ports(&args);
718
719 /* Allocate and touch memory */
720 if (client_pages) {
721 unsigned i;
722 client_memory = (long *) malloc(client_pages * PAGE_SIZE);
723 for (i = 0; i < client_pages; i++) {
724 client_memory[i * PAGE_SIZE / sizeof(long)] = 0;
725 }
726 }
727
728 uint64_t starttm, endtm;
729
730 /* start message loop */
731 for (idx = 0; idx < num_msgs; idx++) {
732 req = args.req_msg;
733 reply = args.reply_msg;
734
735 req->msgh_size = args.req_size;
736 if (stress_prepost) {
737 req->msgh_remote_port = svr_args->port_list[idx % portcount];
738 } else {
739 req->msgh_remote_port = servport;
740 }
741 if (oneway) {
742 req->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_COPY_SEND, 0);
743 req->msgh_local_port = MACH_PORT_NULL;
744 } else {
745 req->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_COPY_SEND,
746 MACH_MSG_TYPE_MAKE_SEND_ONCE);
747 req->msgh_local_port = args.port;
748 }
749 req->msgh_id = oneway ? 0 : 1;
750 if (msg_type == msg_type_complex) {
751 (req)->msgh_bits |= MACH_MSGH_BITS_COMPLEX;
752 ((ipc_complex_message *)req)->body.msgh_descriptor_count = 1;
753 ((ipc_complex_message *)req)->descriptor.address = ints;
754 ((ipc_complex_message *)req)->descriptor.size =
755 num_ints * sizeof(u_int32_t);
756 ((ipc_complex_message *)req)->descriptor.deallocate = FALSE;
757 ((ipc_complex_message *)req)->descriptor.copy = MACH_MSG_VIRTUAL_COPY;
758 ((ipc_complex_message *)req)->descriptor.type = MACH_MSG_OOL_DESCRIPTOR;
759 }
760 if (verbose > 2) {
761 printf("client sending message %d to port %#x\n",
762 idx, req->msgh_remote_port);
763 }
764 starttm = mach_absolute_time();
765 ret = mach_msg(req,
766 MACH_SEND_MSG,
767 args.req_size,
768 0,
769 MACH_PORT_NULL,
770 MACH_MSG_TIMEOUT_NONE,
771 MACH_PORT_NULL);
772 endtm = mach_absolute_time();
773 if (MACH_MSG_SUCCESS != ret) {
774 mach_error("mach_msg (send): ", ret);
775 fprintf(stderr, "bailing after %u iterations\n", idx);
776 exit(1);
777 break;
778 }
779 if (stress_prepost) {
780 OSAtomicAdd64(endtm - starttm, &g_client_send_time);
781 }
782
783 if (!oneway) {
784 if (verbose > 2) {
785 printf("client awaiting reply %d\n", idx);
786 }
787 reply->msgh_bits = 0;
788 reply->msgh_size = args.reply_size;
789 reply->msgh_local_port = args.port;
790 ret = mach_msg(args.reply_msg,
791 MACH_RCV_MSG | MACH_RCV_INTERRUPT,
792 0,
793 args.reply_size,
794 args.port,
795 MACH_MSG_TIMEOUT_NONE,
796 MACH_PORT_NULL);
797 if (MACH_MSG_SUCCESS != ret) {
798 mach_error("mach_msg (receive): ", ret);
799 fprintf(stderr, "bailing after %u iterations\n",
800 idx);
801 exit(1);
802 }
803 if (verbose > 2) {
804 printf("client received reply %d\n", idx);
805 }
806 }
807
808 client_work();
809 }
810
811 free(ints);
812 return NULL;
813 }
814
815 static void
816 thread_spawn(thread_id_t *thread, void *(fn)(void *), void *arg)
817 {
818 if (threaded) {
819 kern_return_t ret;
820 ret = pthread_create(
821 &thread->tid,
822 NULL,
823 fn,
824 arg);
825 if (ret != 0) {
826 err(1, "pthread_create()");
827 }
828 if (verbose > 1) {
829 printf("created pthread %p\n", thread->tid);
830 }
831 } else {
832 thread->pid = fork();
833 if (thread->pid == 0) {
834 if (verbose > 1) {
835 printf("calling %p(%p)\n", fn, arg);
836 }
837 fn(arg);
838 exit(0);
839 }
840 if (verbose > 1) {
841 printf("forked pid %d\n", thread->pid);
842 }
843 }
844 }
845
846 static void
847 thread_join(thread_id_t *thread)
848 {
849 if (threaded) {
850 kern_return_t ret;
851 if (verbose > 1) {
852 printf("joining thread %p\n", thread->tid);
853 }
854 ret = pthread_join(thread->tid, NULL);
855 if (ret != KERN_SUCCESS) {
856 err(1, "pthread_join(%p)", thread->tid);
857 }
858 } else {
859 int stat;
860 if (verbose > 1) {
861 printf("waiting for pid %d\n", thread->pid);
862 }
863 waitpid(thread->pid, &stat, 0);
864 }
865 }
866
867 static void
868 wait_for_servers(void)
869 {
870 int i;
871 int retry_count = 10;
872 mach_port_t bsport, servport;
873 kern_return_t ret;
874
875 /* find server port */
876 ret = task_get_bootstrap_port(mach_task_self(), &bsport);
877 if (KERN_SUCCESS != ret) {
878 mach_error("task_get_bootstrap_port(): ", ret);
879 exit(1);
880 }
881
882 while (retry_count-- > 0) {
883 for (i = 0; i < num_servers; i++) {
884 ret = bootstrap_look_up(bsport,
885 server_port_name[i],
886 &servport);
887 if (ret != KERN_SUCCESS) {
888 break;
889 }
890 }
891 if (ret == KERN_SUCCESS) {
892 return;
893 }
894 usleep(100 * 1000); /* 100ms */
895 }
896 fprintf(stderr, "Server(s) failed to register\n");
897 exit(1);
898 }
899
900 int
901 main(int argc, char *argv[])
902 {
903 int i;
904 int j;
905 thread_id_t *client_id;
906 thread_id_t *server_id;
907
908 signal(SIGINT, signal_handler);
909 parse_args(argc, argv);
910
911 if (mach_timebase_info(&g_timebase) != KERN_SUCCESS) {
912 fprintf(stderr, "Can't get mach_timebase_info!\n");
913 exit(1);
914 }
915
916 calibrate_client_work();
917
918 /*
919 * If we're using affinity create an empty namespace now
920 * so this is shared by all our offspring.
921 */
922 if (affinity) {
923 thread_setup(0);
924 }
925
926 server_id = (thread_id_t *) malloc(num_servers * sizeof(thread_id_t));
927 server_port_name = (char **) malloc(num_servers * sizeof(char *));
928 server_port_args = (struct port_args *)calloc(sizeof(struct port_args), num_servers);
929 if (!server_id || !server_port_name || !server_port_args) {
930 fprintf(stderr, "malloc/calloc of %d server book keeping structs failed\n", num_servers);
931 exit(1);
932 }
933
934 if (verbose) {
935 printf("creating %d servers\n", num_servers);
936 }
937 for (i = 0; i < num_servers; i++) {
938 server_port_name[i] = (char *) malloc(sizeof("PORT.pppppp.xx"));
939 /* PORT names include pid of main process for disambiguation */
940 sprintf(server_port_name[i], "PORT.%06d.%02d", getpid(), i);
941 thread_spawn(&server_id[i], server, (void *) (long) i);
942 }
943
944 int totalclients = num_servers * num_clients;
945 int totalmsg = num_msgs * totalclients;
946 struct timeval starttv, endtv, deltatv;
947
948 /*
949 * Wait for all servers to have registered all ports before starting
950 * the clients and the clock.
951 */
952 wait_for_servers();
953
954 printf("%d server%s, %d client%s per server (%d total) %u messages...",
955 num_servers, (num_servers > 1)? "s" : "",
956 num_clients, (num_clients > 1)? "s" : "",
957 totalclients,
958 totalmsg);
959 fflush(stdout);
960
961 /* Call gettimeofday() once and throw away result; some implementations
962 * (like Mach's) cache some time zone info on first call.
963 */
964 gettimeofday(&starttv, NULL);
965 gettimeofday(&starttv, NULL);
966
967 client_id = (thread_id_t *) malloc(totalclients * sizeof(thread_id_t));
968 if (verbose) {
969 printf("creating %d clients\n", totalclients);
970 }
971 for (i = 0; i < num_servers; i++) {
972 for (j = 0; j < num_clients; j++) {
973 thread_spawn(
974 &client_id[(i * num_clients) + j],
975 client,
976 (void *) (long) i);
977 }
978 }
979
980 /* Wait for servers to complete */
981 for (i = 0; i < num_servers; i++) {
982 thread_join(&server_id[i]);
983 }
984
985 gettimeofday(&endtv, NULL);
986 if (verbose) {
987 printf("all servers complete: waiting for clients...\n");
988 }
989
990 for (i = 0; i < totalclients; i++) {
991 thread_join(&client_id[i]);
992 }
993
994 /* report results */
995 deltatv.tv_sec = endtv.tv_sec - starttv.tv_sec;
996 deltatv.tv_usec = endtv.tv_usec - starttv.tv_usec;
997 if (endtv.tv_usec < starttv.tv_usec) {
998 deltatv.tv_sec--;
999 deltatv.tv_usec += 1000000;
1000 }
1001
1002 double dsecs = (double) deltatv.tv_sec +
1003 1.0E-6 * (double) deltatv.tv_usec;
1004
1005 printf(" in %lu.%03u seconds\n",
1006 deltatv.tv_sec, deltatv.tv_usec / 1000);
1007 printf(" throughput in messages/sec: %g\n",
1008 (double)totalmsg / dsecs);
1009 printf(" average message latency (usec): %2.3g\n",
1010 dsecs * 1.0E6 / (double) totalmsg);
1011
1012 double time_in_sec = (double)deltatv.tv_sec + (double)deltatv.tv_usec / 1000.0;
1013 double throughput_msg_p_sec = (double) totalmsg / dsecs;
1014 double avg_msg_latency = dsecs * 1.0E6 / (double)totalmsg;
1015
1016 if (save_perfdata == TRUE) {
1017 char name[256];
1018 snprintf(name, sizeof(name), "%s_avg_msg_latency", basename(argv[0]));
1019 record_perf_data(name, "usec", avg_msg_latency, "Message latency measured in microseconds. Lower is better", stderr);
1020 }
1021
1022 if (stress_prepost) {
1023 int64_t sendns = abs_to_ns(g_client_send_time);
1024 dsecs = (double)sendns / (double)NSEC_PER_SEC;
1025 printf(" total send time: %2.3gs\n", dsecs);
1026 printf(" average send time (usec): %2.3g\n",
1027 dsecs * 1.0E6 / (double)totalmsg);
1028 }
1029
1030 return 0;
1031 }