/*
 * Origin: git.saurik.com mirror of apple/xnu.git (xnu-4903.241.1.tar.gz),
 * file tools/tests/MPMMTest/MPMMtest.c, captured from the blame view.
 */
#include <AvailabilityMacros.h>
#include <mach/thread_policy.h>

#include <err.h>
#include <errno.h>
#include <libgen.h>
#include <limits.h>
#include <pthread.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>

#include <mach/mach.h>
#include <mach/mach_error.h>
#include <mach/mach_time.h>
#include <mach/notify.h>
#include <servers/bootstrap.h>
#include <sys/signal.h>
#include <sys/time.h>
#include <sys/types.h>
#include <sys/wait.h>
#include "../unit_tests/tests_common.h" /* for record_perf_data() */

#include <libkern/OSAtomic.h>
/*
 * Larger of two values. Each argument may be evaluated twice, so do not
 * pass expressions with side effects.
 */
#define MAX(A, B) ((A) < (B) ? (B) : (A))
27
28
29typedef struct {
30 mach_msg_header_t header;
31 mach_msg_trailer_t trailer; // subtract this when sending
32} ipc_trivial_message;
33
34typedef struct {
35 mach_msg_header_t header;
36 u_int32_t numbers[0];
37 mach_msg_trailer_t trailer; // subtract this when sending
38} ipc_inline_message;
39
40typedef struct {
41 mach_msg_header_t header;
42 mach_msg_body_t body;
43 mach_msg_ool_descriptor_t descriptor;
44 mach_msg_trailer_t trailer; // subtract this when sending
45} ipc_complex_message;
46
/* Kinds of message the clients can send; selected with the -type option. */
enum {
	msg_type_trivial = 0,	/* header only */
	msg_type_inline  = 1,	/* header plus inline integers */
	msg_type_complex = 2	/* header plus one out-of-line descriptor */
};
52
53struct port_args {
54 int server_num;
55 int req_size;
56 mach_msg_header_t *req_msg;
57 int reply_size;
58 mach_msg_header_t *reply_msg;
59 mach_port_t port;
60 mach_port_t rcv_set;
61
62 mach_port_t *set;
63 mach_port_t *port_list;
64};
65
/*
 * Handle for a spawned worker: a process id when workers are forked,
 * a pthread handle when running with -threaded.
 */
typedef union {
	pid_t		pid;
	pthread_t	tid;
} thread_id_t;
70
71/* Global options */
72static int verbose = 0;
73static boolean_t affinity = FALSE;
74static boolean_t timeshare = FALSE;
75static boolean_t threaded = FALSE;
76static boolean_t oneway = FALSE;
77static boolean_t useset = FALSE;
78static boolean_t save_perfdata = FALSE;
79int msg_type;
80int num_ints;
81int num_msgs;
82int num_clients;
83int num_servers;
84int client_delay;
85int client_spin;
86int client_pages;
87int portcount = 1;
88int setcount = 0;
89boolean_t stress_prepost = FALSE;
90char **server_port_name;
91
92struct port_args *server_port_args;
93
94/* global data */
95mach_timebase_info_data_t g_timebase;
96int64_t g_client_send_time = 0;
97
98static inline uint64_t ns_to_abs(uint64_t ns)
99{
100 return ns * g_timebase.denom / g_timebase.numer;
101}
102
103static inline uint64_t abs_to_ns(uint64_t abs)
104{
105 return abs * g_timebase.numer / g_timebase.denom;
106}
107
108
/*
 * Deliberately empty signal handler; main() installs it for SIGINT so the
 * signal is delivered to the handler instead of taking its default action.
 */
void
signal_handler(int sig)
{
	(void)sig;	/* nothing to do */
}
111
/*
 * Print the option summary and the default settings to stderr, then
 * terminate the process with exit status 1. Never returns.
 *
 * The text is kept in step with parse_args(): the client-work option is
 * "-spin", the default message type is trivial, and the default server
 * count is half of the available processors (at least one).
 */
void
usage(const char *progname)
{
	fprintf(stderr, "usage: %s [options]\n", progname);
	fprintf(stderr, "where options are:\n");
	fprintf(stderr, " -affinity\t\tthreads use affinity\n");
	fprintf(stderr, " -timeshare\t\tthreads use timeshare\n");
	fprintf(stderr, " -threaded\t\tuse (p)threads\n");
	fprintf(stderr, " -verbose\t\tbe verbose (use multiple times to increase verbosity)\n");
	fprintf(stderr, " -oneway\t\tdo not request return reply\n");
	fprintf(stderr, " -count num\t\tnumber of messages to send\n");
	fprintf(stderr, " -perf \t\tCreate perfdata files for metrics.\n");
	fprintf(stderr, " -type trivial|inline|complex\ttype of messages to send\n");
	fprintf(stderr, " -numints num\tnumber of 32-bit ints to send in messages\n");
	fprintf(stderr, " -servers num\tnumber of server threads to run\n");
	fprintf(stderr, " -clients num\tnumber of clients per server\n");
	fprintf(stderr, " -delay num\t\tmicroseconds to sleep clients between messages\n");
	fprintf(stderr, " -spin num\t\tmicroseconds of client work\n");
	fprintf(stderr, " -pages num\t\tpages of memory touched by client work\n");
	fprintf(stderr, " -set nset num\tcreate [nset] portsets and [num] ports in each server.\n");
	fprintf(stderr, " \tEach port is connected to each set.\n");
	fprintf(stderr, " -prepost\t\tstress the prepost system (implies -threaded, requires -set X Y)\n");
	fprintf(stderr, "default values are:\n");
	fprintf(stderr, " . no affinity\n");
	fprintf(stderr, " . not timeshare\n");
	fprintf(stderr, " . not threaded\n");
	fprintf(stderr, " . not verbose\n");
	fprintf(stderr, " . not oneway\n");
	fprintf(stderr, " . client sends 100000 messages\n");
	fprintf(stderr, " . trivial message type\n");
	fprintf(stderr, " . 64 32-bit integers in inline/complex messages\n");
	fprintf(stderr, " . num_available_processors/2 servers (at least 1)\n");
	fprintf(stderr, " . 4 clients per server\n");
	fprintf(stderr, " . no delay\n");
	fprintf(stderr, " . no sets / extra ports\n");
	fprintf(stderr, " . no prepost stress\n");
	exit(1);
}
148
149void parse_args(int argc, char *argv[]) {
150 host_basic_info_data_t info;
151 mach_msg_type_number_t count;
152 kern_return_t result;
153
154 /* Initialize defaults */
155 msg_type = msg_type_trivial;
156 num_ints = 64;
157 num_msgs = 100000;
158 client_delay = 0;
159 num_clients = 4;
160
161 count = HOST_BASIC_INFO_COUNT;
162 result = host_info(mach_host_self(), HOST_BASIC_INFO,
163 (host_info_t)&info, &count);
164 if (result == KERN_SUCCESS && info.avail_cpus > 1)
165 num_servers = info.avail_cpus / 2;
166 else
167 num_servers = 1;
168
169 const char *progname = argv[0];
170 argc--; argv++;
171 while (0 < argc) {
172 if (0 == strcmp("-verbose", argv[0])) {
173 verbose++;
174 argc--; argv++;
175 } else if (0 == strcmp("-affinity", argv[0])) {
176 affinity = TRUE;
177 argc--; argv++;
178 } else if (0 == strcmp("-timeshare", argv[0])) {
179 timeshare = TRUE;
180 argc--; argv++;
181 } else if (0 == strcmp("-threaded", argv[0])) {
182 threaded = TRUE;
183 argc--; argv++;
184 } else if (0 == strcmp("-oneway", argv[0])) {
185 oneway = TRUE;
186 argc--; argv++;
187 } else if (0 == strcmp("-perf", argv[0])) {
188 save_perfdata = TRUE;
189 argc--; argv++;
190 } else if (0 == strcmp("-type", argv[0])) {
191 if (argc < 2)
192 usage(progname);
193 if (0 == strcmp("trivial", argv[1])) {
194 msg_type = msg_type_trivial;
195 } else if (0 == strcmp("inline", argv[1])) {
196 msg_type = msg_type_inline;
197 } else if (0 == strcmp("complex", argv[1])) {
198 msg_type = msg_type_complex;
199 } else
200 usage(progname);
201 argc -= 2; argv += 2;
202 } else if (0 == strcmp("-numints", argv[0])) {
203 if (argc < 2)
204 usage(progname);
205 num_ints = strtoul(argv[1], NULL, 0);
206 argc -= 2; argv += 2;
207 } else if (0 == strcmp("-count", argv[0])) {
208 if (argc < 2)
209 usage(progname);
210 num_msgs = strtoul(argv[1], NULL, 0);
211 argc -= 2; argv += 2;
212 } else if (0 == strcmp("-clients", argv[0])) {
213 if (argc < 2)
214 usage(progname);
215 num_clients = strtoul(argv[1], NULL, 0);
216 argc -= 2; argv += 2;
217 } else if (0 == strcmp("-servers", argv[0])) {
218 if (argc < 2)
219 usage(progname);
220 num_servers = strtoul(argv[1], NULL, 0);
221 argc -= 2; argv += 2;
222 } else if (0 == strcmp("-delay", argv[0])) {
223 if (argc < 2)
224 usage(progname);
225 client_delay = strtoul(argv[1], NULL, 0);
226 argc -= 2; argv += 2;
227 } else if (0 == strcmp("-spin", argv[0])) {
228 if (argc < 2)
229 usage(progname);
230 client_spin = strtoul(argv[1], NULL, 0);
231 argc -= 2; argv += 2;
232 } else if (0 == strcmp("-pages", argv[0])) {
233 if (argc < 2)
234 usage(progname);
235 client_pages = strtoul(argv[1], NULL, 0);
236 argc -= 2; argv += 2;
237 } else if (0 == strcmp("-set", argv[0])) {
238 if (argc < 3)
239 usage(progname);
240 setcount = strtoul(argv[1], NULL, 0);
241 portcount = strtoul(argv[2], NULL, 0);
242 if (setcount <= 0 || portcount <= 0)
243 usage(progname);
244 useset = TRUE;
245 argc -= 3; argv += 3;
246 } else if (0 == strcmp("-prepost", argv[0])) {
247 stress_prepost = TRUE;
248 threaded = TRUE;
249 argc--; argv++;
250 } else {
251 fprintf(stderr, "unknown option '%s'\n", argv[0]);
252 usage(progname);
253 }
254 }
255
256 if (stress_prepost) {
257 if (!threaded) {
258 fprintf(stderr, "Prepost stress test _must_ be threaded\n");
259 exit(1);
260 }
261 if (portcount < 1 || setcount < 1) {
262 fprintf(stderr, "Prepost stress test requires >= 1 port in >= 1 set.\n");
263 exit(1);
264 }
265 }
266}
267
268void setup_server_ports(struct port_args *ports)
269{
270 kern_return_t ret = 0;
271 mach_port_t bsport;
272 mach_port_t port;
273
274 ports->req_size = MAX(sizeof(ipc_inline_message) +
275 sizeof(u_int32_t) * num_ints,
276 sizeof(ipc_complex_message));
277 ports->reply_size = sizeof(ipc_trivial_message) -
278 sizeof(mach_msg_trailer_t);
279 ports->req_msg = malloc(ports->req_size);
280 ports->reply_msg = malloc(ports->reply_size);
281 if (setcount > 0) {
282 ports->set = (mach_port_t *)calloc(sizeof(mach_port_t), setcount);
283 if (!ports->set) {
284 fprintf(stderr, "calloc(%lu, %d) failed!\n", sizeof(mach_port_t), setcount);
285 exit(1);
286 }
287 }
288 if (stress_prepost) {
289 ports->port_list = (mach_port_t *)calloc(sizeof(mach_port_t), portcount);
290 if (!ports->port_list) {
291 fprintf(stderr, "calloc(%lu, %d) failed!\n", sizeof(mach_port_t), portcount);
292 exit(1);
293 }
294 }
295
296 if (useset) {
297 mach_port_t set;
298 if (setcount < 1) {
299 fprintf(stderr, "Can't use sets with a setcount of %d\n", setcount);
300 exit(1);
301 }
302
303 for (int ns = 0; ns < setcount; ns++) {
304 ret = mach_port_allocate(mach_task_self(),
305 MACH_PORT_RIGHT_PORT_SET,
306 &ports->set[ns]);
307 if (KERN_SUCCESS != ret) {
308 mach_error("mach_port_allocate(SET): ", ret);
309 exit(1);
310 }
311 if (verbose > 1)
312 printf("SVR[%d] allocated set[%d] %#x\n",
313 ports->server_num, ns, ports->set[ns]);
314
315 set = ports->set[ns];
316 }
317
318 /* receive on a port set (always use the first in the chain) */
319 ports->rcv_set = ports->set[0];
320 }
321
322 /* stuff the portset(s) with ports */
323 for (int i = 0; i < portcount; i++) {
324 ret = mach_port_allocate(mach_task_self(),
325 MACH_PORT_RIGHT_RECEIVE,
326 &port);
327 if (KERN_SUCCESS != ret) {
328 mach_error("mach_port_allocate(PORT): ", ret);
329 exit(1);
330 }
331
332 if (stress_prepost)
333 ports->port_list[i] = port;
334
335 if (useset) {
336 /* insert the port into _all_ allocated lowest-level sets */
337 for (int ns = 0; ns < setcount; ns++) {
338 if (verbose > 1)
339 printf("SVR[%d] moving port %#x into set %#x...\n",
340 ports->server_num, port, ports->set[ns]);
341 ret = mach_port_insert_member(mach_task_self(),
342 port, ports->set[ns]);
343 if (KERN_SUCCESS != ret) {
344 mach_error("mach_port_insert_member(): ", ret);
345 exit(1);
346 }
347 }
348 }
349 }
350
351 /* use the last one as the server's bootstrap port */
352 ports->port = port;
353
354 if (stress_prepost) {
355 /* insert a send right for _each_ port */
356 for (int i = 0; i < portcount; i++) {
357 ret = mach_port_insert_right(mach_task_self(),
358 ports->port_list[i],
359 ports->port_list[i],
360 MACH_MSG_TYPE_MAKE_SEND);
361 if (KERN_SUCCESS != ret) {
362 mach_error("mach_port_insert_right(): ", ret);
363 exit(1);
364 }
365 }
366 } else {
367 ret = mach_port_insert_right(mach_task_self(),
368 ports->port,
369 ports->port,
370 MACH_MSG_TYPE_MAKE_SEND);
371 if (KERN_SUCCESS != ret) {
372 mach_error("mach_port_insert_right(): ", ret);
373 exit(1);
374 }
375 }
376
377 ret = task_get_bootstrap_port(mach_task_self(), &bsport);
378 if (KERN_SUCCESS != ret) {
379 mach_error("task_get_bootstrap_port(): ", ret);
380 exit(1);
381 }
382
383 if (verbose) {
384 printf("server waiting for IPC messages from client on port '%s' (%#x).\n",
385 server_port_name[ports->server_num], ports->port);
386 }
387 ret = bootstrap_register(bsport,
388 server_port_name[ports->server_num],
389 ports->port);
390 if (KERN_SUCCESS != ret) {
391 mach_error("bootstrap_register(): ", ret);
392 exit(1);
393 }
394}
395
396void setup_client_ports(struct port_args *ports)
397{
398 kern_return_t ret = 0;
399 switch(msg_type) {
400 case msg_type_trivial:
401 ports->req_size = sizeof(ipc_trivial_message);
402 break;
403 case msg_type_inline:
404 ports->req_size = sizeof(ipc_inline_message) +
405 sizeof(u_int32_t) * num_ints;
406 break;
407 case msg_type_complex:
408 ports->req_size = sizeof(ipc_complex_message);
409 break;
410 }
411 ports->req_size -= sizeof(mach_msg_trailer_t);
412 ports->reply_size = sizeof(ipc_trivial_message);
413 ports->req_msg = malloc(ports->req_size);
414 ports->reply_msg = malloc(ports->reply_size);
415
416 ret = mach_port_allocate(mach_task_self(),
417 MACH_PORT_RIGHT_RECEIVE,
418 &(ports->port));
419 if (KERN_SUCCESS != ret) {
420 mach_error("mach_port_allocate(): ", ret);
421 exit(1);
422 }
423 if (verbose) {
424 printf("Client sending %d %s IPC messages to port '%s' in %s mode\n",
425 num_msgs, (msg_type == msg_type_inline) ?
426 "inline" : ((msg_type == msg_type_complex) ?
427 "complex" : "trivial"),
428 server_port_name[ports->server_num],
429 (oneway ? "oneway" : "rpc"));
430 }
431}
432
433
434static void
435thread_setup(int tag) {
436 kern_return_t ret;
437 thread_extended_policy_data_t epolicy;
438 thread_affinity_policy_data_t policy;
439
440 if (!timeshare) {
441 epolicy.timeshare = FALSE;
442 ret = thread_policy_set(
443 mach_thread_self(), THREAD_EXTENDED_POLICY,
444 (thread_policy_t) &epolicy,
445 THREAD_EXTENDED_POLICY_COUNT);
446 if (ret != KERN_SUCCESS)
447 printf("thread_policy_set(THREAD_EXTENDED_POLICY) returned %d\n", ret);
448 }
449
450 if (affinity) {
451 policy.affinity_tag = tag;
452 ret = thread_policy_set(
453 mach_thread_self(), THREAD_AFFINITY_POLICY,
454 (thread_policy_t) &policy,
455 THREAD_AFFINITY_POLICY_COUNT);
456 if (ret != KERN_SUCCESS)
457 printf("thread_policy_set(THREAD_AFFINITY_POLICY) returned %d\n", ret);
458 }
459}
460
461void *
462server(void *serverarg)
463{
464 int idx;
465 kern_return_t ret;
466 int totalmsg = num_msgs * num_clients;
467 mach_port_t recv_port;
468 uint64_t starttm, endtm;
469
470 int svr_num = (int)(uintptr_t)serverarg;
471 struct port_args *args = &server_port_args[svr_num];
472
473 args->server_num = svr_num;
474 setup_server_ports(args);
475
476 thread_setup(args->server_num + 1);
477
478 recv_port = (useset) ? args->rcv_set : args->port;
479
480 for (idx = 0; idx < totalmsg; idx++) {
481 if (verbose > 2)
482 printf("server awaiting message %d\n", idx);
483 ret = mach_msg(args->req_msg,
484 MACH_RCV_MSG|MACH_RCV_INTERRUPT|MACH_RCV_LARGE,
485 0,
486 args->req_size,
487 recv_port,
488 MACH_MSG_TIMEOUT_NONE,
489 MACH_PORT_NULL);
490 if (MACH_RCV_INTERRUPTED == ret)
491 break;
492 if (MACH_MSG_SUCCESS != ret) {
493 if (verbose)
494 printf("mach_msg() ret=%d", ret);
495 mach_error("mach_msg (receive): ", ret);
496 exit(1);
497 }
498 if (verbose > 2)
499 printf("server received message %d\n", idx);
500 if (args->req_msg->msgh_bits & MACH_MSGH_BITS_COMPLEX) {
501 ret = vm_deallocate(mach_task_self(),
502 (vm_address_t)((ipc_complex_message *)args->req_msg)->descriptor.address,
503 ((ipc_complex_message *)args->req_msg)->descriptor.size);
504 }
505
506 if (1 == args->req_msg->msgh_id) {
507 if (verbose > 2)
508 printf("server sending reply %d\n", idx);
509 args->reply_msg->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_MOVE_SEND_ONCE, 0);
510 args->reply_msg->msgh_size = args->reply_size;
511 args->reply_msg->msgh_remote_port = args->req_msg->msgh_remote_port;
512 args->reply_msg->msgh_local_port = MACH_PORT_NULL;
513 args->reply_msg->msgh_id = 2;
514 ret = mach_msg(args->reply_msg,
515 MACH_SEND_MSG,
516 args->reply_size,
517 0,
518 MACH_PORT_NULL,
519 MACH_MSG_TIMEOUT_NONE,
520 MACH_PORT_NULL);
521 if (MACH_MSG_SUCCESS != ret) {
522 mach_error("mach_msg (send): ", ret);
523 exit(1);
524 }
525 }
526 }
527
528 if (!useset)
529 return NULL;
530
531 if (verbose < 1)
532 return NULL;
533
534 uint64_t deltans = 0;
535 /*
536 * If we're using multiple sets, explicitly tear them all down
537 * and measure the time.
538 */
539 for (int ns = 0; ns < setcount; ns++) {
540 if (verbose > 1)
541 printf("\tTearing down set[%d] %#x...\n", ns, args->set[ns]);
542 starttm = mach_absolute_time();
543 ret = mach_port_mod_refs(mach_task_self(), args->set[ns], MACH_PORT_RIGHT_PORT_SET, -1);
544 endtm = mach_absolute_time();
545 deltans += abs_to_ns(endtm - starttm);
546 if (ret != KERN_SUCCESS) {
547 mach_error("mach_port_mod_refs(): ", ret);
548 exit(1);
549 }
550 }
551
552 uint64_t nlinks = (uint64_t)setcount * (uint64_t)portcount;
553
554 printf("\tteardown of %llu links took %llu ns\n", nlinks, deltans);
555 printf("\t%lluns per set\n", deltans / (uint64_t)setcount);
556
557 return NULL;
558}
559
/* Call fn() exactly `count` times; fn is not called when count is 0. */
static inline void
client_spin_loop(unsigned count, void (fn)(void))
{
	while (count--)
		fn();
}
566
567static long dummy_memory;
568static long *client_memory = &dummy_memory;
569static void
570client_work_atom(void)
571{
572 static int i;
573
574 if (++i > client_pages * PAGE_SIZE / sizeof(long))
575 i = 0;
576 client_memory[i] = 0;
577}
578
579static int calibration_count = 10000;
580static int calibration_usec;
581static void *
582calibrate_client_work(void)
583{
584 long dummy;
585 struct timeval nowtv;
586 struct timeval warmuptv = { 0, 100 * 1000 }; /* 100ms */
587 struct timeval starttv;
588 struct timeval endtv;
589
590 if (client_spin) {
591 /* Warm-up the stepper first... */
592 gettimeofday(&nowtv, NULL);
593 timeradd(&nowtv, &warmuptv, &endtv);
594 do {
595 client_spin_loop(calibration_count, client_work_atom);
596 gettimeofday(&nowtv, NULL);
597 } while (timercmp(&nowtv, &endtv, < ));
598
599 /* Now do the calibration */
600 while (TRUE) {
601 gettimeofday(&starttv, NULL);
602 client_spin_loop(calibration_count, client_work_atom);
603 gettimeofday(&endtv, NULL);
604 if (endtv.tv_sec - starttv.tv_sec > 1) {
605 calibration_count /= 10;
606 continue;
607 }
608 calibration_usec = endtv.tv_usec - starttv.tv_usec;
609 if (endtv.tv_usec < starttv.tv_usec) {
610 calibration_usec += 1000000;
611 }
612 if (calibration_usec < 1000) {
613 calibration_count *= 10;
614 continue;
615 }
616 calibration_count /= calibration_usec;
617 break;
618 }
619 if (verbose > 1)
620 printf("calibration_count=%d calibration_usec=%d\n",
621 calibration_count, calibration_usec);
622 }
623 return NULL;
624}
625
626static void *
627client_work(void)
628{
629
630 if (client_spin) {
631 client_spin_loop(calibration_count*client_spin,
632 client_work_atom);
633 }
634
635 if (client_delay) {
636 usleep(client_delay);
637 }
638 return NULL;
639}
640
641void *client(void *threadarg)
642{
643 struct port_args args;
644 struct port_args *svr_args = NULL;
645 int idx;
646 mach_msg_header_t *req, *reply;
647 mach_port_t bsport, servport;
648 kern_return_t ret;
649 int server_num = (int)(uintptr_t)threadarg;
650 void *ints = malloc(sizeof(u_int32_t) * num_ints);
651
652 if (verbose)
653 printf("client(%d) started, server port name %s\n",
654 server_num, server_port_name[server_num]);
655
656 args.server_num = server_num;
657 thread_setup(server_num + 1);
658
659 if (stress_prepost)
660 svr_args = &server_port_args[server_num];
661
662 /* find server port */
663 ret = task_get_bootstrap_port(mach_task_self(), &bsport);
664 if (KERN_SUCCESS != ret) {
665 mach_error("task_get_bootstrap_port(): ", ret);
666 exit(1);
667 }
668 ret = bootstrap_look_up(bsport,
669 server_port_name[server_num],
670 &servport);
671 if (KERN_SUCCESS != ret) {
672 mach_error("bootstrap_look_up(): ", ret);
673 exit(1);
674 }
675
676 setup_client_ports(&args);
677
678 /* Allocate and touch memory */
679 if (client_pages) {
680 unsigned i;
681 client_memory = (long *) malloc(client_pages * PAGE_SIZE);
682 for (i = 0; i < client_pages; i++)
683 client_memory[i * PAGE_SIZE / sizeof(long)] = 0;
684 }
685
686 uint64_t starttm, endtm;
687
688 /* start message loop */
689 for (idx = 0; idx < num_msgs; idx++) {
690 req = args.req_msg;
691 reply = args.reply_msg;
692
693 req->msgh_size = args.req_size;
694 if (stress_prepost) {
695 req->msgh_remote_port = svr_args->port_list[idx % portcount];
696 } else {
697 req->msgh_remote_port = servport;
698 }
699 if (oneway) {
700 req->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_COPY_SEND, 0);
701 req->msgh_local_port = MACH_PORT_NULL;
702 } else {
703 req->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_COPY_SEND,
704 MACH_MSG_TYPE_MAKE_SEND_ONCE);
705 req->msgh_local_port = args.port;
706 }
707 req->msgh_id = oneway ? 0 : 1;
708 if (msg_type == msg_type_complex) {
709 (req)->msgh_bits |= MACH_MSGH_BITS_COMPLEX;
710 ((ipc_complex_message *)req)->body.msgh_descriptor_count = 1;
711 ((ipc_complex_message *)req)->descriptor.address = ints;
712 ((ipc_complex_message *)req)->descriptor.size =
713 num_ints * sizeof(u_int32_t);
714 ((ipc_complex_message *)req)->descriptor.deallocate = FALSE;
715 ((ipc_complex_message *)req)->descriptor.copy = MACH_MSG_VIRTUAL_COPY;
716 ((ipc_complex_message *)req)->descriptor.type = MACH_MSG_OOL_DESCRIPTOR;
717 }
718 if (verbose > 2)
719 printf("client sending message %d to port %#x\n",
720 idx, req->msgh_remote_port);
721 starttm = mach_absolute_time();
722 ret = mach_msg(req,
723 MACH_SEND_MSG,
724 args.req_size,
725 0,
726 MACH_PORT_NULL,
727 MACH_MSG_TIMEOUT_NONE,
728 MACH_PORT_NULL);
729 endtm = mach_absolute_time();
730 if (MACH_MSG_SUCCESS != ret) {
731 mach_error("mach_msg (send): ", ret);
732 fprintf(stderr, "bailing after %u iterations\n", idx);
733 exit(1);
734 break;
735 }
736 if (stress_prepost)
737 OSAtomicAdd64(endtm - starttm, &g_client_send_time);
738
739 if (!oneway) {
740 if (verbose > 2)
741 printf("client awaiting reply %d\n", idx);
742 reply->msgh_bits = 0;
743 reply->msgh_size = args.reply_size;
744 reply->msgh_local_port = args.port;
745 ret = mach_msg(args.reply_msg,
746 MACH_RCV_MSG|MACH_RCV_INTERRUPT,
747 0,
748 args.reply_size,
749 args.port,
750 MACH_MSG_TIMEOUT_NONE,
751 MACH_PORT_NULL);
752 if (MACH_MSG_SUCCESS != ret) {
753 mach_error("mach_msg (receive): ", ret);
754 fprintf(stderr, "bailing after %u iterations\n",
755 idx);
756 exit(1);
757 }
758 if (verbose > 2)
759 printf("client received reply %d\n", idx);
760 }
761
762 client_work();
763 }
764
765 free(ints);
766 return NULL;
767}
768
769static void
770thread_spawn(thread_id_t *thread, void *(fn)(void *), void *arg) {
771 if (threaded) {
772 kern_return_t ret;
773 ret = pthread_create(
774 &thread->tid,
775 NULL,
776 fn,
777 arg);
778 if (ret != 0)
779 err(1, "pthread_create()");
780 if (verbose > 1)
781 printf("created pthread %p\n", thread->tid);
782 } else {
783 thread->pid = fork();
784 if (thread->pid == 0) {
785 if (verbose > 1)
786 printf("calling %p(%p)\n", fn, arg);
787 fn(arg);
788 exit(0);
789 }
790 if (verbose > 1)
791 printf("forked pid %d\n", thread->pid);
792 }
793}
794
795static void
796thread_join(thread_id_t *thread) {
797 if (threaded) {
798 kern_return_t ret;
799 if (verbose > 1)
800 printf("joining thread %p\n", thread->tid);
801 ret = pthread_join(thread->tid, NULL);
802 if (ret != KERN_SUCCESS)
803 err(1, "pthread_join(%p)", thread->tid);
804 } else {
805 int stat;
806 if (verbose > 1)
807 printf("waiting for pid %d\n", thread->pid);
808 waitpid(thread->pid, &stat, 0);
809 }
810}
811
812static void
813wait_for_servers(void)
814{
815 int i;
816 int retry_count = 10;
817 mach_port_t bsport, servport;
818 kern_return_t ret;
819
820 /* find server port */
821 ret = task_get_bootstrap_port(mach_task_self(), &bsport);
822 if (KERN_SUCCESS != ret) {
823 mach_error("task_get_bootstrap_port(): ", ret);
824 exit(1);
825 }
826
827 while (retry_count-- > 0) {
828 for (i = 0; i < num_servers; i++) {
829 ret = bootstrap_look_up(bsport,
830 server_port_name[i],
831 &servport);
832 if (ret != KERN_SUCCESS) {
833 break;
834 }
835 }
836 if (ret == KERN_SUCCESS)
837 return;
838 usleep(100 * 1000); /* 100ms */
839 }
840 fprintf(stderr, "Server(s) failed to register\n");
841 exit(1);
842}
843
844int main(int argc, char *argv[])
845{
846 int i;
847 int j;
848 thread_id_t *client_id;
849 thread_id_t *server_id;
850
851 signal(SIGINT, signal_handler);
852 parse_args(argc, argv);
853
854 if (mach_timebase_info(&g_timebase) != KERN_SUCCESS) {
855 fprintf(stderr, "Can't get mach_timebase_info!\n");
856 exit(1);
857 }
858
859 calibrate_client_work();
860
861 /*
862 * If we're using affinity create an empty namespace now
863 * so this is shared by all our offspring.
864 */
865 if (affinity)
866 thread_setup(0);
867
868 server_id = (thread_id_t *) malloc(num_servers * sizeof(thread_id_t));
869 server_port_name = (char **) malloc(num_servers * sizeof(char *));
870 server_port_args = (struct port_args *)calloc(sizeof(struct port_args), num_servers);
871 if (!server_id || !server_port_name || !server_port_args) {
872 fprintf(stderr, "malloc/calloc of %d server book keeping structs failed\n", num_servers);
873 exit(1);
874 }
875
876 if (verbose)
877 printf("creating %d servers\n", num_servers);
878 for (i = 0; i < num_servers; i++) {
879 server_port_name[i] = (char *) malloc(sizeof("PORT.pppppp.xx"));
880 /* PORT names include pid of main process for disambiguation */
881 sprintf(server_port_name[i], "PORT.%06d.%02d", getpid(), i);
882 thread_spawn(&server_id[i], server, (void *) (long) i);
883 }
884
885 int totalclients = num_servers * num_clients;
886 int totalmsg = num_msgs * totalclients;
887 struct timeval starttv, endtv, deltatv;
888
889 /*
890 * Wait for all servers to have registered all ports before starting
891 * the clients and the clock.
892 */
893 wait_for_servers();
894
895 printf("%d server%s, %d client%s per server (%d total) %u messages...",
896 num_servers, (num_servers > 1)? "s" : "",
897 num_clients, (num_clients > 1)? "s" : "",
898 totalclients,
899 totalmsg);
900 fflush(stdout);
901
902 /* Call gettimeofday() once and throw away result; some implementations
903 * (like Mach's) cache some time zone info on first call.
904 */
905 gettimeofday(&starttv, NULL);
906 gettimeofday(&starttv, NULL);
907
908 client_id = (thread_id_t *) malloc(totalclients * sizeof(thread_id_t));
909 if (verbose)
910 printf("creating %d clients\n", totalclients);
911 for (i = 0; i < num_servers; i++) {
912 for (j = 0; j < num_clients; j++) {
913 thread_spawn(
914 &client_id[(i*num_clients) + j],
915 client,
916 (void *) (long) i);
917 }
918 }
919
920 /* Wait for servers to complete */
921 for (i = 0; i < num_servers; i++) {
922 thread_join(&server_id[i]);
923 }
924
925 gettimeofday(&endtv, NULL);
926 if (verbose)
927 printf("all servers complete: waiting for clients...\n");
928
929 for (i = 0; i < totalclients; i++) {
930 thread_join(&client_id[i]);
931 }
932
933 /* report results */
934 deltatv.tv_sec = endtv.tv_sec - starttv.tv_sec;
935 deltatv.tv_usec = endtv.tv_usec - starttv.tv_usec;
936 if (endtv.tv_usec < starttv.tv_usec) {
937 deltatv.tv_sec--;
938 deltatv.tv_usec += 1000000;
939 }
940
941 double dsecs = (double) deltatv.tv_sec +
942 1.0E-6 * (double) deltatv.tv_usec;
943
944 printf(" in %lu.%03u seconds\n",
945 deltatv.tv_sec, deltatv.tv_usec/1000);
946 printf(" throughput in messages/sec: %g\n",
947 (double)totalmsg / dsecs);
948 printf(" average message latency (usec): %2.3g\n",
949 dsecs * 1.0E6 / (double) totalmsg);
950
951 double time_in_sec = (double)deltatv.tv_sec + (double)deltatv.tv_usec/1000.0;
952 double throughput_msg_p_sec = (double) totalmsg/dsecs;
953 double avg_msg_latency = dsecs*1.0E6 / (double)totalmsg;
954
955 if (save_perfdata == TRUE) {
956 char name[256];
957 snprintf(name, sizeof(name), "%s_avg_msg_latency", basename(argv[0]));
958 record_perf_data(name, "usec", avg_msg_latency, "Message latency measured in microseconds. Lower is better", stderr);
959 }
960
961 if (stress_prepost) {
962 int64_t sendns = abs_to_ns(g_client_send_time);
963 dsecs = (double)sendns / (double)NSEC_PER_SEC;
964 printf(" total send time: %2.3gs\n", dsecs);
965 printf(" average send time (usec): %2.3g\n",
966 dsecs * 1.0E6 / (double)totalmsg);
967 }
968
969 return (0);
970
971}