]>
Commit | Line | Data |
---|---|---|
2d21ac55 | 1 | #include <AvailabilityMacros.h> |
fe8ab488 | 2 | #include <mach/thread_policy.h> |
2d21ac55 A |
3 | |
4 | #include <pthread.h> | |
5 | #include <stdio.h> | |
6 | #include <stdlib.h> | |
7 | #include <string.h> | |
8 | #include <err.h> | |
316670eb | 9 | #include <unistd.h> |
2d21ac55 A |
10 | |
11 | #include <pthread.h> | |
12 | #include <mach/mach.h> | |
13 | #include <mach/mach_error.h> | |
3e170ce0 | 14 | #include <mach/mach_time.h> |
2d21ac55 A |
15 | #include <mach/notify.h> |
16 | #include <servers/bootstrap.h> | |
17 | #include <sys/types.h> | |
18 | #include <sys/time.h> | |
19 | #include <sys/signal.h> | |
20 | ||
3e170ce0 A |
21 | #include <libkern/OSAtomic.h> |
22 | ||
2d21ac55 A |
/* Larger of A and B. Either argument may be evaluated twice, so avoid side effects. */
23 | #define MAX(A, B) ((A) < (B) ? (B) : (A)) |
24 | ||
2d21ac55 A |
25 | |
/* Message made of a Mach header only; the trailer member reserves receive-side space. */
26 | typedef struct { | |
27 | mach_msg_header_t header; | |
28 | mach_msg_trailer_t trailer; // subtract this when sending | |
29 | } ipc_trivial_message; | |
30 | ||
/*
 * Inline message: the header is followed by a payload of 32-bit integers.
 * numbers[] is declared with zero length; users of this type add
 * sizeof(u_int32_t) * num_ints to sizeof(ipc_inline_message) when sizing buffers.
 */
31 | typedef struct { | |
32 | mach_msg_header_t header; | |
2d21ac55 A |
33 | u_int32_t numbers[0]; |
34 | mach_msg_trailer_t trailer; // subtract this when sending | |
35 | } ipc_inline_message; | |
36 | ||
/* Complex message: header, body (descriptor count) and one out-of-line memory descriptor. */
37 | typedef struct { | |
38 | mach_msg_header_t header; | |
39 | mach_msg_body_t body; | |
40 | mach_msg_ool_descriptor_t descriptor; | |
41 | mach_msg_trailer_t trailer; // subtract this when sending | |
42 | } ipc_complex_message; | |
43 | ||
/* Values stored in the global msg_type, selected with the -type option. */
44 | enum { | |
45 | msg_type_trivial = 0, | |
46 | msg_type_inline = 1, | |
47 | msg_type_complex = 2 | |
48 | }; | |
49 | ||
/*
 * Per-endpoint state: message buffers, their sizes and the Mach ports in use.
 * Servers use one entry of server_port_args each; every client keeps its own
 * copy on its stack.
 */
50 | struct port_args { | |
51 | int server_num; | |
52 | int req_size; | |
53 | mach_msg_header_t *req_msg; | |
54 | int reply_size; | |
55 | mach_msg_header_t *reply_msg; | |
/* Server: the port registered with bootstrap. Client: the port replies are received on. */
56 | mach_port_t port; | |
3e170ce0 A |
/* Port set the server receives on when sets are enabled (always set[0]). */
57 | mach_port_t rcv_set; |
58 | ||
/* Array of setcount port sets; allocated only when setcount > 0. */
59 | mach_port_t *set; | |
/* Array of portcount receive ports; allocated only for the prepost stress test. */
60 | mach_port_t *port_list; | |
2d21ac55 A |
61 | }; |
62 | ||
/* Worker handle: a pthread when running threaded, otherwise the pid of a forked child. */
63 | typedef union { | |
64 | pid_t pid; | |
65 | pthread_t tid; | |
66 | } thread_id_t; | |
67 | ||
68 | /* Global options */ | |
/* Verbosity level; incremented once per -verbose on the command line. */
3e170ce0 | 69 | static int verbose = 0; |
2d21ac55 A |
70 | static boolean_t affinity = FALSE; |
71 | static boolean_t timeshare = FALSE; | |
/* TRUE: workers are pthreads; FALSE: workers are forked processes. */
72 | static boolean_t threaded = FALSE; | |
/* TRUE: clients do not request or wait for a reply. */
73 | static boolean_t oneway = FALSE; | |
b0d623f7 | 74 | static boolean_t useset = FALSE; |
2d21ac55 A |
/* One of the msg_type_* enum values. */
75 | int msg_type; |
76 | int num_ints; | |
/* Messages sent by each client. */
77 | int num_msgs; | |
/* Clients per server. */
78 | int num_clients; | |
79 | int num_servers; | |
/* Microseconds each client sleeps after a message (0 = none). */
80 | int client_delay; | |
/* Multiplier applied to calibration_count for the client's busy work (0 = none). */
81 | int client_spin; | |
/* Pages of memory allocated and touched by each client (0 = none). */
82 | int client_pages; | |
/* Receive ports allocated per server. */
b0d623f7 | 83 | int portcount = 1; |
3e170ce0 A |
/* Port sets allocated per server. */
84 | int setcount = 0; |
85 | boolean_t stress_prepost = FALSE; | |
2d21ac55 A |
/* Bootstrap service name of each server, indexed by server number. */
86 | char **server_port_name; |
87 | ||
3e170ce0 A |
/* Port state of each server, indexed by server number. */
88 | struct port_args *server_port_args; |
89 | ||
90 | /* global data */ | |
/* Timebase filled in by main() and used by ns_to_abs()/abs_to_ns(). */
91 | mach_timebase_info_data_t g_timebase; | |
/* Sum of mach_absolute_time() deltas around client sends; updated only when stress_prepost is set. */
92 | int64_t g_client_send_time = 0; | |
93 | ||
94 | static inline uint64_t ns_to_abs(uint64_t ns) | |
95 | { | |
96 | return ns * g_timebase.denom / g_timebase.numer; | |
97 | } | |
98 | ||
99 | static inline uint64_t abs_to_ns(uint64_t abs) | |
100 | { | |
101 | return abs * g_timebase.numer / g_timebase.denom; | |
102 | } | |
103 | ||
104 | ||
2d21ac55 A |
/*
 * Signal handler that intentionally does nothing. main() installs it for
 * SIGINT, replacing the default action.
 */
void signal_handler(int sig)
{
	(void)sig;
}
107 | ||
/*
 * Print the command-line synopsis and the built-in defaults to stderr, then
 * terminate the process with exit status 1. This function does not return.
 *
 * The text is kept in step with parse_args(): the busy-work option is spelled
 * "-spin", the default message type is trivial, and the default server count
 * is half the available processors (minimum 1).
 *
 * progname: program name shown on the synopsis line.
 */
void usage(const char *progname) {
	fprintf(stderr, "usage: %s [options]\n", progname);
	fprintf(stderr, "where options are:\n");
	fprintf(stderr, " -affinity\t\tthreads use affinity\n");
	fprintf(stderr, " -timeshare\t\tthreads use timeshare\n");
	fprintf(stderr, " -threaded\t\tuse (p)threads\n");
	fprintf(stderr, " -verbose\t\tbe verbose (use multiple times to increase verbosity)\n");
	fprintf(stderr, " -oneway\t\tdo not request return reply\n");
	fprintf(stderr, " -count num\t\tnumber of messages to send\n");
	fprintf(stderr, " -type trivial|inline|complex\ttype of messages to send\n");
	fprintf(stderr, " -numints num\tnumber of 32-bit ints to send in messages\n");
	fprintf(stderr, " -servers num\tnumber of server threads to run\n");
	fprintf(stderr, " -clients num\tnumber of clients per server\n");
	fprintf(stderr, " -delay num\t\tmicroseconds to sleep clients between messages\n");
	/* parse_args() recognizes this option as "-spin", not "-work". */
	fprintf(stderr, " -spin num\t\tmicroseconds of client work\n");
	fprintf(stderr, " -pages num\t\tpages of memory touched by client work\n");
	fprintf(stderr, " -set nset num\tcreate [nset] portsets and [num] ports in each server.\n");
	fprintf(stderr, " \tEach port is connected to each set.\n");
	fprintf(stderr, " -prepost\t\tstress the prepost system (implies -threaded, requires -set X Y)\n");
	fprintf(stderr, "default values are:\n");
	fprintf(stderr, " . no affinity\n");
	fprintf(stderr, " . not timeshare\n");
	fprintf(stderr, " . not threaded\n");
	fprintf(stderr, " . not verbose\n");
	fprintf(stderr, " . not oneway\n");
	fprintf(stderr, " . client sends 100000 messages\n");
	/* parse_args() initializes msg_type to msg_type_trivial. */
	fprintf(stderr, " . trivial message type\n");
	fprintf(stderr, " . 64 32-bit integers in inline/complex messages\n");
	/* parse_args() uses avail_cpus / 2, falling back to 1. */
	fprintf(stderr, " . num_available_processors/2 servers (at least 1)\n");
	fprintf(stderr, " . 4 clients per server\n");
	fprintf(stderr, " . no delay\n");
	fprintf(stderr, " . no sets / extra ports\n");
	fprintf(stderr, " . no prepost stress\n");
	exit(1);
}
143 | ||
144 | void parse_args(int argc, char *argv[]) { | |
145 | host_basic_info_data_t info; | |
146 | mach_msg_type_number_t count; | |
147 | kern_return_t result; | |
148 | ||
149 | /* Initialize defaults */ | |
150 | msg_type = msg_type_trivial; | |
151 | num_ints = 64; | |
152 | num_msgs = 100000; | |
153 | client_delay = 0; | |
154 | num_clients = 4; | |
155 | ||
156 | count = HOST_BASIC_INFO_COUNT; | |
157 | result = host_info(mach_host_self(), HOST_BASIC_INFO, | |
158 | (host_info_t)&info, &count); | |
159 | if (result == KERN_SUCCESS && info.avail_cpus > 1) | |
160 | num_servers = info.avail_cpus / 2; | |
161 | else | |
162 | num_servers = 1; | |
163 | ||
164 | const char *progname = argv[0]; | |
165 | argc--; argv++; | |
166 | while (0 < argc) { | |
167 | if (0 == strcmp("-verbose", argv[0])) { | |
3e170ce0 | 168 | verbose++; |
2d21ac55 A |
169 | argc--; argv++; |
170 | } else if (0 == strcmp("-affinity", argv[0])) { | |
171 | affinity = TRUE; | |
172 | argc--; argv++; | |
173 | } else if (0 == strcmp("-timeshare", argv[0])) { | |
174 | timeshare = TRUE; | |
175 | argc--; argv++; | |
176 | } else if (0 == strcmp("-threaded", argv[0])) { | |
177 | threaded = TRUE; | |
178 | argc--; argv++; | |
179 | } else if (0 == strcmp("-oneway", argv[0])) { | |
180 | oneway = TRUE; | |
181 | argc--; argv++; | |
182 | } else if (0 == strcmp("-type", argv[0])) { | |
183 | if (argc < 2) | |
184 | usage(progname); | |
185 | if (0 == strcmp("trivial", argv[1])) { | |
186 | msg_type = msg_type_trivial; | |
187 | } else if (0 == strcmp("inline", argv[1])) { | |
188 | msg_type = msg_type_inline; | |
189 | } else if (0 == strcmp("complex", argv[1])) { | |
190 | msg_type = msg_type_complex; | |
191 | } else | |
192 | usage(progname); | |
193 | argc -= 2; argv += 2; | |
194 | } else if (0 == strcmp("-numints", argv[0])) { | |
195 | if (argc < 2) | |
196 | usage(progname); | |
197 | num_ints = strtoul(argv[1], NULL, 0); | |
198 | argc -= 2; argv += 2; | |
199 | } else if (0 == strcmp("-count", argv[0])) { | |
200 | if (argc < 2) | |
201 | usage(progname); | |
202 | num_msgs = strtoul(argv[1], NULL, 0); | |
203 | argc -= 2; argv += 2; | |
204 | } else if (0 == strcmp("-clients", argv[0])) { | |
205 | if (argc < 2) | |
206 | usage(progname); | |
207 | num_clients = strtoul(argv[1], NULL, 0); | |
208 | argc -= 2; argv += 2; | |
209 | } else if (0 == strcmp("-servers", argv[0])) { | |
210 | if (argc < 2) | |
211 | usage(progname); | |
212 | num_servers = strtoul(argv[1], NULL, 0); | |
213 | argc -= 2; argv += 2; | |
214 | } else if (0 == strcmp("-delay", argv[0])) { | |
215 | if (argc < 2) | |
216 | usage(progname); | |
217 | client_delay = strtoul(argv[1], NULL, 0); | |
218 | argc -= 2; argv += 2; | |
219 | } else if (0 == strcmp("-spin", argv[0])) { | |
220 | if (argc < 2) | |
221 | usage(progname); | |
222 | client_spin = strtoul(argv[1], NULL, 0); | |
223 | argc -= 2; argv += 2; | |
224 | } else if (0 == strcmp("-pages", argv[0])) { | |
225 | if (argc < 2) | |
226 | usage(progname); | |
227 | client_pages = strtoul(argv[1], NULL, 0); | |
228 | argc -= 2; argv += 2; | |
b0d623f7 | 229 | } else if (0 == strcmp("-set", argv[0])) { |
3e170ce0 A |
230 | if (argc < 3) |
231 | usage(progname); | |
232 | setcount = strtoul(argv[1], NULL, 0); | |
233 | portcount = strtoul(argv[2], NULL, 0); | |
234 | if (setcount <= 0 || portcount <= 0) | |
b0d623f7 | 235 | usage(progname); |
b0d623f7 | 236 | useset = TRUE; |
3e170ce0 A |
237 | argc -= 3; argv += 3; |
238 | } else if (0 == strcmp("-prepost", argv[0])) { | |
239 | stress_prepost = TRUE; | |
240 | threaded = TRUE; | |
b0d623f7 | 241 | argc--; argv++; |
3e170ce0 A |
242 | } else { |
243 | fprintf(stderr, "unknown option '%s'\n", argv[0]); | |
2d21ac55 | 244 | usage(progname); |
3e170ce0 A |
245 | } |
246 | } | |
247 | ||
248 | if (stress_prepost) { | |
249 | if (!threaded) { | |
250 | fprintf(stderr, "Prepost stress test _must_ be threaded\n"); | |
251 | exit(1); | |
252 | } | |
253 | if (portcount < 1 || setcount < 1) { | |
254 | fprintf(stderr, "Prepost stress test requires >= 1 port in >= 1 set.\n"); | |
255 | exit(1); | |
256 | } | |
2d21ac55 A |
257 | } |
258 | } | |
259 | ||
260 | void setup_server_ports(struct port_args *ports) | |
261 | { | |
262 | kern_return_t ret = 0; | |
263 | mach_port_t bsport; | |
b0d623f7 | 264 | mach_port_t port; |
2d21ac55 A |
265 | |
266 | ports->req_size = MAX(sizeof(ipc_inline_message) + | |
267 | sizeof(u_int32_t) * num_ints, | |
268 | sizeof(ipc_complex_message)); | |
269 | ports->reply_size = sizeof(ipc_trivial_message) - | |
270 | sizeof(mach_msg_trailer_t); | |
271 | ports->req_msg = malloc(ports->req_size); | |
272 | ports->reply_msg = malloc(ports->reply_size); | |
3e170ce0 A |
273 | if (setcount > 0) { |
274 | ports->set = (mach_port_t *)calloc(sizeof(mach_port_t), setcount); | |
275 | if (!ports->set) { | |
276 | fprintf(stderr, "calloc(%lu, %d) failed!\n", sizeof(mach_port_t), setcount); | |
277 | exit(1); | |
278 | } | |
279 | } | |
280 | if (stress_prepost) { | |
281 | ports->port_list = (mach_port_t *)calloc(sizeof(mach_port_t), portcount); | |
282 | if (!ports->port_list) { | |
283 | fprintf(stderr, "calloc(%lu, %d) failed!\n", sizeof(mach_port_t), portcount); | |
284 | exit(1); | |
285 | } | |
286 | } | |
2d21ac55 | 287 | |
b0d623f7 | 288 | if (useset) { |
3e170ce0 A |
289 | mach_port_t set; |
290 | if (setcount < 1) { | |
291 | fprintf(stderr, "Can't use sets with a setcount of %d\n", setcount); | |
b0d623f7 A |
292 | exit(1); |
293 | } | |
3e170ce0 A |
294 | |
295 | for (int ns = 0; ns < setcount; ns++) { | |
296 | ret = mach_port_allocate(mach_task_self(), | |
297 | MACH_PORT_RIGHT_PORT_SET, | |
298 | &ports->set[ns]); | |
299 | if (KERN_SUCCESS != ret) { | |
300 | mach_error("mach_port_allocate(SET): ", ret); | |
301 | exit(1); | |
302 | } | |
303 | if (verbose > 1) | |
304 | printf("SVR[%d] allocated set[%d] %#x\n", | |
305 | ports->server_num, ns, ports->set[ns]); | |
306 | ||
307 | set = ports->set[ns]; | |
308 | } | |
309 | ||
310 | /* receive on a port set (always use the first in the chain) */ | |
311 | ports->rcv_set = ports->set[0]; | |
b0d623f7 A |
312 | } |
313 | ||
3e170ce0 A |
314 | /* stuff the portset(s) with ports */ |
315 | for (int i = 0; i < portcount; i++) { | |
b0d623f7 A |
316 | ret = mach_port_allocate(mach_task_self(), |
317 | MACH_PORT_RIGHT_RECEIVE, | |
318 | &port); | |
319 | if (KERN_SUCCESS != ret) { | |
320 | mach_error("mach_port_allocate(PORT): ", ret); | |
321 | exit(1); | |
322 | } | |
323 | ||
3e170ce0 A |
324 | if (stress_prepost) |
325 | ports->port_list[i] = port; | |
326 | ||
b0d623f7 | 327 | if (useset) { |
3e170ce0 A |
328 | /* insert the port into _all_ allocated lowest-level sets */ |
329 | for (int ns = 0; ns < setcount; ns++) { | |
330 | if (verbose > 1) | |
331 | printf("SVR[%d] moving port %#x into set %#x...\n", | |
332 | ports->server_num, port, ports->set[ns]); | |
333 | ret = mach_port_insert_member(mach_task_self(), | |
334 | port, ports->set[ns]); | |
335 | if (KERN_SUCCESS != ret) { | |
336 | mach_error("mach_port_insert_member(): ", ret); | |
337 | exit(1); | |
338 | } | |
b0d623f7 A |
339 | } |
340 | } | |
2d21ac55 A |
341 | } |
342 | ||
3e170ce0 | 343 | /* use the last one as the server's bootstrap port */ |
b0d623f7 A |
344 | ports->port = port; |
345 | ||
3e170ce0 A |
346 | if (stress_prepost) { |
347 | /* insert a send right for _each_ port */ | |
348 | for (int i = 0; i < portcount; i++) { | |
349 | ret = mach_port_insert_right(mach_task_self(), | |
350 | ports->port_list[i], | |
351 | ports->port_list[i], | |
352 | MACH_MSG_TYPE_MAKE_SEND); | |
353 | if (KERN_SUCCESS != ret) { | |
354 | mach_error("mach_port_insert_right(): ", ret); | |
355 | exit(1); | |
356 | } | |
357 | } | |
358 | } else { | |
359 | ret = mach_port_insert_right(mach_task_self(), | |
360 | ports->port, | |
361 | ports->port, | |
362 | MACH_MSG_TYPE_MAKE_SEND); | |
363 | if (KERN_SUCCESS != ret) { | |
364 | mach_error("mach_port_insert_right(): ", ret); | |
365 | exit(1); | |
366 | } | |
2d21ac55 A |
367 | } |
368 | ||
369 | ret = task_get_bootstrap_port(mach_task_self(), &bsport); | |
370 | if (KERN_SUCCESS != ret) { | |
371 | mach_error("task_get_bootstrap_port(): ", ret); | |
372 | exit(1); | |
373 | } | |
374 | ||
375 | if (verbose) { | |
3e170ce0 A |
376 | printf("server waiting for IPC messages from client on port '%s' (%#x).\n", |
377 | server_port_name[ports->server_num], ports->port); | |
2d21ac55 A |
378 | } |
379 | ret = bootstrap_register(bsport, | |
380 | server_port_name[ports->server_num], | |
381 | ports->port); | |
382 | if (KERN_SUCCESS != ret) { | |
383 | mach_error("bootstrap_register(): ", ret); | |
384 | exit(1); | |
385 | } | |
386 | } | |
387 | ||
388 | void setup_client_ports(struct port_args *ports) | |
389 | { | |
390 | kern_return_t ret = 0; | |
391 | switch(msg_type) { | |
392 | case msg_type_trivial: | |
393 | ports->req_size = sizeof(ipc_trivial_message); | |
394 | break; | |
395 | case msg_type_inline: | |
396 | ports->req_size = sizeof(ipc_inline_message) + | |
397 | sizeof(u_int32_t) * num_ints; | |
398 | break; | |
399 | case msg_type_complex: | |
400 | ports->req_size = sizeof(ipc_complex_message); | |
401 | break; | |
402 | } | |
403 | ports->req_size -= sizeof(mach_msg_trailer_t); | |
404 | ports->reply_size = sizeof(ipc_trivial_message); | |
405 | ports->req_msg = malloc(ports->req_size); | |
406 | ports->reply_msg = malloc(ports->reply_size); | |
407 | ||
408 | ret = mach_port_allocate(mach_task_self(), | |
409 | MACH_PORT_RIGHT_RECEIVE, | |
410 | &(ports->port)); | |
411 | if (KERN_SUCCESS != ret) { | |
412 | mach_error("mach_port_allocate(): ", ret); | |
413 | exit(1); | |
414 | } | |
415 | if (verbose) { | |
3e170ce0 | 416 | printf("Client sending %d %s IPC messages to port '%s' in %s mode\n", |
2d21ac55 A |
417 | num_msgs, (msg_type == msg_type_inline) ? |
418 | "inline" : ((msg_type == msg_type_complex) ? | |
419 | "complex" : "trivial"), | |
420 | server_port_name[ports->server_num], | |
421 | (oneway ? "oneway" : "rpc")); | |
422 | } | |
2d21ac55 A |
423 | } |
424 | ||
425 | ||
426 | static void | |
427 | thread_setup(int tag) { | |
2d21ac55 A |
428 | kern_return_t ret; |
429 | thread_extended_policy_data_t epolicy; | |
430 | thread_affinity_policy_data_t policy; | |
431 | ||
432 | if (!timeshare) { | |
433 | epolicy.timeshare = FALSE; | |
434 | ret = thread_policy_set( | |
435 | mach_thread_self(), THREAD_EXTENDED_POLICY, | |
436 | (thread_policy_t) &epolicy, | |
437 | THREAD_EXTENDED_POLICY_COUNT); | |
438 | if (ret != KERN_SUCCESS) | |
439 | printf("thread_policy_set(THREAD_EXTENDED_POLICY) returned %d\n", ret); | |
440 | } | |
441 | ||
442 | if (affinity) { | |
443 | policy.affinity_tag = tag; | |
444 | ret = thread_policy_set( | |
445 | mach_thread_self(), THREAD_AFFINITY_POLICY, | |
446 | (thread_policy_t) &policy, | |
447 | THREAD_AFFINITY_POLICY_COUNT); | |
448 | if (ret != KERN_SUCCESS) | |
449 | printf("thread_policy_set(THREAD_AFFINITY_POLICY) returned %d\n", ret); | |
450 | } | |
2d21ac55 A |
451 | } |
452 | ||
453 | void * | |
3e170ce0 | 454 | server(void *serverarg) |
2d21ac55 | 455 | { |
2d21ac55 A |
456 | int idx; |
457 | kern_return_t ret; | |
458 | int totalmsg = num_msgs * num_clients; | |
b0d623f7 | 459 | mach_port_t recv_port; |
3e170ce0 A |
460 | uint64_t starttm, endtm; |
461 | ||
462 | int svr_num = (int)(uintptr_t)serverarg; | |
463 | struct port_args *args = &server_port_args[svr_num]; | |
2d21ac55 | 464 | |
3e170ce0 A |
465 | args->server_num = svr_num; |
466 | setup_server_ports(args); | |
2d21ac55 | 467 | |
3e170ce0 | 468 | thread_setup(args->server_num + 1); |
2d21ac55 | 469 | |
3e170ce0 | 470 | recv_port = (useset) ? args->rcv_set : args->port; |
b0d623f7 | 471 | |
2d21ac55 | 472 | for (idx = 0; idx < totalmsg; idx++) { |
3e170ce0 | 473 | if (verbose > 2) |
2d21ac55 | 474 | printf("server awaiting message %d\n", idx); |
3e170ce0 | 475 | ret = mach_msg(args->req_msg, |
2d21ac55 A |
476 | MACH_RCV_MSG|MACH_RCV_INTERRUPT|MACH_RCV_LARGE, |
477 | 0, | |
3e170ce0 | 478 | args->req_size, |
b0d623f7 | 479 | recv_port, |
2d21ac55 A |
480 | MACH_MSG_TIMEOUT_NONE, |
481 | MACH_PORT_NULL); | |
482 | if (MACH_RCV_INTERRUPTED == ret) | |
483 | break; | |
484 | if (MACH_MSG_SUCCESS != ret) { | |
485 | if (verbose) | |
486 | printf("mach_msg() ret=%d", ret); | |
487 | mach_error("mach_msg (receive): ", ret); | |
488 | exit(1); | |
489 | } | |
3e170ce0 | 490 | if (verbose > 2) |
2d21ac55 | 491 | printf("server received message %d\n", idx); |
3e170ce0 | 492 | if (args->req_msg->msgh_bits & MACH_MSGH_BITS_COMPLEX) { |
2d21ac55 | 493 | ret = vm_deallocate(mach_task_self(), |
3e170ce0 A |
494 | (vm_address_t)((ipc_complex_message *)args->req_msg)->descriptor.address, |
495 | ((ipc_complex_message *)args->req_msg)->descriptor.size); | |
2d21ac55 A |
496 | } |
497 | ||
3e170ce0 A |
498 | if (1 == args->req_msg->msgh_id) { |
499 | if (verbose > 2) | |
2d21ac55 | 500 | printf("server sending reply %d\n", idx); |
3e170ce0 A |
501 | args->reply_msg->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_MOVE_SEND_ONCE, 0); |
502 | args->reply_msg->msgh_size = args->reply_size; | |
503 | args->reply_msg->msgh_remote_port = args->req_msg->msgh_remote_port; | |
504 | args->reply_msg->msgh_local_port = MACH_PORT_NULL; | |
505 | args->reply_msg->msgh_id = 2; | |
506 | ret = mach_msg(args->reply_msg, | |
2d21ac55 | 507 | MACH_SEND_MSG, |
3e170ce0 | 508 | args->reply_size, |
2d21ac55 A |
509 | 0, |
510 | MACH_PORT_NULL, | |
511 | MACH_MSG_TIMEOUT_NONE, | |
512 | MACH_PORT_NULL); | |
513 | if (MACH_MSG_SUCCESS != ret) { | |
514 | mach_error("mach_msg (send): ", ret); | |
515 | exit(1); | |
516 | } | |
517 | } | |
518 | } | |
3e170ce0 A |
519 | |
520 | if (!useset) | |
521 | return NULL; | |
522 | ||
523 | if (verbose < 1) | |
524 | return NULL; | |
525 | ||
526 | uint64_t deltans = 0; | |
527 | /* | |
528 | * If we're using multiple sets, explicitly tear them all down | |
529 | * and measure the time. | |
530 | */ | |
531 | for (int ns = 0; ns < setcount; ns++) { | |
532 | if (verbose > 1) | |
533 | printf("\tTearing down set[%d] %#x...\n", ns, args->set[ns]); | |
534 | starttm = mach_absolute_time(); | |
535 | ret = mach_port_mod_refs(mach_task_self(), args->set[ns], MACH_PORT_RIGHT_PORT_SET, -1); | |
536 | endtm = mach_absolute_time(); | |
537 | deltans += abs_to_ns(endtm - starttm); | |
538 | if (ret != KERN_SUCCESS) { | |
539 | mach_error("mach_port_mod_refs(): ", ret); | |
540 | exit(1); | |
541 | } | |
542 | } | |
543 | ||
544 | uint64_t nlinks = (uint64_t)setcount * (uint64_t)portcount; | |
545 | ||
546 | printf("\tteardown of %llu links took %llu ns\n", nlinks, deltans); | |
547 | printf("\t%lluns per set\n", deltans / (uint64_t)setcount); | |
548 | ||
316670eb | 549 | return NULL; |
2d21ac55 A |
550 | } |
551 | ||
/*
 * Call fn exactly `count` times, one call after another.
 *
 * count: number of invocations; 0 means fn is never called.
 * fn:    function to invoke.
 */
static inline void
client_spin_loop(unsigned count, void (fn)(void))
{
	for (; count != 0; count--) {
		fn();
	}
}
558 | ||
559 | static long dummy_memory; | |
560 | static long *client_memory = &dummy_memory; | |
561 | static void | |
562 | client_work_atom(void) | |
563 | { | |
564 | static int i; | |
565 | ||
566 | if (++i > client_pages * PAGE_SIZE / sizeof(long)) | |
567 | i = 0; | |
568 | client_memory[i] = 0; | |
569 | } | |
570 | ||
571 | static int calibration_count = 10000; | |
572 | static int calibration_usec; | |
573 | static void * | |
574 | calibrate_client_work(void) | |
575 | { | |
576 | long dummy; | |
577 | struct timeval nowtv; | |
578 | struct timeval warmuptv = { 0, 100 * 1000 }; /* 100ms */ | |
579 | struct timeval starttv; | |
580 | struct timeval endtv; | |
581 | ||
582 | if (client_spin) { | |
583 | /* Warm-up the stepper first... */ | |
584 | gettimeofday(&nowtv, NULL); | |
585 | timeradd(&nowtv, &warmuptv, &endtv); | |
586 | do { | |
587 | client_spin_loop(calibration_count, client_work_atom); | |
588 | gettimeofday(&nowtv, NULL); | |
589 | } while (timercmp(&nowtv, &endtv, < )); | |
590 | ||
591 | /* Now do the calibration */ | |
592 | while (TRUE) { | |
593 | gettimeofday(&starttv, NULL); | |
594 | client_spin_loop(calibration_count, client_work_atom); | |
595 | gettimeofday(&endtv, NULL); | |
596 | if (endtv.tv_sec - starttv.tv_sec > 1) { | |
597 | calibration_count /= 10; | |
598 | continue; | |
599 | } | |
600 | calibration_usec = endtv.tv_usec - starttv.tv_usec; | |
601 | if (endtv.tv_usec < starttv.tv_usec) { | |
602 | calibration_usec += 1000000; | |
603 | } | |
604 | if (calibration_usec < 1000) { | |
605 | calibration_count *= 10; | |
606 | continue; | |
607 | } | |
608 | calibration_count /= calibration_usec; | |
609 | break; | |
610 | } | |
3e170ce0 | 611 | if (verbose > 1) |
2d21ac55 A |
612 | printf("calibration_count=%d calibration_usec=%d\n", |
613 | calibration_count, calibration_usec); | |
614 | } | |
316670eb | 615 | return NULL; |
2d21ac55 A |
616 | } |
617 | ||
618 | static void * | |
619 | client_work(void) | |
620 | { | |
621 | ||
622 | if (client_spin) { | |
623 | client_spin_loop(calibration_count*client_spin, | |
624 | client_work_atom); | |
625 | } | |
626 | ||
627 | if (client_delay) { | |
628 | usleep(client_delay); | |
629 | } | |
316670eb | 630 | return NULL; |
2d21ac55 A |
631 | } |
632 | ||
633 | void *client(void *threadarg) | |
634 | { | |
635 | struct port_args args; | |
3e170ce0 | 636 | struct port_args *svr_args = NULL; |
2d21ac55 A |
637 | int idx; |
638 | mach_msg_header_t *req, *reply; | |
639 | mach_port_t bsport, servport; | |
640 | kern_return_t ret; | |
3e170ce0 | 641 | int server_num = (int)(uintptr_t)threadarg; |
2d21ac55 A |
642 | void *ints = malloc(sizeof(u_int32_t) * num_ints); |
643 | ||
644 | if (verbose) | |
645 | printf("client(%d) started, server port name %s\n", | |
646 | server_num, server_port_name[server_num]); | |
647 | ||
648 | args.server_num = server_num; | |
649 | thread_setup(server_num + 1); | |
650 | ||
3e170ce0 A |
651 | if (stress_prepost) |
652 | svr_args = &server_port_args[server_num]; | |
653 | ||
2d21ac55 A |
654 | /* find server port */ |
655 | ret = task_get_bootstrap_port(mach_task_self(), &bsport); | |
656 | if (KERN_SUCCESS != ret) { | |
657 | mach_error("task_get_bootstrap_port(): ", ret); | |
658 | exit(1); | |
659 | } | |
660 | ret = bootstrap_look_up(bsport, | |
661 | server_port_name[server_num], | |
662 | &servport); | |
663 | if (KERN_SUCCESS != ret) { | |
664 | mach_error("bootstrap_look_up(): ", ret); | |
665 | exit(1); | |
666 | } | |
667 | ||
668 | setup_client_ports(&args); | |
669 | ||
670 | /* Allocate and touch memory */ | |
671 | if (client_pages) { | |
672 | unsigned i; | |
673 | client_memory = (long *) malloc(client_pages * PAGE_SIZE); | |
674 | for (i = 0; i < client_pages; i++) | |
675 | client_memory[i * PAGE_SIZE / sizeof(long)] = 0; | |
676 | } | |
3e170ce0 A |
677 | |
678 | uint64_t starttm, endtm; | |
2d21ac55 A |
679 | |
680 | /* start message loop */ | |
681 | for (idx = 0; idx < num_msgs; idx++) { | |
682 | req = args.req_msg; | |
683 | reply = args.reply_msg; | |
684 | ||
2d21ac55 | 685 | req->msgh_size = args.req_size; |
3e170ce0 A |
686 | if (stress_prepost) { |
687 | req->msgh_remote_port = svr_args->port_list[idx % portcount]; | |
688 | } else { | |
689 | req->msgh_remote_port = servport; | |
690 | } | |
691 | if (oneway) { | |
692 | req->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_COPY_SEND, 0); | |
693 | req->msgh_local_port = MACH_PORT_NULL; | |
694 | } else { | |
695 | req->msgh_bits = MACH_MSGH_BITS(MACH_MSG_TYPE_COPY_SEND, | |
696 | MACH_MSG_TYPE_MAKE_SEND_ONCE); | |
697 | req->msgh_local_port = args.port; | |
698 | } | |
2d21ac55 | 699 | req->msgh_id = oneway ? 0 : 1; |
b0d623f7 A |
700 | if (msg_type == msg_type_complex) { |
701 | (req)->msgh_bits |= MACH_MSGH_BITS_COMPLEX; | |
702 | ((ipc_complex_message *)req)->body.msgh_descriptor_count = 1; | |
703 | ((ipc_complex_message *)req)->descriptor.address = ints; | |
704 | ((ipc_complex_message *)req)->descriptor.size = | |
705 | num_ints * sizeof(u_int32_t); | |
706 | ((ipc_complex_message *)req)->descriptor.deallocate = FALSE; | |
707 | ((ipc_complex_message *)req)->descriptor.copy = MACH_MSG_VIRTUAL_COPY; | |
708 | ((ipc_complex_message *)req)->descriptor.type = MACH_MSG_OOL_DESCRIPTOR; | |
2d21ac55 | 709 | } |
3e170ce0 A |
710 | if (verbose > 2) |
711 | printf("client sending message %d to port %#x\n", | |
712 | idx, req->msgh_remote_port); | |
713 | starttm = mach_absolute_time(); | |
2d21ac55 A |
714 | ret = mach_msg(req, |
715 | MACH_SEND_MSG, | |
716 | args.req_size, | |
717 | 0, | |
718 | MACH_PORT_NULL, | |
719 | MACH_MSG_TIMEOUT_NONE, | |
720 | MACH_PORT_NULL); | |
3e170ce0 | 721 | endtm = mach_absolute_time(); |
2d21ac55 A |
722 | if (MACH_MSG_SUCCESS != ret) { |
723 | mach_error("mach_msg (send): ", ret); | |
724 | fprintf(stderr, "bailing after %u iterations\n", idx); | |
725 | exit(1); | |
726 | break; | |
727 | } | |
3e170ce0 A |
728 | if (stress_prepost) |
729 | OSAtomicAdd64(endtm - starttm, &g_client_send_time); | |
730 | ||
2d21ac55 | 731 | if (!oneway) { |
3e170ce0 | 732 | if (verbose > 2) |
2d21ac55 A |
733 | printf("client awaiting reply %d\n", idx); |
734 | reply->msgh_bits = 0; | |
735 | reply->msgh_size = args.reply_size; | |
736 | reply->msgh_local_port = args.port; | |
737 | ret = mach_msg(args.reply_msg, | |
738 | MACH_RCV_MSG|MACH_RCV_INTERRUPT, | |
739 | 0, | |
740 | args.reply_size, | |
741 | args.port, | |
742 | MACH_MSG_TIMEOUT_NONE, | |
743 | MACH_PORT_NULL); | |
744 | if (MACH_MSG_SUCCESS != ret) { | |
745 | mach_error("mach_msg (receive): ", ret); | |
746 | fprintf(stderr, "bailing after %u iterations\n", | |
747 | idx); | |
748 | exit(1); | |
749 | } | |
3e170ce0 | 750 | if (verbose > 2) |
2d21ac55 A |
751 | printf("client received reply %d\n", idx); |
752 | } | |
753 | ||
754 | client_work(); | |
755 | } | |
756 | ||
757 | free(ints); | |
316670eb | 758 | return NULL; |
2d21ac55 A |
759 | } |
760 | ||
761 | static void | |
762 | thread_spawn(thread_id_t *thread, void *(fn)(void *), void *arg) { | |
763 | if (threaded) { | |
764 | kern_return_t ret; | |
765 | ret = pthread_create( | |
766 | &thread->tid, | |
767 | NULL, | |
768 | fn, | |
769 | arg); | |
770 | if (ret != 0) | |
771 | err(1, "pthread_create()"); | |
3e170ce0 | 772 | if (verbose > 1) |
316670eb | 773 | printf("created pthread %p\n", thread->tid); |
2d21ac55 A |
774 | } else { |
775 | thread->pid = fork(); | |
776 | if (thread->pid == 0) { | |
3e170ce0 | 777 | if (verbose > 1) |
316670eb | 778 | printf("calling %p(%p)\n", fn, arg); |
2d21ac55 A |
779 | fn(arg); |
780 | exit(0); | |
781 | } | |
3e170ce0 | 782 | if (verbose > 1) |
2d21ac55 A |
783 | printf("forked pid %d\n", thread->pid); |
784 | } | |
785 | } | |
786 | ||
787 | static void | |
788 | thread_join(thread_id_t *thread) { | |
789 | if (threaded) { | |
790 | kern_return_t ret; | |
3e170ce0 | 791 | if (verbose > 1) |
316670eb | 792 | printf("joining thread %p\n", thread->tid); |
2d21ac55 A |
793 | ret = pthread_join(thread->tid, NULL); |
794 | if (ret != KERN_SUCCESS) | |
316670eb | 795 | err(1, "pthread_join(%p)", thread->tid); |
2d21ac55 A |
796 | } else { |
797 | int stat; | |
3e170ce0 | 798 | if (verbose > 1) |
2d21ac55 A |
799 | printf("waiting for pid %d\n", thread->pid); |
800 | waitpid(thread->pid, &stat, 0); | |
801 | } | |
802 | } | |
803 | ||
804 | static void | |
805 | wait_for_servers(void) | |
806 | { | |
807 | int i; | |
808 | int retry_count = 10; | |
809 | mach_port_t bsport, servport; | |
810 | kern_return_t ret; | |
811 | ||
812 | /* find server port */ | |
813 | ret = task_get_bootstrap_port(mach_task_self(), &bsport); | |
814 | if (KERN_SUCCESS != ret) { | |
815 | mach_error("task_get_bootstrap_port(): ", ret); | |
816 | exit(1); | |
817 | } | |
818 | ||
819 | while (retry_count-- > 0) { | |
820 | for (i = 0; i < num_servers; i++) { | |
821 | ret = bootstrap_look_up(bsport, | |
822 | server_port_name[i], | |
823 | &servport); | |
824 | if (ret != KERN_SUCCESS) { | |
825 | break; | |
826 | } | |
827 | } | |
828 | if (ret == KERN_SUCCESS) | |
829 | return; | |
830 | usleep(100 * 1000); /* 100ms */ | |
831 | } | |
832 | fprintf(stderr, "Server(s) failed to register\n"); | |
833 | exit(1); | |
834 | } | |
835 | ||
836 | int main(int argc, char *argv[]) | |
837 | { | |
838 | int i; | |
839 | int j; | |
840 | thread_id_t *client_id; | |
841 | thread_id_t *server_id; | |
842 | ||
843 | signal(SIGINT, signal_handler); | |
844 | parse_args(argc, argv); | |
845 | ||
3e170ce0 A |
846 | if (mach_timebase_info(&g_timebase) != KERN_SUCCESS) { |
847 | fprintf(stderr, "Can't get mach_timebase_info!\n"); | |
848 | exit(1); | |
849 | } | |
850 | ||
2d21ac55 A |
851 | calibrate_client_work(); |
852 | ||
853 | /* | |
854 | * If we're using affinity create an empty namespace now | |
855 | * so this is shared by all our offspring. | |
856 | */ | |
857 | if (affinity) | |
858 | thread_setup(0); | |
859 | ||
860 | server_id = (thread_id_t *) malloc(num_servers * sizeof(thread_id_t)); | |
861 | server_port_name = (char **) malloc(num_servers * sizeof(char *)); | |
3e170ce0 A |
862 | server_port_args = (struct port_args *)calloc(sizeof(struct port_args), num_servers); |
863 | if (!server_id || !server_port_name || !server_port_args) { | |
864 | fprintf(stderr, "malloc/calloc of %d server book keeping structs failed\n", num_servers); | |
865 | exit(1); | |
866 | } | |
867 | ||
2d21ac55 A |
868 | if (verbose) |
869 | printf("creating %d servers\n", num_servers); | |
870 | for (i = 0; i < num_servers; i++) { | |
871 | server_port_name[i] = (char *) malloc(sizeof("PORT.pppppp.xx")); | |
872 | /* PORT names include pid of main process for disambiguation */ | |
873 | sprintf(server_port_name[i], "PORT.%06d.%02d", getpid(), i); | |
874 | thread_spawn(&server_id[i], server, (void *) (long) i); | |
875 | } | |
876 | ||
877 | int totalclients = num_servers * num_clients; | |
878 | int totalmsg = num_msgs * totalclients; | |
879 | struct timeval starttv, endtv, deltatv; | |
880 | ||
881 | /* | |
882 | * Wait for all servers to have registered all ports before starting | |
883 | * the clients and the clock. | |
884 | */ | |
885 | wait_for_servers(); | |
886 | ||
887 | printf("%d server%s, %d client%s per server (%d total) %u messages...", | |
888 | num_servers, (num_servers > 1)? "s" : "", | |
889 | num_clients, (num_clients > 1)? "s" : "", | |
890 | totalclients, | |
891 | totalmsg); | |
892 | fflush(stdout); | |
893 | ||
894 | /* Call gettimeofday() once and throw away result; some implementations | |
895 | * (like Mach's) cache some time zone info on first call. | |
896 | */ | |
897 | gettimeofday(&starttv, NULL); | |
898 | gettimeofday(&starttv, NULL); | |
899 | ||
900 | client_id = (thread_id_t *) malloc(totalclients * sizeof(thread_id_t)); | |
901 | if (verbose) | |
902 | printf("creating %d clients\n", totalclients); | |
903 | for (i = 0; i < num_servers; i++) { | |
904 | for (j = 0; j < num_clients; j++) { | |
905 | thread_spawn( | |
906 | &client_id[(i*num_clients) + j], | |
907 | client, | |
908 | (void *) (long) i); | |
909 | } | |
910 | } | |
911 | ||
912 | /* Wait for servers to complete */ | |
913 | for (i = 0; i < num_servers; i++) { | |
914 | thread_join(&server_id[i]); | |
915 | } | |
916 | ||
917 | gettimeofday(&endtv, NULL); | |
3e170ce0 A |
918 | if (verbose) |
919 | printf("all servers complete: waiting for clients...\n"); | |
2d21ac55 A |
920 | |
921 | for (i = 0; i < totalclients; i++) { | |
922 | thread_join(&client_id[i]); | |
923 | } | |
924 | ||
925 | /* report results */ | |
926 | deltatv.tv_sec = endtv.tv_sec - starttv.tv_sec; | |
927 | deltatv.tv_usec = endtv.tv_usec - starttv.tv_usec; | |
928 | if (endtv.tv_usec < starttv.tv_usec) { | |
929 | deltatv.tv_sec--; | |
930 | deltatv.tv_usec += 1000000; | |
931 | } | |
932 | ||
933 | double dsecs = (double) deltatv.tv_sec + | |
934 | 1.0E-6 * (double) deltatv.tv_usec; | |
935 | ||
3e170ce0 | 936 | printf(" in %lu.%03u seconds\n", |
2d21ac55 A |
937 | deltatv.tv_sec, deltatv.tv_usec/1000); |
938 | printf(" throughput in messages/sec: %g\n", | |
939 | (double)totalmsg / dsecs); | |
940 | printf(" average message latency (usec): %2.3g\n", | |
941 | dsecs * 1.0E6 / (double) totalmsg); | |
942 | ||
3e170ce0 A |
943 | if (stress_prepost) { |
944 | int64_t sendns = abs_to_ns(g_client_send_time); | |
945 | dsecs = (double)sendns / (double)NSEC_PER_SEC; | |
946 | printf(" total send time: %2.3gs\n", dsecs); | |
947 | printf(" average send time (usec): %2.3g\n", | |
948 | dsecs * 1.0E6 / (double)totalmsg); | |
949 | } | |
950 | ||
2d21ac55 A |
951 | return (0); |
952 | ||
953 | } |