]>
git.saurik.com Git - apple/xnu.git/blob - bsd/dev/unix_startup.c
2 * Copyright (c) 2000-2014 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 * Copyright (c) 1992,7 NeXT Computer, Inc.
31 * Unix data structure initialization.
35 #include <mach/mach_types.h>
37 #include <kern/startup.h>
38 #include <vm/vm_kern.h>
39 #include <mach/vm_prot.h>
41 #include <sys/param.h>
42 #include <sys/buf_internal.h>
43 #include <sys/file_internal.h>
44 #include <sys/proc_internal.h>
45 #include <sys/mcache.h>
47 #include <sys/systm.h>
49 #include <sys/vnode.h>
50 #include <sys/sysctl.h>
51 #include <machine/cons.h>
52 #include <pexpert/pexpert.h>
53 #include <sys/socketvar.h>
54 #include <pexpert/pexpert.h>
55 #include <netinet/tcp_var.h>
57 extern uint32_t kern_maxvnodes
;
58 extern vm_map_t mb_map
;
61 extern uint32_t tcp_sendspace
;
62 extern uint32_t tcp_recvspace
;
65 void bsd_bufferinit(void);
67 unsigned int bsd_mbuf_cluster_reserve(boolean_t
*);
68 void bsd_scale_setup(int);
69 void bsd_exec_setup(int);
72 * Declare these as initialized data so we can patch them.
76 int max_nbuf_headers
= NBUF
;
77 int niobuf_headers
= (NBUF
/ 2) + 2048;
78 int nbuf_hashelements
= NBUF
;
79 int nbuf_headers
= NBUF
;
81 int max_nbuf_headers
= 0;
82 int niobuf_headers
= 0;
83 int nbuf_hashelements
= 0;
87 SYSCTL_INT(_kern
, OID_AUTO
, nbuf
, CTLFLAG_RD
| CTLFLAG_LOCKED
, &nbuf_headers
, 0, "");
88 SYSCTL_INT(_kern
, OID_AUTO
, maxnbuf
, CTLFLAG_RW
| CTLFLAG_LOCKED
| CTLFLAG_KERN
, &max_nbuf_headers
, 0, "");
90 __private_extern__
int customnbuf
= 0;
93 /* Indicates a server boot when set */
94 TUNABLE(int, serverperfmode
, "serverperfmode", 0);
97 static unsigned int mbuf_poolsz
;
101 vm_map_t bufferhdr_map
;
102 static int vnodes_sized
= 0;
104 extern void bsd_startupearly(void);
107 bsd_startupearly(void)
109 vm_offset_t firstaddr
;
113 /* clip the number of buf headers to at most 16k */
114 if (max_nbuf_headers
== 0) {
115 max_nbuf_headers
= (int)atop_kernel(sane_size
/ 50); /* Get 2% of ram, but no more than we can map */
117 if ((customnbuf
== 0) && ((unsigned int)max_nbuf_headers
> 16384)) {
118 max_nbuf_headers
= 16384;
120 if (max_nbuf_headers
< CONFIG_MIN_NBUF
) {
121 max_nbuf_headers
= CONFIG_MIN_NBUF
;
124 /* clip the number of hash elements to 200000 */
125 if ((customnbuf
== 0) && nbuf_hashelements
== 0) {
126 nbuf_hashelements
= (int)atop_kernel(sane_size
/ 50);
127 if ((unsigned int)nbuf_hashelements
> 200000) {
128 nbuf_hashelements
= 200000;
131 nbuf_hashelements
= max_nbuf_headers
;
134 if (niobuf_headers
== 0) {
135 if (max_nbuf_headers
< 4096) {
136 niobuf_headers
= max_nbuf_headers
;
138 niobuf_headers
= (max_nbuf_headers
/ 2) + 2048;
141 if (niobuf_headers
< CONFIG_MIN_NIOBUF
) {
142 niobuf_headers
= CONFIG_MIN_NIOBUF
;
145 size
= (max_nbuf_headers
+ niobuf_headers
) * sizeof(struct buf
);
146 size
= round_page(size
);
148 ret
= kmem_suballoc(kernel_map
,
153 VM_MAP_KERNEL_FLAGS_NONE
,
157 if (ret
!= KERN_SUCCESS
) {
158 panic("Failed to create bufferhdr_map");
161 ret
= kernel_memory_allocate(bufferhdr_map
,
165 KMA_HERE
| KMA_KOBJECT
,
166 VM_KERN_MEMORY_FILE
);
168 if (ret
!= KERN_SUCCESS
) {
169 panic("Failed to allocate bufferhdr_map");
172 buf_headers
= (struct buf
*) firstaddr
;
173 bzero(buf_headers
, size
);
177 static const unsigned int maxspace
= 128 * 1024;
180 nmbclusters
= bsd_mbuf_cluster_reserve(NULL
) / MCLBYTES
;
183 if ((scale
= nmbclusters
/ NMBCLUSTERS
) > 1) {
184 tcp_sendspace
*= scale
;
185 tcp_recvspace
*= scale
;
187 if (tcp_sendspace
> maxspace
) {
188 tcp_sendspace
= maxspace
;
190 if (tcp_recvspace
> maxspace
) {
191 tcp_recvspace
= maxspace
;
198 if (vnodes_sized
== 0) {
199 if (!PE_get_default("kern.maxvnodes", &desiredvnodes
, sizeof(desiredvnodes
))) {
201 * Size vnodes based on memory
202 * The number of vnodes is (memsize/64k) + 1024.
203 * This is the calculation that is used by launchd in Tiger;
204 * we are clipping the max based on 16G,
205 * i.e. ((16*1024*1024*1024)/(64 *1024)) + 1024 = 263168;
206 * CONFIG_VNODES is set to 263168 for "medium" configurations (the default)
207 * but can be smaller or larger.
209 desiredvnodes
= (int)(sane_size
/ 65536) + 1024;
211 if (desiredvnodes
> CONFIG_VNODES
) {
212 desiredvnodes
= CONFIG_VNODES
;
227 * Note: Console device initialized in kminit() from bsd_autoconf()
228 * prior to call to us in bsd_init().
234 ret
= kmem_suballoc(kernel_map
,
235 (vm_offset_t
*) &mbutl
,
236 (vm_size_t
) (nmbclusters
* MCLBYTES
),
239 VM_MAP_KERNEL_FLAGS_NONE
,
243 if (ret
!= KERN_SUCCESS
) {
244 panic("Failed to allocate mb_map\n");
249 * Set up buffers, so they can be used to read disk labels.
254 /* 512 MB (K32) or 2 GB (K64) hard limit on size of the mbuf pool */
255 #if !defined(__LP64__)
256 #define MAX_MBUF_POOL (512 << MBSHIFT)
258 #define MAX_MBUF_POOL (2ULL << GBSHIFT)
259 #endif /* !__LP64__ */
260 #define MAX_NCL (MAX_MBUF_POOL >> MCLSHIFT)
264 * This has been broken out into a separate routine that
265 * can be called from the x86 early VM initialization to
266 * determine how much low memory to reserve on systems with
267 * DMA hardware that can't fully address all of the physical
268 * memory that is present.
271 bsd_mbuf_cluster_reserve(boolean_t
*overridden
)
274 static boolean_t was_overridden
= FALSE
;
276 /* If called more than once, return the previously calculated size */
277 if (mbuf_poolsz
!= 0) {
282 * Some of these are parsed in parse_bsd_args(), but for x86 we get
283 * here early from i386_vm_init() and so we parse them now, in order
284 * to correctly compute the size of the low-memory VM pool. It is
285 * redundant but rather harmless.
287 (void) PE_parse_boot_argn("ncl", &ncl
, sizeof(ncl
));
288 (void) PE_parse_boot_argn("mbuf_pool", &mbuf_pool
, sizeof(mbuf_pool
));
291 * Convert "mbuf_pool" from MB to # of 2KB clusters; it is
292 * equivalent to "ncl", except that it uses a different unit.
294 if (mbuf_pool
!= 0) {
295 ncl
= (mbuf_pool
<< MBSHIFT
) >> MCLSHIFT
;
298 if (sane_size
> (64 * 1024 * 1024) || ncl
!= 0) {
299 if (ncl
|| serverperfmode
) {
300 was_overridden
= TRUE
;
303 if ((nmbclusters
= ncl
) == 0) {
304 /* Auto-configure the mbuf pool size */
305 nmbclusters
= mbuf_default_ncl(mem_actual
);
307 /* Make sure it's not odd in case ncl is manually set */
308 if (nmbclusters
& 0x1) {
312 /* And obey the upper limit */
313 if (nmbclusters
> MAX_NCL
) {
314 nmbclusters
= MAX_NCL
;
318 /* Round it down to nearest multiple of PAGE_SIZE */
319 nmbclusters
= (unsigned int)P2ROUNDDOWN(nmbclusters
, NCLPG
);
321 mbuf_poolsz
= nmbclusters
<< MCLSHIFT
;
324 *overridden
= was_overridden
;
331 #if defined(__LP64__)
332 extern int tcp_tcbhashsize
;
333 extern int max_cached_sock_count
;
338 bsd_scale_setup(int scale
)
340 #if defined(__LP64__)
341 if ((scale
> 0) && (serverperfmode
== 0)) {
343 maxprocperuid
= (maxproc
* 2) / 3;
346 maxfilesperproc
= maxfiles
/ 2;
349 /* Apply server scaling rules */
350 if ((scale
> 0) && (serverperfmode
!= 0)) {
351 maxproc
= 2500 * scale
;
352 hard_maxproc
= maxproc
;
354 maxprocperuid
= (maxproc
* 3) / 4;
355 maxfiles
= (150000 * scale
);
356 maxfilesperproc
= maxfiles
/ 2;
357 desiredvnodes
= maxfiles
;
359 tcp_tfo_backlog
= 100 * scale
;
361 /* clip somaxconn at 32G level */
364 * For scale > 4 (> 32G), clip
365 * tcp_tcbhashsize to 32K
367 tcp_tcbhashsize
= 32 * 1024;
370 /* clip at 64G level */
371 max_cached_sock_count
= 165000;
373 max_cached_sock_count
= 60000 + ((scale
- 1) * 15000);
376 somaxconn
= 512 * scale
;
377 tcp_tcbhashsize
= 4 * 1024 * scale
;
378 max_cached_sock_count
= 60000 + ((scale
- 1) * 15000);
382 if (maxproc
> hard_maxproc
) {
383 hard_maxproc
= maxproc
;
386 bsd_exec_setup(scale
);