]>
git.saurik.com Git - apple/xnu.git/blob - bsd/dev/unix_startup.c
2 * Copyright (c) 2000-2014 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 * Copyright (c) 1992,7 NeXT Computer, Inc.
31 * Unix data structure initialization.
35 #include <mach/mach_types.h>
37 #include <vm/vm_kern.h>
38 #include <mach/vm_prot.h>
40 #include <sys/param.h>
41 #include <sys/buf_internal.h>
42 #include <sys/file_internal.h>
43 #include <sys/proc_internal.h>
44 #include <sys/clist.h>
45 #include <sys/mcache.h>
47 #include <sys/systm.h>
49 #include <sys/vnode.h>
50 #include <sys/sysctl.h>
51 #include <machine/cons.h>
52 #include <pexpert/pexpert.h>
53 #include <sys/socketvar.h>
54 #include <pexpert/pexpert.h>
55 #include <netinet/tcp_var.h>
/* External declarations of kernel globals (vnode limit, mbuf map, TCP buffer sizes). */
57 extern uint32_t kern_maxvnodes
;
58 extern vm_map_t mb_map
;
/* tcp_sendspace and tcp_recvspace are scaled and clamped in bsd_startupearly. */
61 extern uint32_t tcp_sendspace
;
62 extern uint32_t tcp_recvspace
;
/*
 * Prototypes for the startup routines handled in this file.
 * bsd_mbuf_cluster_reserve takes an optional out-flag pointer and returns
 * the mbuf pool size; bsd_exec_setup is only called here (at the end of
 * bsd_scale_setup) and its definition is not visible in this extract.
 */
65 void bsd_bufferinit(void);
67 unsigned int bsd_mbuf_cluster_reserve(boolean_t
*);
68 void bsd_scale_setup(int);
69 void bsd_exec_setup(int);
/*
 * Buffer-cache tunables and file-scope state.
 *
 * NOTE(review): two alternative initializer sets are visible below (one
 * seeded from NBUF, one seeded with 0). The conditional-compilation lines
 * that select between them are not present in this extract, and only the
 * NBUF set shows a definition of nbuf_headers -- confirm against the
 * complete file.
 */
72 * Declare these as initialized data so we can patch them.
/* Variant seeded from the NBUF constant. */
76 int max_nbuf_headers
= NBUF
;
77 int niobuf_headers
= (NBUF
/ 2) + 2048;
78 int nbuf_hashelements
= NBUF
;
79 int nbuf_headers
= NBUF
;
/* Variant seeded with 0; bsd_startupearly treats 0 as "compute a default". */
81 int max_nbuf_headers
= 0;
82 int niobuf_headers
= 0;
83 int nbuf_hashelements
= 0;
/* Read-only sysctl node "nbuf" under _kern, backed by nbuf_headers. */
87 SYSCTL_INT (_kern
, OID_AUTO
, nbuf
, CTLFLAG_RD
| CTLFLAG_LOCKED
, &nbuf_headers
, 0, "");
/* Read-write sysctl node "maxnbuf" under _kern, backed by max_nbuf_headers. */
88 SYSCTL_INT (_kern
, OID_AUTO
, maxnbuf
, CTLFLAG_RW
| CTLFLAG_LOCKED
, &max_nbuf_headers
, 0, "");
/* When non-zero, bsd_startupearly skips its 16384 clip on max_nbuf_headers. */
90 __private_extern__
int customnbuf
= 0;
91 int serverperfmode
= 0; /* Flag indicates a server boot when set */
/* Cached result of bsd_mbuf_cluster_reserve; 0 means "not computed yet". */
95 static unsigned int mbuf_poolsz
;
/* Submap created in bsd_startupearly to hold the buf header array. */
99 vm_map_t bufferhdr_map
;
/* bsd_startupearly only sizes desiredvnodes while this flag is still 0. */
100 static int vnodes_sized
= 0;
/*
 * bsd_startupearly: early sizing of BSD data structures.
 *
 * Visible steps, in order:
 *   1. Derive max_nbuf_headers, nbuf_hashelements and niobuf_headers from
 *      sane_size when they were left at 0, applying fixed clips and the
 *      CONFIG_MIN_NBUF / CONFIG_MIN_NIOBUF floors.
 *   2. Create the bufferhdr_map submap of kernel_map, allocate the buf
 *      header array in it and zero it; panic if either step fails.
 *   3. Scale tcp_sendspace / tcp_recvspace by nmbclusters / NMBCLUSTERS and
 *      clamp both to maxspace.
 *   4. Size desiredvnodes from memory unless already sized or overridden
 *      through PE_get_default("kern.maxvnodes").
 *
 * NOTE(review): this extract is missing many original lines (return type,
 * braces, else keywords, local declarations of size/ret/scale, several call
 * arguments and preprocessor guards). Comments below describe only what is
 * visible; confirm structure against the complete file.
 */
102 extern void bsd_startupearly(void);
105 bsd_startupearly(void)
107 vm_offset_t firstaddr
;
111 /* clip the number of buf headers up to 16k */
112 if (max_nbuf_headers
== 0)
113 max_nbuf_headers
= atop_kernel(sane_size
/ 50); /* Get 2% of ram, but no more than we can map */
/* The 16384 clip applies only when customnbuf is 0. */
114 if ((customnbuf
== 0) && (max_nbuf_headers
> 16384))
115 max_nbuf_headers
= 16384;
/* Enforce the configured minimum regardless of how the value was obtained. */
116 if (max_nbuf_headers
< CONFIG_MIN_NBUF
)
117 max_nbuf_headers
= CONFIG_MIN_NBUF
;
119 /* clip the number of hash elements to 200000 */
120 if ( (customnbuf
== 0 ) && nbuf_hashelements
== 0) {
121 nbuf_hashelements
= atop_kernel(sane_size
/ 50);
122 if (nbuf_hashelements
> 200000)
123 nbuf_hashelements
= 200000;
/* NOTE(review): presumably the else branch of the test above; the else line is not in this extract. */
125 nbuf_hashelements
= max_nbuf_headers
;
/* Default niobuf_headers from max_nbuf_headers when it was left at 0. */
127 if (niobuf_headers
== 0) {
128 if (max_nbuf_headers
< 4096)
129 niobuf_headers
= max_nbuf_headers
;
/* NOTE(review): presumably the else branch for max_nbuf_headers >= 4096; the else line is not in this extract. */
131 niobuf_headers
= (max_nbuf_headers
/ 2) + 2048;
133 if (niobuf_headers
< CONFIG_MIN_NIOBUF
)
134 niobuf_headers
= CONFIG_MIN_NIOBUF
;
/* Bytes needed for all regular plus I/O buf headers, rounded up to whole pages. */
136 size
= (max_nbuf_headers
+ niobuf_headers
) * sizeof(struct buf
);
137 size
= round_page(size
);
/* Create the submap; some argument lines of this call are not present in this extract. */
139 ret
= kmem_suballoc(kernel_map
,
143 VM_FLAGS_ANYWHERE
| VM_MAKE_TAG(VM_KERN_MEMORY_FILE
),
146 if (ret
!= KERN_SUCCESS
)
147 panic("Failed to create bufferhdr_map");
/* Allocate the header storage inside bufferhdr_map; some argument lines are not present in this extract. */
149 ret
= kernel_memory_allocate(bufferhdr_map
,
153 KMA_HERE
| KMA_KOBJECT
,
154 VM_KERN_MEMORY_FILE
);
156 if (ret
!= KERN_SUCCESS
)
157 panic("Failed to allocate bufferhdr_map");
/* Treat the allocation at firstaddr as the buf header array and clear it. */
159 buf_headers
= (struct buf
*) firstaddr
;
160 bzero(buf_headers
, size
);
/* Upper bound applied to both TCP socket buffer defaults below. */
164 static const unsigned int maxspace
= 128 * 1024;
/* bsd_mbuf_cluster_reserve returns the pool size; dividing by MCLBYTES yields a cluster count. */
167 nmbclusters
= bsd_mbuf_cluster_reserve(NULL
) / MCLBYTES
;
/* Scale the TCP buffer defaults only when the cluster count is at least twice NMBCLUSTERS. */
170 if ((scale
= nmbclusters
/ NMBCLUSTERS
) > 1) {
171 tcp_sendspace
*= scale
;
172 tcp_recvspace
*= scale
;
174 if (tcp_sendspace
> maxspace
)
175 tcp_sendspace
= maxspace
;
176 if (tcp_recvspace
> maxspace
)
177 tcp_recvspace
= maxspace
;
/* NOTE(review): the matching #if for this #endif is not present in this extract. */
179 #endif /* INET || INET6 */
/* Size desiredvnodes only if nothing has sized it yet and no platform default overrides it. */
183 if (vnodes_sized
== 0) {
184 if (!PE_get_default("kern.maxvnodes", &desiredvnodes
, sizeof(desiredvnodes
))) {
186 * Size vnodes based on memory
187 * Number vnodes is (memsize/64k) + 1024
188 * This is the calculation that is used by launchd in tiger
189 * we are clipping the max based on 16G
190 * ie ((16*1024*1024*1024)/(64 *1024)) + 1024 = 263168;
191 * CONFIG_VNODES is set to 263168 for "medium" configurations (the default)
192 * but can be smaller or larger.
194 desiredvnodes
= (sane_size
/65536) + 1024;
196 if (desiredvnodes
> CONFIG_VNODES
)
197 desiredvnodes
= CONFIG_VNODES
;
/*
 * Fragment that carves the mbuf submap out of kernel_map.
 *
 * NOTE(review): the enclosing function header is not present in this
 * extract; given the prototype declared earlier this is presumably the body
 * of bsd_bufferinit -- confirm against the complete file. Several lines
 * (including some kmem_suballoc arguments) are also missing.
 *
 * Visible behaviour: request a submap of nmbclusters * MCLBYTES bytes, with
 * its base address stored through &mbutl and tagged VM_KERN_MEMORY_MBUF;
 * panic if the call does not return KERN_SUCCESS.
 */
211 * Note: Console device initialized in kminit() from bsd_autoconf()
212 * prior to call to us in bsd_init().
218 ret
= kmem_suballoc(kernel_map
,
219 (vm_offset_t
*) &mbutl
,
220 (vm_size_t
) (nmbclusters
* MCLBYTES
),
222 VM_FLAGS_ANYWHERE
| VM_MAKE_TAG(VM_KERN_MEMORY_MBUF
),
225 if (ret
!= KERN_SUCCESS
)
226 panic("Failed to allocate mb_map\n");
230 * Set up buffers, so they can be used to read disk labels.
235 /* 512 MB (K32) or 2 GB (K64) hard limit on size of the mbuf pool */
/* Non-LP64 builds: 512 shifted by MBSHIFT. */
236 #if !defined(__LP64__)
237 #define MAX_MBUF_POOL (512 << MBSHIFT)
/* NOTE(review): an #else separating the two definitions appears to be missing from this extract. */
/* LP64 builds: 2 shifted by GBSHIFT, using an unsigned long long constant. */
239 #define MAX_MBUF_POOL (2ULL << GBSHIFT)
240 #endif /* !__LP64__ */
/* The same limit expressed as a cluster count (pool size shifted right by MCLSHIFT). */
241 #define MAX_NCL (MAX_MBUF_POOL >> MCLSHIFT)
/*
 * bsd_mbuf_cluster_reserve: compute the size of the mbuf pool.
 *
 * Visible behaviour:
 *   - The result is cached in mbuf_poolsz; a non-zero cached value
 *     short-circuits the computation on later calls.
 *   - The "ncl" and "mbuf_pool" boot-args are parsed here. mbuf_pool is
 *     converted to a cluster count via (mbuf_pool << MBSHIFT) >> MCLSHIFT.
 *   - When sane_size exceeds 64 MB or ncl is non-zero: was_overridden is set
 *     if ncl or serverperfmode is non-zero, and nmbclusters is taken from
 *     ncl or, when ncl is 0, from mbuf_default_ncl(serverperfmode, sane_size).
 *     It is then capped at MAX_NCL.
 *   - nmbclusters is rounded down to a multiple of NCLPG, and mbuf_poolsz is
 *     set to nmbclusters << MCLSHIFT.
 *   - was_overridden is stored through the overridden pointer, and
 *     mbuf_poolsz is returned.
 *
 * NOTE(review): this extract is missing lines (return type, braces, local
 * declarations of ncl and mbuf_pool, the early return, the guard around the
 * mbuf_pool conversion, and the statement that makes an odd count even).
 * bsd_startupearly calls this routine with NULL, so the store through
 * overridden is presumably guarded by a NULL check on a line that is not
 * visible here -- confirm against the complete file.
 */
245 * this has been broken out into a separate routine that
246 * can be called from the x86 early vm initialization to
247 * determine how much lo memory to reserve on systems with
248 * DMA hardware that can't fully address all of the physical
249 * memory that is present.
252 bsd_mbuf_cluster_reserve(boolean_t
*overridden
)
255 static boolean_t was_overridden
= FALSE
;
257 /* If called more than once, return the previously calculated size */
258 if (mbuf_poolsz
!= 0)
262 * Some of these are parsed in parse_bsd_args(), but for x86 we get
263 * here early from i386_vm_init() and so we parse them now, in order
264 * to correctly compute the size of the low-memory VM pool. It is
265 * redundant but rather harmless.
267 (void) PE_parse_boot_argn("ncl", &ncl
, sizeof (ncl
));
268 (void) PE_parse_boot_argn("mbuf_pool", &mbuf_pool
, sizeof (mbuf_pool
));
271 * Convert "mbuf_pool" from MB to # of 2KB clusters; it is
272 * equivalent to "ncl", except that it uses different unit.
275 ncl
= (mbuf_pool
<< MBSHIFT
) >> MCLSHIFT
;
277 if (sane_size
> (64 * 1024 * 1024) || ncl
!= 0) {
279 if (ncl
|| serverperfmode
)
280 was_overridden
= TRUE
;
282 if ((nmbclusters
= ncl
) == 0) {
283 /* Auto-configure the mbuf pool size */
284 nmbclusters
= mbuf_default_ncl(serverperfmode
, sane_size
);
286 /* Make sure it's not odd in case ncl is manually set */
287 if (nmbclusters
& 0x1)
/* NOTE(review): the statement executed for an odd count is not present in this extract. */
290 /* And obey the upper limit */
291 if (nmbclusters
> MAX_NCL
)
292 nmbclusters
= MAX_NCL
;
295 /* Round it down to nearest multiple of PAGE_SIZE */
296 nmbclusters
= P2ROUNDDOWN(nmbclusters
, NCLPG
);
/* Convert the final cluster count back into a pool size and cache it. */
298 mbuf_poolsz
= nmbclusters
<< MCLSHIFT
;
/* Report whether a boot-arg or server mode influenced the result. */
301 *overridden
= was_overridden
;
303 return (mbuf_poolsz
);
/*
 * Socket tunables adjusted by bsd_scale_setup, declared only for LP64 builds.
 * NOTE(review): the closing #endif for this conditional is not present in
 * this extract.
 */
307 #if defined(__LP64__)
308 extern int tcp_tcbhashsize
;
309 extern int max_cached_sock_count
;
/*
 * bsd_scale_setup: scale process, file, vnode and socket limits.
 *
 * scale: scaling factor supplied by the caller. The in-code comments relate
 *        scale > 4 to more than 32G.
 *
 * Visible behaviour (inside the LP64 conditional):
 *   - scale > 0 and serverperfmode == 0: maxprocperuid becomes two thirds of
 *     maxproc.
 *   - scale > 0 and serverperfmode != 0: maxproc, hard_maxproc,
 *     maxprocperuid, maxfiles, maxfilesperproc, desiredvnodes,
 *     tcp_tfo_backlog, somaxconn, tcp_tcbhashsize and max_cached_sock_count
 *     are set from scale, with clips applied at larger scales.
 *   - hard_maxproc is raised to maxproc if it is smaller.
 * Finally bsd_exec_setup(scale) is called.
 *
 * NOTE(review): this extract is missing lines (return type, braces, the
 * nested if/else tests that choose between the clipped and scaled socket
 * values, some assignments, and the closing #endif). The branch structure
 * noted below is inferred from the in-code comments -- confirm against the
 * complete file.
 */
314 bsd_scale_setup(int scale
)
316 #if defined(__LP64__)
/* Non-server scaling. */
317 if ((scale
> 0) && (serverperfmode
== 0)) {
319 maxprocperuid
= (maxproc
* 2) / 3;
321 /* Apply server scaling rules */
322 if ((scale
> 0) && (serverperfmode
!=0)) {
323 maxproc
= 2500 * scale
;
324 hard_maxproc
= maxproc
;
/* Integer arithmetic only: three quarters of maxproc. */
326 maxprocperuid
= (maxproc
*3)/4;
327 maxfiles
= (150000 * scale
);
328 maxfilesperproc
= maxfiles
/2;
329 desiredvnodes
= maxfiles
;
331 tcp_tfo_backlog
= 100 * scale
;
/* NOTE(review): the test selecting the clipped values below is not present in this extract. */
333 /* clip somaxconn at 32G level */
336 * For scale > 4 (> 32G), clip
337 * tcp_tcbhashsize to 32K
339 tcp_tcbhashsize
= 32 *1024;
342 /* clip at 64G level */
343 max_cached_sock_count
= 165000;
345 max_cached_sock_count
= 60000 + ((scale
-1) * 15000);
/* Unclipped values, each a linear function of scale. */
348 somaxconn
= 512*scale
;
349 tcp_tcbhashsize
= 4*1024*scale
;
350 max_cached_sock_count
= 60000 + ((scale
-1) * 15000);
/* Keep hard_maxproc from falling below maxproc. */
354 if(maxproc
> hard_maxproc
) {
355 hard_maxproc
= maxproc
;
/* Hand the same scale factor to the exec subsystem setup. */
358 bsd_exec_setup(scale
);