2 * Copyright (c) 2000-2019 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 * Copyright (c) 1982, 1986, 1989, 1991, 1992, 1993
30 * The Regents of the University of California. All rights reserved.
31 * (c) UNIX System Laboratories, Inc.
32 * All or some portions of this file are derived from material licensed
33 * to the University of California by American Telephone and Telegraph
34 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
35 * the permission of UNIX System Laboratories, Inc.
37 * Redistribution and use in source and binary forms, with or without
38 * modification, are permitted provided that the following conditions
40 * 1. Redistributions of source code must retain the above copyright
41 * notice, this list of conditions and the following disclaimer.
42 * 2. Redistributions in binary form must reproduce the above copyright
43 * notice, this list of conditions and the following disclaimer in the
44 * documentation and/or other materials provided with the distribution.
45 * 3. All advertising materials mentioning features or use of this software
46 * must display the following acknowledgement:
47 * This product includes software developed by the University of
48 * California, Berkeley and its contributors.
49 * 4. Neither the name of the University nor the names of its contributors
50 * may be used to endorse or promote products derived from this software
51 * without specific prior written permission.
53 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
54 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
55 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
56 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
57 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
58 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
59 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
60 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
61 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
62 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
65 * @(#)init_main.c 8.16 (Berkeley) 5/14/95
70 * Mach Operating System
71 * Copyright (c) 1987 Carnegie-Mellon University
72 * All rights reserved. The CMU software License Agreement specifies
73 * the terms and conditions for use and redistribution.
76 * NOTICE: This file was modified by McAfee Research in 2004 to introduce
77 * support for mandatory and extensible security protections. This notice
78 * is included in support of clause 2.2 (b) of the Apple Public License,
82 #include <sys/param.h>
83 #include <sys/filedesc.h>
84 #include <sys/kernel.h>
85 #include <sys/mount_internal.h>
86 #include <sys/proc_internal.h>
87 #include <sys/kauth.h>
88 #include <sys/systm.h>
89 #include <sys/vnode_internal.h>
91 #include <sys/buf_internal.h>
92 #include <sys/clist.h>
95 #include <sys/systm.h>
99 #include <security/audit/audit.h>
101 #include <sys/malloc.h>
102 #include <sys/dkstat.h>
103 #include <sys/codesign.h>
105 #include <kern/startup.h>
106 #include <kern/thread.h>
107 #include <kern/task.h>
108 #include <kern/ast.h>
109 #include <kern/kalloc.h>
110 #include <kern/ux_handler.h> /* for ux_handler_setup() */
112 #include <mach/vm_param.h>
114 #include <vm/vm_map.h>
115 #include <vm/vm_kern.h>
117 #include <sys/reboot.h>
118 #include <dev/busvar.h> /* for pseudo_inits */
119 #include <sys/kdebug.h>
120 #include <sys/monotonic.h>
121 #include <sys/reason.h>
123 #include <mach/mach_types.h>
124 #include <mach/vm_prot.h>
125 #include <mach/semaphore.h>
126 #include <mach/sync_policy.h>
127 #include <kern/clock.h>
128 #include <mach/kern_return.h>
129 #include <mach/thread_act.h> /* for thread_resume() */
130 #include <sys/ubc_internal.h> /* for ubc_init() */
131 #include <sys/mcache.h> /* for mcache_init() */
132 #include <sys/mbuf.h> /* for mbinit() */
133 #include <sys/event.h> /* for knote_init() */
134 #include <sys/eventhandler.h> /* for eventhandler_init() */
135 #include <sys/kern_memorystatus.h> /* for memorystatus_init() */
136 #include <sys/kern_memorystatus_freeze.h> /* for memorystatus_freeze_init() */
137 #include <sys/aio_kern.h> /* for aio_init() */
138 #include <sys/semaphore.h> /* for psem_cache_init() */
139 #include <net/dlil.h> /* for dlil_init() */
140 #include <net/kpi_protocol.h> /* for proto_kpi_init() */
141 #include <net/iptap.h> /* for iptap_init() */
142 #include <sys/pipe.h> /* for pipeinit() */
143 #include <sys/socketvar.h> /* for socketinit() */
144 #include <sys/protosw.h> /* for domaininit() */
145 #include <kern/sched_prim.h> /* for thread_wakeup() */
146 #include <net/if_ether.h> /* for ether_family_init() */
147 #include <net/if_gif.h> /* for gif_init() */
148 #include <vm/vm_protos.h> /* for vnode_pager_bootstrap() */
149 #include <miscfs/devfs/devfsdefs.h> /* for devfs_kernel_mount() */
150 #include <vm/vm_kern.h> /* for kmem_suballoc() */
151 #include <sys/semaphore.h> /* for psem_lock_init() */
152 #include <sys/msgbuf.h> /* for log_setsize() */
153 #include <sys/tty.h> /* for tty_init() */
154 #include <sys/proc_uuid_policy.h> /* proc_uuid_policy_init() */
155 #include <netinet/flow_divert.h> /* flow_divert_init() */
156 #include <net/content_filter.h> /* for cfil_init() */
157 #include <net/necp.h> /* for necp_init() */
158 #include <net/network_agent.h> /* for netagent_init() */
159 #include <net/packet_mangler.h> /* for pkt_mnglr_init() */
160 #include <net/if_utun.h> /* for utun_register_control() */
161 #include <net/if_ipsec.h> /* for ipsec_register_control() */
162 #include <net/net_str_id.h> /* for net_str_id_init() */
163 #include <net/netsrc.h> /* for netsrc_init() */
164 #include <net/ntstat.h> /* for nstat_init() */
165 #include <netinet/tcp_cc.h> /* for tcp_cc_init() */
166 #include <netinet/mptcp_var.h> /* for mptcp_control_register() */
167 #include <net/nwk_wq.h> /* for nwk_wq_init */
168 #include <net/restricted_in_port.h> /* for restricted_in_port_init() */
169 #include <kern/assert.h> /* for assert() */
170 #include <sys/kern_overrides.h> /* for init_system_override() */
171 #include <sys/lockf.h> /* for lf_init() */
173 #include <net/init.h>
176 #include <security/mac_framework.h>
177 #include <security/mac_internal.h> /* mac_init_bsd() */
178 #include <security/mac_mach_internal.h> /* mac_update_task_label() */
181 #include <machine/exec.h>
184 #include <sys/netboot.h>
188 #include <sys/imageboot.h>
192 #include <net/if_pflog.h>
196 #include <pexpert/pexpert.h>
197 #include <machine/pal_routines.h>
198 #include <console/video_console.h>
201 #include <tests/xnupost.h>
204 void * get_user_regs(thread_t
); /* XXX kludge for <machine/thread.h> */
205 void IOKitInitializeTime(void); /* XXX */
206 void IOSleep(unsigned int); /* XXX */
207 void loopattach(void); /* XXX */
/*
 * BSD copyright banner.  The adjacent string literals below are joined
 * by the compiler into one NUL-terminated string: a first line, a
 * tab-indented second line, and a trailing blank line.
 */
const char copyright[] =
	"Copyright (c) 1982, 1986, 1989, 1991, 1993\n"
	"\tThe Regents of the University of California. All rights reserved.\n"
	"\n";
214 /* Components of the first process -- never freed. */
216 struct session session0
;
218 struct filedesc filedesc0
;
219 struct plimit limit0
;
220 struct pstats pstats0
;
221 struct sigacts sigacts0
;
231 /* Global variables to make pstat happy. We do swapping differently */
235 struct swdevt swdevt
[1];
237 dev_t rootdev
; /* device of the root */
238 dev_t dumpdev
; /* device to take dumps on */
239 long dumplo
; /* offset into dumpdev */
241 char hostname
[MAXHOSTNAMELEN
];
242 lck_mtx_t hostname_lock
;
243 lck_grp_t
*hostname_lck_grp
;
244 char domainname
[MAXDOMNAMELEN
];
245 lck_mtx_t domainname_lock
;
247 char rootdevice
[DEVMAXNAMESIZE
];
250 struct kmemstats kmemstats
[M_LAST
];
253 struct vnode
*rootvp
;
261 int legacy_footprint_entitlement_mode
= LEGACY_FOOTPRINT_ENTITLEMENT_IGNORE
;
262 #endif /* __arm64__ */
265 __private_extern__
int proc_ref_tracking_disabled
= 0; /* disable panics on leaked proc refs across syscall boundary */
269 __private_extern__
int os_reason_debug_disabled
= 0; /* disable asserts for when we fail to allocate OS reasons */
272 extern kern_return_t
IOFindBSDRoot(char *, unsigned int, dev_t
*, u_int32_t
*);
273 extern void IOSecureBSDRoot(const char * rootName
);
274 extern kern_return_t
IOKitBSDInit(void );
275 extern void kminit(void);
276 extern void file_lock_init(void);
277 extern void kmeminit(void);
278 extern void bsd_bufferinit(void);
279 extern void oslog_setsize(int size
);
280 extern void throttle_init(void);
281 extern void acct_init(void);
283 #if CONFIG_LOCKERBOOT
284 #define LOCKER_PROTOBOOT_MOUNT "/protoboot"
286 const char kernel_protoboot_mount
[] = LOCKER_PROTOBOOT_MOUNT
;
287 extern int mount_locker_protoboot(const char *fsname
, const char *mntpoint
,
288 const char *pbdevpath
);
291 extern int serverperfmode
;
293 #if DEVELOPMENT || DEBUG
294 extern int syscallfilter_disable
;
295 #endif // DEVELOPMENT || DEBUG
297 vm_map_t bsd_pageable_map
;
300 static int bsd_simul_execs
;
301 static int bsd_pageable_map_size
;
302 __private_extern__
int execargs_cache_size
= 0;
303 __private_extern__
int execargs_free_count
= 0;
304 __private_extern__ vm_offset_t
* execargs_cache
= NULL
;
306 void bsd_exec_setup(int);
308 __private_extern__
int bootarg_execfailurereports
= 0;
311 __private_extern__
int bootarg_no32exec
= 1;
313 __private_extern__
int bootarg_vnode_cache_defeat
= 0;
315 #if CONFIG_JETSAM && (DEVELOPMENT || DEBUG)
316 __private_extern__
int bootarg_no_vnode_jetsam
= 0;
317 #endif /* CONFIG_JETSAM && (DEVELOPMENT || DEBUG) */
319 __private_extern__
int bootarg_no_vnode_drain
= 0;
322 * Prevent kernel-based ASLR from being used, for testing.
324 #if DEVELOPMENT || DEBUG
325 __private_extern__
int bootarg_disable_aslr
= 0;
329 * Allow an alternate dyld to be used for testing.
332 #if DEVELOPMENT || DEBUG
333 char dyld_alt_path
[MAXPATHLEN
];
334 int use_alt_dyld
= 0;
335 extern uint64_t dyld_flags
;
339 extern int customnbuf
;
341 kern_return_t
bsd_autoconf(void);
342 void bsd_utaskbootstrap(void);
344 static void parse_bsd_args(void);
346 extern void dev_kmem_init(void);
348 extern void time_zone_slock_init(void);
349 extern void select_waitq_init(void);
350 static void process_name(const char *, proc_t
);
352 static void setconf(void);
355 extern void sysv_shm_lock_init(void);
358 extern void sysv_sem_lock_init(void);
361 extern void sysv_msg_lock_init(void);
364 extern void ulock_initialize(void);
367 #if defined (__i386__) || defined (__x86_64__)
368 /* MACF policy_check configuration flags; see policy_check.c for details */
369 int policy_check_flags
= 0;
371 extern int check_policy_init(int);
373 #endif /* CONFIG_MACF */
375 /* If we are using CONFIG_DTRACE */
377 extern void dtrace_postinit(void);
381 * Initialization code.
382 * Called from cold start routine as
383 * soon as a stack and segmentation
384 * have been established.
387 * hand craft 0th process
388 * call all initialization routines
389 * hand craft 1st user process
393 * Sets the name for the given task.
396 process_name(const char *s
, proc_t p
)
398 strlcpy(p
->p_comm
, s
, sizeof(p
->p_comm
));
399 strlcpy(p
->p_name
, s
, sizeof(p
->p_name
));
402 /* To allow these values to be patched, they're globals here */
403 #include <machine/vmparam.h>
404 struct rlimit vm_initial_limit_stack
= { .rlim_cur
= DFLSSIZ
, .rlim_max
= MAXSSIZ
- PAGE_MAX_SIZE
};
405 struct rlimit vm_initial_limit_data
= { .rlim_cur
= DFLDSIZ
, .rlim_max
= MAXDSIZ
};
406 struct rlimit vm_initial_limit_core
= { .rlim_cur
= DFLCSIZ
, .rlim_max
= MAXCSIZ
};
408 extern thread_t
cloneproc(task_t
, coalition_t
, proc_t
, int, int);
409 extern int (*mountroot
)(void);
411 lck_grp_t
* proc_lck_grp
;
412 lck_grp_t
* proc_slock_grp
;
413 lck_grp_t
* proc_fdmlock_grp
;
414 lck_grp_t
* proc_kqhashlock_grp
;
415 lck_grp_t
* proc_knhashlock_grp
;
416 lck_grp_t
* proc_ucred_mlock_grp
;
417 lck_grp_t
* proc_mlock_grp
;
418 lck_grp_attr_t
* proc_lck_grp_attr
;
419 lck_attr_t
* proc_lck_attr
;
420 lck_mtx_t
* proc_list_mlock
;
421 lck_mtx_t
* proc_klist_mlock
;
424 lck_grp_t
* sysctl_debug_test_stackshot_owner_grp
;
425 lck_mtx_t
* sysctl_debug_test_stackshot_owner_init_mtx
;
426 #endif /* !CONFIG_XNUPOST */
428 extern lck_mtx_t
* execargs_cache_lock
;
430 /* hook called after root is mounted XXX temporary hack */
431 void (*mountroot_post_hook
)(void);
432 void (*unmountroot_pre_hook
)(void);
435 * This function is called before IOKit initialization, so that globals
436 * like the sysctl tree are initialized before kernel extensions
437 * are started (since they may want to register sysctls).
446 * This function is called very early on in the Mach startup, from the
447 * function start_kernel_threads() in osfmk/kern/startup.c. It's called
448 * in the context of the current (startup) task using a call to the
449 * function kernel_thread_create() to jump into start_kernel_threads().
450 * Internally, kernel_thread_create() calls thread_create_internal(),
451 * which calls uthread_alloc(). The function of uthread_alloc() is
452 * normally to allocate a uthread structure, and fill out the uu_sigmask,
453 * uu_context fields. It skips filling these out in the case of the "task"
454 * being "kernel_task", because the order of operation is inverted. To
455 * account for that, we need to manually fill in at least the contents
456 * of the uu_context.vc_ucred field so that the uthread structure can be
457 * used like any other.
465 struct vfs_context context
;
467 struct ucred temp_cred
;
468 struct posix_cred temp_pcred
;
469 #if CONFIG_NETBOOT || CONFIG_IMAGEBOOT
470 boolean_t netboot
= FALSE
;
472 #if CONFIG_LOCKERBOOT
473 vnode_t pbvn
= NULLVP
;
474 mount_t pbmnt
= NULL
;
477 char pbfsname
[MFSNAMELEN
];
478 char *slash_dev
= NULL
;
481 #define DEBUG_BSDINIT 0
484 #define bsd_init_kprintf(x, ...) kprintf("bsd_init: " x, ## __VA_ARGS__)
486 #define bsd_init_kprintf(x, ...)
493 bsd_init_kprintf("calling kmeminit\n");
496 bsd_init_kprintf("calling parse_bsd_args\n");
500 bsd_init_kprintf("calling dev_kmem_init\n");
504 /* Initialize kauth subsystem before instancing the first credential */
505 bsd_init_kprintf("calling kauth_init\n");
508 /* Initialize process and pgrp structures. */
509 bsd_init_kprintf("calling procinit\n");
512 /* Initialize the ttys (MUST be before kminit()/bsd_autoconf()!)*/
515 kernproc
= &proc0
; /* implicitly bzero'ed */
517 /* kernel_task->proc = kernproc; */
518 set_bsdtask_info(kernel_task
, (void *)kernproc
);
520 /* give kernproc a name */
521 bsd_init_kprintf("calling process_name\n");
522 process_name("kernel_task", kernproc
);
524 /* allocate proc lock group attribute and group */
525 bsd_init_kprintf("calling lck_grp_attr_alloc_init\n");
526 proc_lck_grp_attr
= lck_grp_attr_alloc_init();
528 proc_lck_grp
= lck_grp_alloc_init("proc", proc_lck_grp_attr
);
530 proc_slock_grp
= lck_grp_alloc_init("proc-slock", proc_lck_grp_attr
);
531 proc_ucred_mlock_grp
= lck_grp_alloc_init("proc-ucred-mlock", proc_lck_grp_attr
);
532 proc_mlock_grp
= lck_grp_alloc_init("proc-mlock", proc_lck_grp_attr
);
533 proc_fdmlock_grp
= lck_grp_alloc_init("proc-fdmlock", proc_lck_grp_attr
);
534 proc_kqhashlock_grp
= lck_grp_alloc_init("proc-kqhashlock", proc_lck_grp_attr
);
535 proc_knhashlock_grp
= lck_grp_alloc_init("proc-knhashlock", proc_lck_grp_attr
);
537 sysctl_debug_test_stackshot_owner_grp
= lck_grp_alloc_init("test-stackshot-owner-grp", LCK_GRP_ATTR_NULL
);
538 sysctl_debug_test_stackshot_owner_init_mtx
= lck_mtx_alloc_init(
539 sysctl_debug_test_stackshot_owner_grp
,
541 #endif /* !CONFIG_XNUPOST */
542 /* Allocate proc lock attribute */
543 proc_lck_attr
= lck_attr_alloc_init();
545 proc_list_mlock
= lck_mtx_alloc_init(proc_mlock_grp
, proc_lck_attr
);
546 proc_klist_mlock
= lck_mtx_alloc_init(proc_mlock_grp
, proc_lck_attr
);
547 lck_mtx_init(&kernproc
->p_mlock
, proc_mlock_grp
, proc_lck_attr
);
548 lck_mtx_init(&kernproc
->p_fdmlock
, proc_fdmlock_grp
, proc_lck_attr
);
549 lck_mtx_init(&kernproc
->p_ucred_mlock
, proc_ucred_mlock_grp
, proc_lck_attr
);
550 lck_spin_init(&kernproc
->p_slock
, proc_slock_grp
, proc_lck_attr
);
552 assert(bsd_simul_execs
!= 0);
553 execargs_cache_lock
= lck_mtx_alloc_init(proc_lck_grp
, proc_lck_attr
);
554 execargs_cache_size
= bsd_simul_execs
;
555 execargs_free_count
= bsd_simul_execs
;
556 execargs_cache
= (vm_offset_t
*)kalloc(bsd_simul_execs
* sizeof(vm_offset_t
));
557 bzero(execargs_cache
, bsd_simul_execs
* sizeof(vm_offset_t
));
559 if (current_task() != kernel_task
) {
560 printf("bsd_init: We have a problem, "
561 "current task is not kernel task\n");
564 bsd_init_kprintf("calling get_bsdthread_info\n");
565 ut
= (uthread_t
)get_bsdthread_info(current_thread());
569 * Initialize the MAC Framework
571 mac_policy_initbsd();
573 #if defined (__i386__) || defined (__x86_64__)
575 * We currently only support this on i386/x86_64, as that is the
576 * only lock code we have instrumented so far.
578 check_policy_init(policy_check_flags
);
584 hostname_lck_grp
= lck_grp_alloc_init("hostname", LCK_GRP_ATTR_NULL
);
585 lck_mtx_init(&hostname_lock
, hostname_lck_grp
, LCK_ATTR_NULL
);
586 lck_mtx_init(&domainname_lock
, hostname_lck_grp
, LCK_ATTR_NULL
);
592 LIST_INSERT_HEAD(&allproc
, kernproc
, p_list
);
593 kernproc
->p_pgrp
= &pgrp0
;
594 LIST_INSERT_HEAD(PGRPHASH(0), &pgrp0
, pg_hash
);
595 LIST_INIT(&pgrp0
.pg_members
);
596 lck_mtx_init(&pgrp0
.pg_mlock
, proc_mlock_grp
, proc_lck_attr
);
597 /* There is no other bsd thread at this point, so this is safe without the pgrp lock */
598 LIST_INSERT_HEAD(&pgrp0
.pg_members
, kernproc
, p_pglist
);
599 kernproc
->p_listflag
|= P_LIST_INPGRP
;
600 kernproc
->p_pgrpid
= 0;
601 kernproc
->p_uniqueid
= 0;
603 pgrp0
.pg_session
= &session0
;
604 pgrp0
.pg_membercnt
= 1;
606 session0
.s_count
= 1;
607 session0
.s_leader
= kernproc
;
608 session0
.s_listflags
= 0;
609 lck_mtx_init(&session0
.s_mlock
, proc_mlock_grp
, proc_lck_attr
);
610 LIST_INSERT_HEAD(SESSHASH(0), &session0
, s_hash
);
614 kernproc
->p_persona
= NULL
;
617 kernproc
->task
= kernel_task
;
619 kernproc
->p_stat
= SRUN
;
620 kernproc
->p_flag
= P_SYSTEM
;
621 kernproc
->p_lflag
= 0;
622 kernproc
->p_ladvflag
= 0;
624 #if defined(__LP64__)
625 kernproc
->p_flag
|= P_LP64
;
628 #if DEVELOPMENT || DEBUG
629 if (bootarg_disable_aslr
) {
630 kernproc
->p_flag
|= P_DISABLE_ASLR
;
634 kernproc
->p_nice
= NZERO
;
635 kernproc
->p_pptr
= kernproc
;
637 TAILQ_INIT(&kernproc
->p_uthlist
);
638 TAILQ_INSERT_TAIL(&kernproc
->p_uthlist
, ut
, uu_list
);
640 kernproc
->sigwait
= FALSE
;
641 kernproc
->sigwait_thread
= THREAD_NULL
;
642 kernproc
->exit_thread
= THREAD_NULL
;
643 kernproc
->p_csflags
= CS_VALID
;
646 * Create credential. This also Initializes the audit information.
648 bsd_init_kprintf("calling bzero\n");
649 bzero(&temp_cred
, sizeof(temp_cred
));
650 bzero(&temp_pcred
, sizeof(temp_pcred
));
651 temp_pcred
.cr_ngroups
= 1;
652 /* kernproc shouldn't call up to DS for group membership */
653 temp_pcred
.cr_flags
= CRF_NOMEMBERD
;
654 temp_cred
.cr_audit
.as_aia_p
= audit_default_aia_p
;
656 bsd_init_kprintf("calling kauth_cred_create\n");
658 * We have to label the temp cred before we create from it to
659 * properly set cr_ngroups, or the create will fail.
661 posix_cred_label(&temp_cred
, &temp_pcred
);
662 kernproc
->p_ucred
= kauth_cred_create(&temp_cred
);
664 /* update cred on proc */
665 PROC_UPDATE_CREDS_ONPROC(kernproc
);
667 /* give the (already existing) initial thread a reference on it */
668 bsd_init_kprintf("calling kauth_cred_ref\n");
669 kauth_cred_ref(kernproc
->p_ucred
);
670 ut
->uu_context
.vc_ucred
= kernproc
->p_ucred
;
671 ut
->uu_context
.vc_thread
= current_thread();
673 TAILQ_INIT(&kernproc
->p_aio_activeq
);
674 TAILQ_INIT(&kernproc
->p_aio_doneq
);
675 kernproc
->p_aio_total_count
= 0;
676 kernproc
->p_aio_active_count
= 0;
678 bsd_init_kprintf("calling file_lock_init\n");
682 mac_cred_label_associate_kernel(kernproc
->p_ucred
);
685 /* Create the file descriptor table. */
686 kernproc
->p_fd
= &filedesc0
;
687 filedesc0
.fd_cmask
= cmask
;
688 filedesc0
.fd_knlistsize
= 0;
689 filedesc0
.fd_knlist
= NULL
;
690 filedesc0
.fd_knhash
= NULL
;
691 filedesc0
.fd_knhashmask
= 0;
692 lck_mtx_init(&filedesc0
.fd_kqhashlock
, proc_kqhashlock_grp
, proc_lck_attr
);
693 lck_mtx_init(&filedesc0
.fd_knhashlock
, proc_knhashlock_grp
, proc_lck_attr
);
695 /* Create the limits structures. */
696 kernproc
->p_limit
= &limit0
;
697 for (i
= 0; i
< sizeof(kernproc
->p_rlimit
) / sizeof(kernproc
->p_rlimit
[0]); i
++) {
698 limit0
.pl_rlimit
[i
].rlim_cur
=
699 limit0
.pl_rlimit
[i
].rlim_max
= RLIM_INFINITY
;
701 limit0
.pl_rlimit
[RLIMIT_NOFILE
].rlim_cur
= NOFILE
;
702 limit0
.pl_rlimit
[RLIMIT_NPROC
].rlim_cur
= maxprocperuid
;
703 limit0
.pl_rlimit
[RLIMIT_NPROC
].rlim_max
= maxproc
;
704 limit0
.pl_rlimit
[RLIMIT_STACK
] = vm_initial_limit_stack
;
705 limit0
.pl_rlimit
[RLIMIT_DATA
] = vm_initial_limit_data
;
706 limit0
.pl_rlimit
[RLIMIT_CORE
] = vm_initial_limit_core
;
707 limit0
.pl_refcnt
= 1;
709 kernproc
->p_stats
= &pstats0
;
710 kernproc
->p_sigacts
= &sigacts0
;
713 * Charge root for one process: launchd.
715 bsd_init_kprintf("calling chgproccnt\n");
716 (void)chgproccnt(0, 1);
719 * Allocate a kernel submap for pageable memory
720 * for temporary copying (execve()).
725 bsd_init_kprintf("calling kmem_suballoc\n");
726 assert(bsd_pageable_map_size
!= 0);
727 ret
= kmem_suballoc(kernel_map
,
729 (vm_size_t
)bsd_pageable_map_size
,
732 VM_MAP_KERNEL_FLAGS_NONE
,
735 if (ret
!= KERN_SUCCESS
) {
736 panic("bsd_init: Failed to allocate bsd pageable map");
740 bsd_init_kprintf("calling fpxlog_init\n");
744 * Initialize buffers and hash links for buffers
746 * SIDE EFFECT: Starts a thread for bcleanbuf_thread(), so must
747 * happen after a credential has been associated with
750 bsd_init_kprintf("calling bsd_bufferinit\n");
754 * Initialize the calendar.
756 bsd_init_kprintf("calling IOKitInitializeTime\n");
757 IOKitInitializeTime();
759 bsd_init_kprintf("calling ubc_init\n");
762 /* Initialize the file systems. */
763 bsd_init_kprintf("calling vfsinit\n");
766 /* Initialize file locks. */
767 bsd_init_kprintf("calling lf_init\n");
770 #if CONFIG_PROC_UUID_POLICY
771 /* Initialize the proc_uuid_policy subsystem */
772 bsd_init_kprintf("calling proc_uuid_policy_init()\n");
773 proc_uuid_policy_init();
777 /* Initialize per-CPU cache allocator */
780 /* Initialize mbuf's. */
781 bsd_init_kprintf("calling mbinit\n");
783 net_str_id_init(); /* for mbuf tags */
784 restricted_in_port_init();
788 * Initializes security event auditing.
789 * XXX: Should/could this occur later?
792 bsd_init_kprintf("calling audit_init\n");
796 /* Initialize kqueues */
797 bsd_init_kprintf("calling knote_init\n");
800 /* Initialize event handler */
801 bsd_init_kprintf("calling eventhandler_init\n");
804 /* Initialize for async IO */
805 bsd_init_kprintf("calling aio_init\n");
808 /* Initialize pipes */
809 bsd_init_kprintf("calling pipeinit\n");
812 /* Initialize SysV shm subsystem locks; the subsystem proper is
813 * initialized through a sysctl.
816 bsd_init_kprintf("calling sysv_shm_lock_init\n");
817 sysv_shm_lock_init();
820 bsd_init_kprintf("calling sysv_sem_lock_init\n");
821 sysv_sem_lock_init();
824 bsd_init_kprintf("sysv_msg_lock_init\n");
825 sysv_msg_lock_init();
827 bsd_init_kprintf("calling pshm_lock_init\n");
829 bsd_init_kprintf("calling psem_lock_init\n");
833 /* POSIX Shm and Sem */
834 bsd_init_kprintf("calling pshm_cache_init\n");
836 bsd_init_kprintf("calling psem_cache_init\n");
838 bsd_init_kprintf("calling time_zone_slock_init\n");
839 time_zone_slock_init();
840 bsd_init_kprintf("calling select_waitq_init\n");
844 * Initialize protocols. Block reception of incoming packets
845 * until everything is ready.
848 bsd_init_kprintf("calling nwk_wq_init\n");
850 bsd_init_kprintf("calling dlil_init\n");
852 bsd_init_kprintf("calling proto_kpi_init\n");
854 #endif /* NETWORKING */
856 bsd_init_kprintf("calling socketinit\n");
858 bsd_init_kprintf("calling domaininit\n");
863 #endif /* FLOW_DIVERT */
865 kernproc
->p_fd
->fd_cdir
= NULL
;
866 kernproc
->p_fd
->fd_rdir
= NULL
;
869 #ifndef CONFIG_MEMORYSTATUS
870 #error "CONFIG_FREEZE defined without matching CONFIG_MEMORYSTATUS"
872 /* Initialise background freezing */
873 bsd_init_kprintf("calling memorystatus_freeze_init\n");
874 memorystatus_freeze_init();
877 #if CONFIG_MEMORYSTATUS
878 /* Initialize kernel memory status notifications */
879 bsd_init_kprintf("calling memorystatus_init\n");
881 #endif /* CONFIG_MEMORYSTATUS */
883 bsd_init_kprintf("calling acct_init\n");
886 bsd_init_kprintf("calling sysctl_mib_init\n");
889 bsd_init_kprintf("calling bsd_autoconf\n");
892 bsd_init_kprintf("calling os_reason_init\n");
900 * We attach the loopback interface *way* down here to ensure
901 * it happens after autoconf(), otherwise it becomes the
902 * "primary" interface.
906 bsd_init_kprintf("calling loopattach\n");
907 loopattach(); /* XXX */
910 /* Initialize gif interface (after lo0) */
915 /* Initialize packet filter log interface */
920 /* Register the built-in dlil ethernet interface family */
921 bsd_init_kprintf("calling ether_family_init\n");
926 /* Call any kext code that wants to run just after network init */
927 bsd_init_kprintf("calling net_init_run\n");
939 /* Initialize Network Extension Control Policies */
945 /* register user tunnel kernel control handler */
946 utun_register_control();
948 ipsec_register_control();
954 mptcp_control_register();
956 #endif /* NETWORKING */
958 bsd_init_kprintf("calling vnode_pager_bootstrap\n");
959 vnode_pager_bootstrap();
961 bsd_init_kprintf("calling inittodr\n");
964 /* Mount the root file system. */
968 bsd_init_kprintf("calling setconf\n");
971 netboot
= (mountroot
== netboot_mountroot
);
974 bsd_init_kprintf("vfs_mountroot\n");
975 if (0 == (err
= vfs_mountroot())) {
978 rootdevice
[0] = '\0';
981 PE_display_icon( 0, "noroot"); /* XXX a netboot-specific icon would be nicer */
982 vc_progress_set(FALSE
, 0);
983 for (i
= 1; 1; i
*= 2) {
984 printf("bsd_init: failed to mount network root, error %d, %s\n",
985 err
, PE_boot_args());
986 printf("We are hanging here...\n");
987 IOSleep(i
* 60 * 1000);
992 printf("cannot mount root, errno = %d\n", err
);
993 boothowto
|= RB_ASKNAME
;
996 IOSecureBSDRoot(rootdevice
);
998 context
.vc_thread
= current_thread();
999 context
.vc_ucred
= kernproc
->p_ucred
;
1000 mountlist
.tqh_first
->mnt_flag
|= MNT_ROOTFS
;
1002 bsd_init_kprintf("calling VFS_ROOT\n");
1003 /* Get the vnode for '/'. Set filedesc0.fd_cdir to reference it. */
1004 if (VFS_ROOT(mountlist
.tqh_first
, &rootvnode
, &context
)) {
1005 panic("bsd_init: cannot find root vnode: %s", PE_boot_args());
1007 rootvnode
->v_flag
|= VROOT
;
1008 (void)vnode_ref(rootvnode
);
1009 (void)vnode_put(rootvnode
);
1010 filedesc0
.fd_cdir
= rootvnode
;
1017 /* post mount setup */
1018 if ((err
= netboot_setup()) != 0) {
1019 PE_display_icon( 0, "noroot"); /* XXX a netboot-specific icon would be nicer */
1020 vc_progress_set(FALSE
, 0);
1021 for (i
= 1; 1; i
*= 2) {
1022 printf("bsd_init: NetBoot could not find root, error %d: %s\n",
1023 err
, PE_boot_args());
1024 printf("We are hanging here...\n");
1025 IOSleep(i
* 60 * 1000);
1033 #if CONFIG_IMAGEBOOT
1034 #if CONFIG_LOCKERBOOT
1036 * Stash the protoboot vnode, mount, filesystem name, and device name for
1037 * later use. Note that the mount-from name may not have the "/dev/"
1038 * component, so we must sniff out this condition and add it as needed.
1041 pbmnt
= pbvn
->v_mount
;
1042 pbdevp
= vfs_statfs(pbmnt
)->f_mntfromname
;
1043 slash_dev
= strnstr(pbdevp
, "/dev/", strlen(pbdevp
));
1046 * If the old root is a snapshot mount, it will have the form:
1048 * com.apple.os.update-<boot manifest hash>@<dev node path>
1050 * So we just search the mntfromname for any occurrence of "/dev/" and
1051 * grab that as the device path. The image boot code needs a dev node to
1052 * do the re-mount, so we cannot directly mount the snapshot as the
1053 * protoboot volume currently.
1055 strlcpy(pbdevpath
, slash_dev
, sizeof(pbdevpath
));
1057 snprintf(pbdevpath
, sizeof(pbdevpath
), "/dev/%s", pbdevp
);
1060 bsd_init_kprintf("protoboot mount-from: %s\n", pbdevp
);
1061 bsd_init_kprintf("protoboot dev path: %s\n", pbdevpath
);
1063 strlcpy(pbfsname
, pbmnt
->mnt_vtable
->vfc_name
, sizeof(pbfsname
));
1066 * See if a system disk image is present. If so, mount it and
1067 * switch the root vnode to point to it
1069 imageboot_type_t imageboot_type
= imageboot_needed();
1070 if (netboot
== FALSE
&& imageboot_type
) {
1072 * An image was found. No turning back: we're booted
1073 * with a kernel from the disk image.
1075 bsd_init_kprintf("doing image boot: type = %d\n", imageboot_type
);
1076 imageboot_setup(imageboot_type
);
1079 #if CONFIG_LOCKERBOOT
1080 if (imageboot_type
== IMAGEBOOT_LOCKER
) {
1081 bsd_init_kprintf("booting from locker\n");
1082 if (vnode_tag(rootvnode
) != VT_LOCKERFS
) {
1083 panic("root filesystem not a locker: fsname = %s",
1084 rootvnode
->v_mount
->mnt_vtable
->vfc_name
);
1087 #endif /* CONFIG_LOCKERBOOT */
1088 #endif /* CONFIG_IMAGEBOOT */
1090 /* set initial time; all other resource data is already zero'ed */
1091 microtime_with_abstime(&kernproc
->p_start
, &kernproc
->p_stats
->ps_start
);
1095 char mounthere
[] = "/dev"; /* !const because of internal casting */
1097 bsd_init_kprintf("calling devfs_kernel_mount\n");
1098 devfs_kernel_mount(mounthere
);
1102 if (vfs_mount_rosv_data()) {
1103 panic("failed to mount data volume!");
1106 if (vfs_mount_vm()) {
1107 printf("failed to mount vm volume!");
1110 #if CONFIG_LOCKERBOOT
1112 * We need to wait until devfs is up before remounting the protoboot volume
1113 * within the locker so that it can have a real devfs vnode backing it.
1115 if (imageboot_type
== IMAGEBOOT_LOCKER
) {
1116 bsd_init_kprintf("re-mounting protoboot volume\n");
1117 int error
= mount_locker_protoboot(pbfsname
, LOCKER_PROTOBOOT_MOUNT
,
1120 panic("failed to mount protoboot volume: dev path = %s, error = %d",
1124 #endif /* CONFIG_LOCKERBOOT */
1126 /* Initialize signal state for process 0. */
1127 bsd_init_kprintf("calling siginit\n");
1130 bsd_init_kprintf("calling bsd_utaskbootstrap\n");
1131 bsd_utaskbootstrap();
1133 pal_kernel_announce();
1135 bsd_init_kprintf("calling mountroot_post_hook\n");
1137 /* invoke post-root-mount hook */
1138 if (mountroot_post_hook
!= NULL
) {
1139 mountroot_post_hook();
1143 consider_zone_gc(FALSE
);
1146 /* Initialize System Override call */
1147 init_system_override();
1149 bsd_init_kprintf("done\n");
/*
 * Body of the routine that prepares the current process to become "init"
 * and then hands it to load_init_program().
 * NOTE(review): the function header and several intermediate lines are not
 * present in this extract; only the visible calls are described below.
 */
1155 proc_t p
= current_proc();
/* Label the current process "init" before anything else is done to it. */
1157 process_name("init", p
);
1159 /* Set up exception-to-signal reflection */
/* Hand the process credential to the MAC layer for user-label association. */
1163 mac_cred_label_associate_user(p
->p_ucred
);
1166 vm_init_before_launchd();
/*
 * NOTE(review): the value returned by bsd_list_tests() is overwritten by
 * bsd_do_post() on the next statement without being read in the visible
 * code -- confirm that discarding it is intentional.
 */
1169 int result
= bsd_list_tests();
1170 result
= bsd_do_post();
/* The condition guarding this panic is not visible in this extract. */
1172 panic("bsd_do_post: Tests failed with result = 0x%08x\n", result
);
1176 bsd_init_kprintf("bsd_do_post - done");
/* Final visible step: start the init program for process p. */
1178 load_init_program(p
);
/*
 * bsd_autoconf (name taken from the log message below): runs the early
 * pseudo-device initializers and then returns the result of IOKitBSDInit().
 * NOTE(review): the function header and the call announced by the kprintf
 * below are not present in this extract.
 */
1185 kprintf("bsd_autoconf: calling kminit\n");
1189 * Early startup for bsd pseudodevices.
1192 struct pseudo_init
*pi
;
/*
 * Walk pseudo_inits until an entry with a NULL ps_func is reached, calling
 * each entry's ps_func with that entry's ps_count as the only argument.
 */
1194 for (pi
= pseudo_inits
; pi
->ps_func
; pi
++) {
1195 (*pi
->ps_func
)(pi
->ps_count
);
/* The caller receives whatever IOKitBSDInit() returns. */
1199 return IOKitBSDInit();
1203 #include <sys/disklabel.h> /* for MAXPARTITIONS */
/*
 * setconf (name taken from the log message below): asks IOFindBSDRoot() for
 * the root device name, its dev_t and a flags word.
 * NOTE(review): the function header, local declarations and the conditions
 * that select each branch are not present in this extract.
 */
1211 err
= IOFindBSDRoot(rootdevice
, sizeof(rootdevice
), &rootdev
, &flags
);
/*
 * Fallback path (presumably taken when err is non-zero -- the guarding test
 * is not visible): log the error, then force the root device to 'sd0a' with
 * dev_t makedev(6, 0).
 * NOTE(review): the two adjacent string literals are concatenated with no
 * separator, so the message prints as "...(%d);setting rootdevice...".
 */
1213 printf("setconf: IOFindBSDRoot returned an error (%d);"
1214 "setting rootdevice to 'sd0a'.\n", err
); /* XXX DEBUG TEMP */
1215 rootdev
= makedev( 6, 0 );
/* strlcpy bounds the copy by the size of the destination array. */
1216 strlcpy(rootdevice
, "sd0a", sizeof(rootdevice
));
1222 /* network device */
/* For a network root, the mountroot hook is pointed at netboot_mountroot. */
1223 mountroot
= netboot_mountroot
;
1226 /* otherwise have vfs determine root filesystem */
/*
 * bsd_utaskbootstrap
 *
 * Clones a new process from kernproc, records process 1 in initproc, drops
 * the signal/transition state held on it, and then marks the new thread
 * with act_set_astbsd() and clears its task's return-wait state.
 * Takes no arguments.
 * NOTE(review): local declarations and some statements are not present in
 * this extract; only the visible calls are described.
 */
1234 bsd_utaskbootstrap(void)
1240 * Clone the bootstrap process from the kernel process, without
1241 * inheriting either task characteristics or memory from the kernel;
1243 thread
= cloneproc(TASK_NULL
, COALITION_NULL
, kernproc
, FALSE
, TRUE
);
1245 /* Hold the reference as it will be dropped during shutdown */
1246 initproc
= proc_find(1);
/* Debug-only sanity check: panic if the lookup of pid 1 produced PROC_NULL. */
1247 #if __PROC_INTERNAL_DEBUG
1248 if (initproc
== PROC_NULL
) {
1249 panic("bsd_utaskbootstrap: initproc not set\n");
1253 * Since we aren't going back out the normal way to our parent,
1254 * we have to drop the transition locks explicitly.
1256 proc_signalend(initproc
, 0);
1257 proc_transend(initproc
, 0);
/* Fetch the BSD per-thread structure of the cloned thread. */
1259 ut
= (struct uthread
*)get_bsdthread_info(thread
);
/*
 * Flag the thread via act_set_astbsd(), then clear all return-wait bits
 * (TCRW_CLEAR_ALL_WAIT) on the task that owns it.
 */
1261 act_set_astbsd(thread
);
1262 task_clear_return_wait(get_threadtask(thread
), TCRW_CLEAR_ALL_WAIT
);
/*
 * parse_bsd_args
 *
 * Looks up BSD-related boot arguments with PE_parse_boot_argn() and stores
 * the results in the corresponding globals (boothowto bits, bootarg_*
 * switches, sizing values and debug toggles). Takes no arguments.
 *
 * For the dash-prefixed flag arguments, namep is passed as the value buffer
 * and is not otherwise read in the visible code; only the lookup result
 * decides whether the flag is set.
 *
 * NOTE(review): this extract omits local declarations, several statement
 * bodies and some #if/#endif lines, so only the visible lookups are
 * described.
 */
1266 parse_bsd_args(void)
/* "-s" sets RB_SINGLE in boothowto. */
1271 if (PE_parse_boot_argn("-s", namep
, sizeof(namep
))) {
1272 boothowto
|= RB_SINGLE
;
/* "-x" sets RB_SAFEBOOT in boothowto. */
1275 if (PE_parse_boot_argn("-x", namep
, sizeof(namep
))) { /* safe boot */
1276 boothowto
|= RB_SAFEBOOT
;
1279 if (PE_parse_boot_argn("-minimalboot", namep
, sizeof(namep
))) {
1281 * -minimalboot indicates that we want userspace to be bootstrapped to a
1282 * minimal environment. What constitutes minimal is up to the bootstrap
1291 /* disable 32 bit grading */
/* The parsed value is normalized to 0/1 with !! before it is stored. */
1292 if (PE_parse_boot_argn("no32exec", &no32exec
, sizeof(no32exec
))) {
1293 bootarg_no32exec
= !!no32exec
;
1297 int execfailure_crashreports
;
1298 /* enable crash reports on various exec failures */
1299 if (PE_parse_boot_argn("execfailurecrashes", &execfailure_crashreports
, sizeof(execfailure_crashreports
))) {
1300 bootarg_execfailurereports
= !!execfailure_crashreports
;
1303 /* disable vnode_cache_is_authorized() by setting vnode_cache_defeat */
1304 if (PE_parse_boot_argn("-vnode_cache_defeat", namep
, sizeof(namep
))) {
1305 bootarg_vnode_cache_defeat
= 1;
/* ASLR can only be switched off from the boot line on DEVELOPMENT or DEBUG builds. */
1308 #if DEVELOPMENT || DEBUG
1309 if (PE_parse_boot_argn("-disable_aslr", namep
, sizeof(namep
))) {
1310 bootarg_disable_aslr
= 1;
/* "ncl" is read straight into ncl; the lookup result is ignored. */
1314 PE_parse_boot_argn("ncl", &ncl
, sizeof(ncl
));
/* "nbuf" is read into max_nbuf_headers; the body run on success is not visible here. */
1315 if (PE_parse_boot_argn("nbuf", &max_nbuf_headers
,
1316 sizeof(max_nbuf_headers
))) {
1321 #if defined (__i386__) || defined (__x86_64__)
1322 PE_parse_boot_argn("policy_check", &policy_check_flags
, sizeof(policy_check_flags
));
1324 #endif /* CONFIG_MACF */
/* "msgbuf": the same value is handed to both log_setsize() and oslog_setsize(). */
1326 if (PE_parse_boot_argn("msgbuf", &msgbuf
, sizeof(msgbuf
))) {
1327 log_setsize(msgbuf
);
1328 oslog_setsize(msgbuf
);
/* The action taken for "-novfscache" is not visible in this extract. */
1331 if (PE_parse_boot_argn("-novfscache", namep
, sizeof(namep
))) {
1335 #if CONFIG_JETSAM && (DEVELOPMENT || DEBUG)
1336 if (PE_parse_boot_argn("-no_vnode_jetsam", namep
, sizeof(namep
))) {
1337 bootarg_no_vnode_jetsam
= 1;
1339 #endif /* CONFIG_JETSAM && (DEVELOPMENT || DEBUG) */
1341 if (PE_parse_boot_argn("-no_vnode_drain", namep
, sizeof(namep
))) {
1342 bootarg_no_vnode_drain
= 1;
1347 * The darkboot flag is specified by the bootloader and is stored in
1348 * boot_args->bootFlags. This flag is available starting revision 2.
1350 boot_args
*args
= (boot_args
*) PE_state
.bootArgs
;
/*
 * bootFlags is only consulted when the boot_args pointer is non-NULL and
 * its Revision is at least kBootArgsRevision2; darkboot becomes 1 or 0
 * depending on the kBootFlagsDarkBoot bit.
 */
1351 if ((args
!= NULL
) && (args
->Revision
>= kBootArgsRevision2
)) {
1352 darkboot
= (args
->bootFlags
& kBootFlagsDarkBoot
) ? 1 : 0;
1359 if (PE_parse_boot_argn("-disable_procref_tracking", namep
, sizeof(namep
))) {
1360 proc_ref_tracking_disabled
= 1;
1365 if (PE_parse_boot_argn("-disable_osreason_debug", namep
, sizeof(namep
))) {
1366 os_reason_debug_disabled
= 1;
/* "sigrestrict" is read straight into sigrestrict_arg; the lookup result is ignored. */
1370 PE_parse_boot_argn("sigrestrict", &sigrestrict_arg
, sizeof(sigrestrict_arg
));
1372 #if DEVELOPMENT || DEBUG
1373 if (PE_parse_boot_argn("-no_sigsys", namep
, sizeof(namep
))) {
1374 send_sigsys
= false;
/*
 * "alt-dyld" is copied into dyld_alt_path; the visible code then tests for
 * a non-empty string. What is done with a non-empty path is not visible in
 * this extract.
 */
1377 if (PE_parse_boot_argn("alt-dyld", dyld_alt_path
, sizeof(dyld_alt_path
))) {
1378 if (strlen(dyld_alt_path
) > 0) {
1382 PE_parse_boot_argn("dyld_flags", &dyld_flags
, sizeof(dyld_flags
));
/*
 * NOTE(review): this lookup passes &namep, whereas every other flag lookup
 * in this function passes namep. Both expressions designate the same
 * storage if namep is an array (its declaration is not visible here), but
 * the spelling is inconsistent -- confirm and consider aligning it.
 */
1384 if (PE_parse_boot_argn("-disable_syscallfilter", &namep
, sizeof(namep
))) {
1385 syscallfilter_disable
= 1;
1389 if (PE_parse_boot_argn("legacy_footprint_entitlement_mode", &legacy_footprint_entitlement_mode
, sizeof(legacy_footprint_entitlement_mode
))) {
1391 * legacy_footprint_entitlement_mode specifies the behavior we want associated
1392 * with the entitlement. The supported modes are:
1394 * LEGACY_FOOTPRINT_ENTITLEMENT_IGNORE:
1395 * Indicates that we want every process to have the memory accounting
1396 * that is available in iOS 12.0 and beyond.
1398 * LEGACY_FOOTPRINT_ENTITLEMENT_IOS11_ACCT:
1399 * Indicates that for every process that has the 'legacy footprint entitlement',
1400 * we want to give it the old iOS 11.0 accounting behavior which accounted some
1401 * of the process's memory to the kernel.
1403 * LEGACY_FOOTPRINT_ENTITLEMENT_LIMIT_INCREASE:
1404 * Indicates that for every process that has the 'legacy footprint entitlement',
1405 * we want it to have a higher memory limit which will help them acclimate to the
1406 * iOS 12.0 (& beyond) accounting behavior that does the right accounting.
1407 * The bonus added to the system-wide task limit to calculate this higher memory limit
1408 * is available in legacy_footprint_bonus_mb.
/*
 * Range check: a mode below LEGACY_FOOTPRINT_ENTITLEMENT_IGNORE or above
 * LEGACY_FOOTPRINT_ENTITLEMENT_LIMIT_INCREASE is replaced with
 * LEGACY_FOOTPRINT_ENTITLEMENT_LIMIT_INCREASE.
 */
1411 if (legacy_footprint_entitlement_mode
< LEGACY_FOOTPRINT_ENTITLEMENT_IGNORE
||
1412 legacy_footprint_entitlement_mode
> LEGACY_FOOTPRINT_ENTITLEMENT_LIMIT_INCREASE
) {
1413 legacy_footprint_entitlement_mode
= LEGACY_FOOTPRINT_ENTITLEMENT_LIMIT_INCREASE
;
1416 #endif /* __arm64__ */
1417 #endif /* DEVELOPMENT || DEBUG */
/*
 * bsd_exec_setup
 *
 * Chooses a value for bsd_simul_execs and derives bsd_pageable_map_size
 * from it.
 *
 * scale: selector for the bsd_simul_execs value. The visible assignments
 *        are BSD_SIMUL_EXECS, 65, 129, 257 and 513.
 *
 * NOTE(review): the control flow that maps scale onto each assignment is
 * not present in this extract; confirm the mapping against the full source.
 */
1421 bsd_exec_setup(int scale
)
1426 bsd_simul_execs
= BSD_SIMUL_EXECS
;
1430 bsd_simul_execs
= 65;
1434 bsd_simul_execs
= 129;
1438 bsd_simul_execs
= 257;
1441 bsd_simul_execs
= 513;
/* Map size is the chosen exec count times BSD_PAGEABLE_SIZE_PER_EXEC. */
1444 bsd_pageable_map_size
= (bsd_simul_execs
* BSD_PAGEABLE_SIZE_PER_EXEC
);