2  * Copyright (c) 2000-2004 Apple Computer, Inc. All rights reserved. 
   4  * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ 
   6  * This file contains Original Code and/or Modifications of Original Code 
   7  * as defined in and that are subject to the Apple Public Source License 
   8  * Version 2.0 (the 'License'). You may not use this file except in 
   9  * compliance with the License. The rights granted to you under the License 
  10  * may not be used to create, or enable the creation or redistribution of, 
  11  * unlawful or unlicensed copies of an Apple operating system, or to 
  12  * circumvent, violate, or enable the circumvention or violation of, any 
  13  * terms of an Apple operating system software license agreement. 
  15  * Please obtain a copy of the License at 
  16  * http://www.opensource.apple.com/apsl/ and read it before using this file. 
  18  * The Original Code and all software distributed under the License are 
  19  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER 
  20  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, 
  21  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, 
  22  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. 
  23  * Please see the License for the specific language governing rights and 
  24  * limitations under the License. 
  26  * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ 
  28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */ 
  30  * Mach Operating System 
  31  * Copyright (c) 1987 Carnegie-Mellon University 
  32  * All rights reserved.  The CMU software License Agreement specifies 
  33  * the terms and conditions for use and redistribution. 
  39  * Copyright (c) 1982, 1986, 1991, 1993 
  40  *      The Regents of the University of California.  All rights reserved. 
  41  * (c) UNIX System Laboratories, Inc. 
  42  * All or some portions of this file are derived from material licensed 
  43  * to the University of California by American Telephone and Telegraph 
  44  * Co. or Unix System Laboratories, Inc. and are reproduced herein with 
  45  * the permission of UNIX System Laboratories, Inc. 
  47  * Redistribution and use in source and binary forms, with or without 
  48  * modification, are permitted provided that the following conditions 
  50  * 1. Redistributions of source code must retain the above copyright 
  51  *    notice, this list of conditions and the following disclaimer. 
  52  * 2. Redistributions in binary form must reproduce the above copyright 
  53  *    notice, this list of conditions and the following disclaimer in the 
  54  *    documentation and/or other materials provided with the distribution. 
  55  * 3. All advertising materials mentioning features or use of this software 
  56  *    must display the following acknowledgement: 
  57  *      This product includes software developed by the University of 
  58  *      California, Berkeley and its contributors. 
  59  * 4. Neither the name of the University nor the names of its contributors 
  60  *    may be used to endorse or promote products derived from this software 
  61  *    without specific prior written permission. 
  63  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 
  64  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 
  65  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 
  66  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 
  67  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 
  68  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 
  69  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 
  70  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 
  71  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 
  72  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 
  75  *      from: @(#)kern_exec.c   8.1 (Berkeley) 6/10/93 
  77 #include <machine/reg.h> 
  79 #include <sys/param.h> 
  80 #include <sys/systm.h> 
  81 #include <sys/filedesc.h> 
  82 #include <sys/kernel.h> 
  83 #include <sys/proc_internal.h> 
  84 #include <sys/kauth.h> 
  86 #include <sys/socketvar.h> 
  87 #include <sys/malloc.h> 
  88 #include <sys/namei.h> 
  89 #include <sys/mount_internal.h> 
  90 #include <sys/vnode_internal.h>          
  91 #include <sys/file_internal.h> 
  93 #include <sys/uio_internal.h> 
  96 #include <sys/kdebug.h> 
  97 #include <sys/signal.h> 
  98 #include <sys/aio_kern.h> 
  99 #include <sys/sysproto.h> 
 100 #include <sys/shm_internal.h>           /* shmexec() */ 
 101 #include <sys/ubc_internal.h>           /* ubc_map() */ 
 103 #include <bsm/audit_kernel.h> 
 105 #include <mach/mach_types.h> 
 106 #include <mach/task.h> 
 107 #include <mach/thread_act.h> 
 108 #include <mach/vm_map.h> 
 109 #include <mach/mach_vm.h> 
 110 #include <mach/vm_param.h> 
 112 #include <vm/vm_map.h> 
 113 #include <vm/vm_kern.h> 
 114 #include <vm/vm_pager.h> 
 115 #include <vm/vm_kern.h> 
 116 #include <vm/task_working_set.h> 
 117 #include <vm/vm_shared_memory_server.h> 
 120  * Mach things for which prototypes are unavailable from Mach headers 
 125 extern struct savearea 
*get_user_regs(thread_t
); 
 128 #include <kern/thread.h> 
 129 #include <kern/task.h> 
 130 #include <kern/ast.h> 
 131 #include <kern/mach_loader.h> 
 132 #include <mach-o/fat.h> 
 133 #include <mach-o/loader.h> 
 134 #include <machine/vmparam.h> 
 136 #include <sys/ktrace.h> 
 138 #include <sys/imgact.h> 
 142  * SIZE_MAXPTR          The maximum size of a user space pointer, in bytes 
 143  * SIZE_IMG_STRSPACE    The available string space, minus two pointers; we 
 144  *                      define it interms of the maximum, since we don't 
 145  *                      know the pointer size going in, until after we've 
 146  *                      parsed the executable image. 
 148 #define SIZE_MAXPTR             8                               /* 64 bits */ 
 149 #define SIZE_IMG_STRSPACE       (NCARGS - 2 * SIZE_MAXPTR) 
 153 extern vm_map_t bsd_pageable_map
; 
 154 extern struct fileops vnops
; 
 156 #define ROUND_PTR(type, addr)   \ 
 157         (type *)( ( (unsigned)(addr) + 16 - 1) \ 
 160 struct image_params
;    /* Forward */ 
 161 static int exec_copyout_strings(struct image_params 
*imgp
, user_addr_t 
*stackp
); 
 162 static int load_return_to_errno(load_return_t lrtn
); 
 163 static int execargs_alloc(struct image_params 
*imgp
); 
 164 static int execargs_free(struct image_params 
*imgp
); 
 165 static int exec_check_permissions(struct image_params 
*imgp
); 
 166 static int exec_extract_strings(struct image_params 
*imgp
); 
 167 static int exec_handle_sugid(struct image_params 
*imgp
); 
 168 static int sugid_scripts 
= 0; 
 169 SYSCTL_INT (_kern
, OID_AUTO
, sugid_scripts
, CTLFLAG_RW
, &sugid_scripts
, 0, ""); 
 170 static kern_return_t 
create_unix_stack(vm_map_t map
, user_addr_t user_stack
, 
 171                                         int customstack
, struct proc 
*p
); 
 172 static int copyoutptr(user_addr_t ua
, user_addr_t ptr
, int ptr_size
); 
 174 /* XXX forward; should be in headers, but can't be for one reason or another */ 
 175 extern int grade_binary(cpu_type_t exectype
, cpu_subtype_t execsubtype
); 
 176 extern void vfork_return(thread_t th_act
, 
 182 extern char classichandler
[32]; 
 183 extern uint32_t classichandler_fsid
; 
 184 extern long classichandler_fileid
; 
 190  * Add the requested string to the string space area. 
 192  * Parameters;  struct image_params *           image parameter block 
 193  *              user_addr_t                     string to add to strings area 
 194  *              uio_seg                         segment where string is located 
 197  *              !0                      Failure errno from copyinstr() 
 200  *              (imgp->ip_strendp)      updated location of next add, if any 
 201  *              (imgp->ip_strspace)     updated byte count of space remaining 
 204 exec_add_string(struct image_params 
*imgp
, user_addr_t str
, /*uio_seg*/int seg
) 
 210                 if (imgp
->ip_strspace 
<= 0) { 
 214                 if (IS_UIO_SYS_SPACE(seg
)) { 
 215                         char *kstr 
= CAST_DOWN(char *,str
);     /* SAFE */ 
 216                         error 
= copystr(kstr
, imgp
->ip_strendp
, imgp
->ip_strspace
, &len
); 
 218                         error 
= copyinstr(str
, imgp
->ip_strendp
, imgp
->ip_strspace
, 
 221                 imgp
->ip_strendp 
+= len
; 
 222                 imgp
->ip_strspace 
-= len
; 
 223         } while (error 
== ENAMETOOLONG
); 
 231  * To support new app package launching for Mac OS X, the dyld needs the 
 232  * first argument to execve() stored on the user stack. 
 234  * Save the executable path name at the top of the strings area and set 
 235  * the argument vector pointer to the location following that to indicate 
 236  * the start of the argument and environment tuples, setting the remaining 
 237  * string space count to the size of the string area minus the path length 
 238  * and a reserve for two pointers. 
 240  * Parameters;  struct image_params *           image parameter block 
 241  *              char *                          path used to invoke program 
 242  *              uio_seg                         segment where path is located 
 244  * Returns:     int                     0       Success 
 245  *                                      !0      Failure: error number 
 247  *              (imgp->ip_strings)              saved path 
 248  *              (imgp->ip_strspace)             space remaining in ip_strings 
 249  *              (imgp->ip_argv)                 beginning of argument list 
 250  *              (imgp->ip_strendp)              start of remaining copy area 
 252  * Note:        We have to do this before the initial namei() since in the 
 253  *              path contains symbolic links, namei() will overwrite the 
 254  *              original path buffer contents.  If the last symbolic link 
 255  *              resolved was a relative pathname, we would lose the original 
 256  *              "path", which could be an absolute pathname. This might be 
 257  *              unacceptable for dyld. 
 260 exec_save_path(struct image_params 
*imgp
, user_addr_t path
, /*uio_seg*/int seg
) 
 264         char *kpath 
= CAST_DOWN(char *,path
);   /* SAFE */ 
 266         imgp
->ip_strendp 
= imgp
->ip_strings
; 
 267         imgp
->ip_strspace 
= SIZE_IMG_STRSPACE
; 
 269         len 
= MIN(MAXPATHLEN
, imgp
->ip_strspace
); 
 272         case UIO_USERSPACE32
: 
 273         case UIO_USERSPACE64
:   /* Same for copyin()... */ 
 274                 error 
= copyinstr(path
, imgp
->ip_strings
, len
, &len
); 
 277                 error 
= copystr(kpath
, imgp
->ip_strings
, len
, &len
); 
 285                 imgp
->ip_strendp 
+= len
; 
 286                 imgp
->ip_strspace 
-= len
; 
 287                 imgp
->ip_argv 
= imgp
->ip_strendp
; 
 298  * Image activator for interpreter scripts.  If the image begins with the 
 299  * characters "#!", then it is an interpreter script.  Verify that we are 
 300  * not already executing in Classic mode, and that the length of the script 
 301  * line indicating the interpreter is not in excess of the maximum allowed 
 302  * size.  If this is the case, then break out the arguments, if any, which 
 303  * are separated by white space, and copy them into the argument save area 
 304  * as if they were provided on the command line before all other arguments. 
 305  * The line ends when we encounter a comment character ('#') or newline. 
 307  * Parameters;  struct image_params *   image parameter block 
 309  * Returns:     -1                      not an interpreter (keep looking) 
 310  *              -3                      Success: interpreter: relookup 
 311  *              >0                      Failure: interpreter: error number 
 313  * A return value other than -1 indicates subsequent image activators should 
 314  * not be given the opportunity to attempt to activate the image. 
 317 exec_shell_imgact(struct image_params 
*imgp
) 
 319         char *vdata 
= imgp
->ip_vdata
; 
 325          * Make sure it's a shell script.  If we've already redirected 
 326          * from an interpreted file once, don't do it again. 
 328          * Note: We disallow Classic, since the expectation is that we 
 329          * may run a Classic interpreter, but not an interpret a Classic 
 330          * image.  This is consistent with historical behaviour. 
 332         if (vdata
[0] != '#' || 
 334             (imgp
->ip_flags 
& IMGPF_INTERPRET
) != 0) { 
 339         imgp
->ip_flags 
|= IMGPF_INTERPRET
; 
 341         /* Check to see if SUGID scripts are permitted.  If they aren't then 
 342          * clear the SUGID bits. 
 343          * imgp->ip_vattr is known to be valid. 
 345         if (sugid_scripts 
== 0) { 
 346            imgp
->ip_origvattr
->va_mode 
&= ~(VSUID 
| VSGID
); 
 349         /* Find the nominal end of the interpreter line */ 
 350         for( ihp 
= &vdata
[2]; *ihp 
!= '\n' && *ihp 
!= '#'; ihp
++) { 
 351                 if (ihp 
>= &vdata
[IMG_SHSIZE
]) 
 357         /* Skip over leading spaces - until the interpreter name */ 
 358         while ( ihp 
< line_endp 
&& ((*ihp 
== ' ') || (*ihp 
== '\t'))) 
 362          * Find the last non-whitespace character before the end of line or 
 363          * the beginning of a comment; this is our new end of line. 
 365         for (;line_endp 
> ihp 
&& ((*line_endp 
== ' ') || (*line_endp 
== '\t')); line_endp
--) 
 369         if (line_endp 
== ihp
) 
 372         /* copy the interpreter name */ 
 373         interp 
= imgp
->ip_interp_name
; 
 374         while ((ihp 
< line_endp
) && (*ihp 
!= ' ') && (*ihp 
!= '\t')) 
 378         exec_save_path(imgp
, CAST_USER_ADDR_T(imgp
->ip_interp_name
), 
 382         while (ihp 
< line_endp
) { 
 383                 /* Skip leading whitespace before each argument */ 
 384                 while ((*ihp 
== ' ') || (*ihp 
== '\t')) 
 387                 if (ihp 
>= line_endp
) 
 390                 /* We have an argument; copy it */ 
 391                 while ((ihp 
< line_endp
) && (*ihp 
!= ' ') && (*ihp 
!= '\t')) {   
 392                         *imgp
->ip_strendp
++ = *ihp
++; 
 395                 *imgp
->ip_strendp
++ = 0; 
 408  * Image activator for fat 1.0 binaries.  If the binary is fat, then we 
 409  * need to select an image from it internally, and make that the image 
 410  * we are going to attempt to execute.  At present, this consists of 
 411  * reloading the first page for the image with a first page from the 
 412  * offset location indicated by the fat header. 
 414  * Important:   This image activator is byte order neutral. 
 416  * Note:        If we find an encapsulated binary, we make no assertions 
 417  *              about its  validity; instead, we leave that up to a rescan 
 418  *              for an activator to claim it, and, if it is claimed by one, 
 419  *              that activator is responsible for determining validity. 
 422 exec_fat_imgact(struct image_params 
*imgp
) 
 424         struct proc 
*p 
= vfs_context_proc(imgp
->ip_vfs_context
); 
 425         kauth_cred_t cred 
= p
->p_ucred
; 
 426         struct fat_header 
*fat_header 
= (struct fat_header 
*)imgp
->ip_vdata
; 
 427         struct fat_arch fat_arch
; 
 431         /* Make sure it's a fat binary */ 
 432         if ((fat_header
->magic 
!= FAT_MAGIC
) && 
 433             (fat_header
->magic 
!= FAT_CIGAM
)) { 
 438         /* Look up our preferred architecture in the fat file. */ 
 439         lret 
= fatfile_getarch_affinity(imgp
->ip_vp
, 
 440                                         (vm_offset_t
)fat_header
, 
 442                                         (p
->p_flag 
& P_AFFINITY
)); 
 443         if (lret 
!= LOAD_SUCCESS
) { 
 444                 error 
= load_return_to_errno(lret
); 
 448         /* Read the Mach-O header out of it */ 
 449         error 
= vn_rdwr(UIO_READ
, imgp
->ip_vp
, imgp
->ip_vdata
, 
 450                         PAGE_SIZE
, fat_arch
.offset
, 
 451                         UIO_SYSSPACE32
, (IO_UNIT
|IO_NODELOCKED
), 
 457         /* Did we read a complete header? */ 
 463         /* Success.  Indicate we have identified an encapsulated binary */ 
 465         imgp
->ip_arch_offset 
= (user_size_t
)fat_arch
.offset
; 
 466         imgp
->ip_arch_size 
= (user_size_t
)fat_arch
.size
; 
 475  * Image activator for mach-o 1.0 binaries. 
 477  * Important:   This image activator is NOT byte order neutral. 
 480 exec_mach_imgact(struct image_params 
*imgp
) 
 482         struct mach_header 
*mach_header 
= (struct mach_header 
*)imgp
->ip_vdata
; 
 483         kauth_cred_t            cred 
= vfs_context_ucred(imgp
->ip_vfs_context
); 
 484         struct proc             
*p 
= vfs_context_proc(imgp
->ip_vfs_context
); 
 490         struct uthread          
*uthread
; 
 491         vm_map_t old_map 
= VM_MAP_NULL
; 
 493         boolean_t                               clean_regions 
= FALSE
; 
 494     shared_region_mapping_t initial_region 
= NULL
; 
 496         load_result_t           load_result
; 
 499          * make sure it's a Mach-O 1.0 or Mach-O 2.0 binary; the difference 
 500          * is a reserved field on the end, so for the most part, we can 
 501          * treat them as if they were identical. 
 503         if ((mach_header
->magic 
!= MH_MAGIC
) && 
 504             (mach_header
->magic 
!= MH_MAGIC_64
)) { 
 509         task 
= current_task(); 
 510         thread 
= current_thread(); 
 511         uthread 
= get_bsdthread_info(thread
); 
 513         if (uthread
->uu_flag 
& UT_VFORK
) 
 514                 vfexec 
= 1;      /* Mark in exec */ 
 516         if ((mach_header
->cputype 
& CPU_ARCH_ABI64
) == CPU_ARCH_ABI64
) 
 517                 imgp
->ip_flags 
|= IMGPF_IS_64BIT
; 
 519         if (!grade_binary(mach_header
->cputype
, mach_header
->cpusubtype
)) { 
 525          * Copy in arguments/environment from the old process, if the 
 526          * vector is non-NULL (i.e. exec is not being called from 
 527          * load_init_program(), as a special case, at system startup). 
 529         if (imgp
->ip_user_argv 
!= 0LL) { 
 530                 error 
= exec_extract_strings(imgp
); 
 536          * Hack for binary compatability; put three NULs on the end of the 
 537          * string area, and round it up to the next word boundary.  This 
 538          * ensures padding with NULs to the boundary. 
 540         imgp
->ip_strendp
[0] = 0; 
 541         imgp
->ip_strendp
[1] = 0; 
 542         imgp
->ip_strendp
[2] = 0; 
 543         imgp
->ip_strendp 
+= (((imgp
->ip_strendp 
- imgp
->ip_strings
) + NBPW
-1) & ~(NBPW
-1)); 
 547                 kern_return_t   result
; 
 549                 result 
= task_create_internal(task
, FALSE
, &new_task
); 
 550                 if (result 
!= KERN_SUCCESS
) 
 551                 printf("execve: task_create failed. Code: 0x%x\n", result
); 
 553                 set_bsdtask_info(new_task
, p
); 
 556                 map 
= get_task_map(new_task
); 
 557                 result 
= thread_create(new_task
, &imgp
->ip_vfork_thread
); 
 558                 if (result 
!= KERN_SUCCESS
) 
 559                 printf("execve: thread_create failed. Code: 0x%x\n", result
); 
 560                 /* reset local idea of task, thread, uthread */ 
 562                 thread 
= imgp
->ip_vfork_thread
; 
 563                 uthread 
= get_bsdthread_info(thread
); 
 569          * We set these flags here; this is OK, since if we fail after 
 570          * this point, we have already destroyed the parent process anyway. 
 572         if (imgp
->ip_flags 
& IMGPF_IS_64BIT
) { 
 573                 task_set_64bit(task
, TRUE
); 
 576                 task_set_64bit(task
, FALSE
); 
 577                 p
->p_flag 
&= ~P_LP64
; 
 581          *      Load the Mach-O file. 
 583 /* LP64 - remove following "if" statement after osfmk/vm/task_working_set.c */ 
 584 if((imgp
->ip_flags 
& IMGPF_IS_64BIT
) == 0) 
 585         if(imgp
->ip_tws_cache_name
) { 
 586                 tws_handle_startup_file(task
, kauth_cred_getuid(cred
),  
 587                         imgp
->ip_tws_cache_name
, imgp
->ip_vp
, &clean_regions
); 
 590         vm_get_shared_region(task
, &initial_region
); 
 594          * NOTE: An error after this point  indicates we have potentially 
 595          * destroyed or overwrote some process state while attempting an 
 596          * execve() following a vfork(), which is an unrecoverable condition. 
 600          * We reset the task to 64-bit (or not) here.  It may have picked up 
 601          * a new map, and we need that to reflect its true 64-bit nature. 
 604                        ((imgp
->ip_flags 
& IMGPF_IS_64BIT
) == IMGPF_IS_64BIT
)); 
 607          * Actually load the image file we previously decided to load. 
 609         lret 
= load_machfile(imgp
, mach_header
, thread
, map
, clean_regions
, &load_result
); 
 611         if (lret 
!= LOAD_SUCCESS
) { 
 612                 error 
= load_return_to_errno(lret
); 
 616         /* load_machfile() maps the vnode */ 
 617         (void)ubc_map(imgp
->ip_vp
, PROT_EXEC
); 
 620          * deal with set[ug]id. 
 622         error 
= exec_handle_sugid(imgp
); 
 624         KNOTE(&p
->p_klist
, NOTE_EXEC
); 
 626         if (!vfexec 
&& (p
->p_flag 
& P_TRACED
)) 
 632         vnode_put(imgp
->ip_vp
); 
 635         if (load_result
.unixproc 
&& 
 636                 create_unix_stack(get_task_map(task
), 
 637                                   load_result
.user_stack
, load_result
.customstack
, p
)) { 
 638                 error 
= load_return_to_errno(LOAD_NOSPACE
); 
 643                 uthread
->uu_ar0 
= (void *)get_user_regs(thread
); 
 644                 old_map 
= vm_map_switch(get_task_map(task
)); 
 647         if (load_result
.unixproc
) { 
 651                  * Copy the strings area out into the new process address 
 655                 error 
= exec_copyout_strings(imgp
, &ap
); 
 658                                 vm_map_switch(old_map
); 
 662                 thread_setuserstack(thread
, ap
); 
 665         if (load_result
.dynlinker
) { 
 668                 /* Adjust the stack */ 
 669                 if (imgp
->ip_flags 
& IMGPF_IS_64BIT
) { 
 670                         ap 
= thread_adjuserstack(thread
, -8); 
 671                         (void)copyoutptr(load_result
.mach_header
, ap
, 8); 
 673                         ap 
= thread_adjuserstack(thread
, -4); 
 674                         (void)suword(ap
, load_result
.mach_header
); 
 679                 vm_map_switch(old_map
); 
 681         /* Set the entry point */ 
 682         thread_setentrypoint(thread
, load_result
.entry_point
); 
 688          * Reset signal state. 
 693          * Close file descriptors 
 694          * which specify close-on-exec. 
 699          * need to cancel async IO requests that can be cancelled and wait for those 
 700          * already active.  MAY BLOCK! 
 704         /* FIXME: Till vmspace inherit is fixed: */ 
 705         if (!vfexec 
&& p
->vm_shm
) 
 707         /* Clean up the semaphores */ 
 711          * Remember file name for accounting. 
 713         p
->p_acflag 
&= ~AFORK
; 
 714         /* If the translated name isn't NULL, then we want to use 
 715          * that translated name as the name we show as the "real" name. 
 716          * Otherwise, use the name passed into exec. 
 718         if (0 != imgp
->ip_p_comm
[0]) { 
 719                 bcopy((caddr_t
)imgp
->ip_p_comm
, (caddr_t
)p
->p_comm
, 
 722                 if (imgp
->ip_ndp
->ni_cnd
.cn_namelen 
> MAXCOMLEN
) 
 723                         imgp
->ip_ndp
->ni_cnd
.cn_namelen 
= MAXCOMLEN
; 
 724                 bcopy((caddr_t
)imgp
->ip_ndp
->ni_cnd
.cn_nameptr
, (caddr_t
)p
->p_comm
, 
 725                         (unsigned)imgp
->ip_ndp
->ni_cnd
.cn_namelen
); 
 726                 p
->p_comm
[imgp
->ip_ndp
->ni_cnd
.cn_namelen
] = '\0'; 
 730           /* This is for kdebug */ 
 731           long dbg_arg1
, dbg_arg2
, dbg_arg3
, dbg_arg4
; 
 733           /* Collect the pathname for tracing */ 
 734           kdbg_trace_string(p
, &dbg_arg1
, &dbg_arg2
, &dbg_arg3
, &dbg_arg4
); 
 740                   KERNEL_DEBUG_CONSTANT1((TRACEDBG_CODE(DBG_TRACE_DATA
, 2)) | DBG_FUNC_NONE
, 
 741                                         p
->p_pid 
,0,0,0, (unsigned int)thread
); 
 742                   KERNEL_DEBUG_CONSTANT1((TRACEDBG_CODE(DBG_TRACE_STRING
, 2)) | DBG_FUNC_NONE
, 
 743                                         dbg_arg1
, dbg_arg2
, dbg_arg3
, dbg_arg4
, (unsigned int)thread
); 
 747                   KERNEL_DEBUG_CONSTANT((TRACEDBG_CODE(DBG_TRACE_DATA
, 2)) | DBG_FUNC_NONE
, 
 749                   KERNEL_DEBUG_CONSTANT((TRACEDBG_CODE(DBG_TRACE_STRING
, 2)) | DBG_FUNC_NONE
, 
 750                                         dbg_arg1
, dbg_arg2
, dbg_arg3
, dbg_arg4
, 0); 
 754                 p
->p_flag 
&= ~P_CLASSIC
; 
 757          * mark as execed, wakeup the process that vforked (if any) and tell 
 758          * it that it now has it's own resources back 
 761         if (p
->p_pptr 
&& (p
->p_flag 
& P_PPWAIT
)) { 
 762                 p
->p_flag 
&= ~P_PPWAIT
; 
 763                 wakeup((caddr_t
)p
->p_pptr
); 
 766         if (vfexec 
&& (p
->p_flag 
& P_TRACED
)) { 
 767                 psignal_vfork(p
, new_task
, thread
, SIGTRAP
); 
 772                 task_deallocate(new_task
); 
 773                 thread_deallocate(thread
); 
 786  * Our image activator table; this is the table of the image types we are 
 787  * capable of loading.  We list them in order of preference to ensure the 
 788  * fastest image load speed. 
 790  * XXX hardcoded, for now; should use linker sets 
 793         int (*ex_imgact
)(struct image_params 
*); 
 796         { exec_mach_imgact
,             "Mach-o Binary" }, 
 797         { exec_fat_imgact
,              "Fat Binary" }, 
 798         { exec_shell_imgact
,            "Interpreter Script" }, 
 804  * TODO:        Dynamic linker header address on stack is copied via suword() 
 808 execve(struct proc 
*p
, struct execve_args 
*uap
, register_t 
*retval
) 
 810         kauth_cred_t cred 
= p
->p_ucred
; 
 811         struct image_params image_params
, *imgp
; 
 812         struct vnode_attr va
; 
 813         struct vnode_attr origva
; 
 815         struct uthread          
*uthread
; 
 821         int once 
= 1;   /* save SGUID-ness for interpreted files */ 
 822         char alt_p_comm
[sizeof(p
->p_comm
)] = {0};       /* for Classic */ 
 823         int is_64 
= IS_64BIT_PROCESS(p
); 
 824         int seg 
= (is_64 
? UIO_USERSPACE64 
: UIO_USERSPACE32
); 
 825         struct vfs_context context
; 
 828         context
.vc_ucred 
= p
->p_ucred
;  /* XXX must NOT be kauth_cred_get() */ 
 831         imgp 
= &image_params
; 
 833         /* Initialize the common data in the image_params structure */ 
 834         bzero(imgp
, sizeof(*imgp
)); 
 835         imgp
->ip_user_fname 
= uap
->fname
; 
 836         imgp
->ip_user_argv 
= uap
->argp
; 
 837         imgp
->ip_user_envv 
= uap
->envp
; 
 838         imgp
->ip_vattr 
= &va
; 
 839         imgp
->ip_origvattr 
= &origva
; 
 840         imgp
->ip_vfs_context 
= &context
; 
 841         imgp
->ip_flags 
= (is_64 
? IMGPF_WAS_64BIT 
: IMGPF_NONE
); 
 842         imgp
->ip_tws_cache_name 
= NULL
; 
 843         imgp
->ip_p_comm 
= alt_p_comm
;           /* for Classic */ 
 846          * XXXAUDIT: Currently, we only audit the pathname of the binary. 
 847          * There may also be poor interaction with dyld. 
 850         task 
= current_task(); 
 851         uthread 
= get_bsdthread_info(current_thread()); 
 853         if (uthread
->uu_flag 
& UT_VFORK
) { 
 854                         vfexec 
= 1; /* Mark in exec */ 
 856                 if (task 
!= kernel_task
) {  
 857                         numthreads 
= get_task_numacts(task
); 
 858                         if (numthreads 
<= 0 ) 
 860                         if (numthreads 
> 1) { 
 866         error 
= execargs_alloc(imgp
); 
 871          * XXXAUDIT: Note: the double copyin introduces an audit 
 872          * race.  To correct this race, we must use a single 
 873          * copyin(), e.g. by passing a flag to namei to indicate an 
 874          * external path buffer is being used. 
 876         error 
= exec_save_path(imgp
, uap
->fname
, seg
); 
 883          * No app profiles under chroot 
 885         if((p
->p_fd
->fd_rdir 
== NULLVP
) && (app_profile 
!= 0)) { 
 887                 /* grab the name of the file out of its path */ 
 888                 /* we will need this for lookup within the   */ 
 890                 /* Scan backwards for the first '/' or start of string */ 
 891                 imgp
->ip_tws_cache_name 
= imgp
->ip_strendp
; 
 892                 while (imgp
->ip_tws_cache_name
[0] != '/') { 
 893                         if(imgp
->ip_tws_cache_name 
== imgp
->ip_strings
) { 
 894                                 imgp
->ip_tws_cache_name
--; 
 897                         imgp
->ip_tws_cache_name
--; 
 899                 imgp
->ip_tws_cache_name
++; 
 901         NDINIT(&nd
, LOOKUP
, FOLLOW 
| LOCKLEAF 
| AUDITVNPATH1
, 
 902                 seg
, uap
->fname
, imgp
->ip_vfs_context
); 
 908         imgp
->ip_ndp 
= &nd
;     /* successful namei(); call nameidone() later */ 
 909         imgp
->ip_vp 
= nd
.ni_vp
; /* if set, need to vnode_put() at some point */ 
 911         error 
= exec_check_permissions(imgp
); 
 915         /* Copy; avoid invocation of an interpreter overwriting the original */ 
 921         error 
= vn_rdwr(UIO_READ
, imgp
->ip_vp
, imgp
->ip_vdata
, PAGE_SIZE
, 0, 
 922                         UIO_SYSSPACE32
, IO_NODELOCKED
, cred
, &resid
, p
); 
 928         for(i 
= 0; error 
== -1 && execsw
[i
].ex_imgact 
!= NULL
; i
++) { 
 930                 error 
= (*execsw
[i
].ex_imgact
)(imgp
); 
 933                 /* case -1: not claimed: continue */ 
 934                 case -2:                /* Encapsulated binary */ 
 935                         goto encapsulated_binary
; 
 937                 case -3:                /* Interpreter */ 
 938                         vnode_put(imgp
->ip_vp
); 
 939                         imgp
->ip_vp 
= NULL
;     /* already put */ 
 940                         nd
.ni_cnd
.cn_nameiop 
= LOOKUP
; 
 941                         nd
.ni_cnd
.cn_flags 
= (nd
.ni_cnd
.cn_flags 
& HASBUF
) | 
 945                         nd
.ni_segflg 
= UIO_SYSSPACE32
; 
 946                         nd
.ni_dirp 
= CAST_USER_ADDR_T(imgp
->ip_interp_name
); 
 954         /* call out to allow 3rd party notification of exec.  
 955          * Ignore result of kauth_authorize_fileop call. 
 957         if (error 
== 0 && kauth_authorize_fileop_has_listeners()) { 
 958                 kauth_authorize_fileop(vfs_context_ucred(&context
), KAUTH_FILEOP_EXEC
,  
 959                                                            (uintptr_t)nd
.ni_vp
, 0); 
 962         /* Image not claimed by any activator? */ 
 968                 nameidone(imgp
->ip_ndp
); 
 970                 vnode_put(imgp
->ip_vp
); 
 971         if (imgp
->ip_strings
) 
 973         if (!error 
&& vfexec
) { 
 974                         vfork_return(current_thread(), p
->p_pptr
, p
, retval
); 
 975                         (void)thread_resume(imgp
->ip_vfork_thread
); 
 983 copyinptr(user_addr_t froma
, user_addr_t 
*toptr
, int ptr_size
) 
 988                 /* 64 bit value containing 32 bit address */ 
 991                 error 
= copyin(froma
, &i
, 4); 
 992                 *toptr 
= CAST_USER_ADDR_T(i
);   /* SAFE */ 
 994                 error 
= copyin(froma
, toptr
, 8); 
1001 copyoutptr(user_addr_t ua
, user_addr_t ptr
, int ptr_size
) 
1005         if (ptr_size 
== 4) { 
1006                 /* 64 bit value containing 32 bit address */ 
1007                 unsigned int i 
= CAST_DOWN(unsigned int,ua
);    /* SAFE */ 
1009                 error 
= copyout(&i
, ptr
, 4); 
1011                 error 
= copyout(&ua
, ptr
, 8); 
1018  * exec_copyout_strings 
1020  * Copy out the strings segment to user space.  The strings segment is put 
1021  * on a preinitialized stack frame. 
1023  * Parameters:  struct image_params *   the image parameter block 
1024  *              int *                   a pointer to the stack offset variable 
1026  * Returns:     0                       Success 
1030  *              (*stackp)               The stack offset, modified 
1032  * Note:        The strings segment layout is backward, from the beginning 
1033  *              of the top of the stack to consume the minimal amount of 
1034  *              space possible; the returned stack pointer points to the 
1035  *              end of the area consumed (stacks grow upward). 
1037  *              argc is an int; arg[i] are pointers; env[i] are pointers; 
1038  *              exec_path is a pointer; the 0's are (void *)NULL's 
1040  * The stack frame layout is: 
1063  *      |  exec_path  | In MacOS X PR2 Beaker2E the path passed to exec() is 
1064  *      +-------------+ passed on the stack just after the trailing 0 of the 
1065  *      |      0      | the envp[] array as a pointer to a string. 
1072  *      |             | <- p->user_stack 
1075  * Although technically a part of the STRING AREA, we treat the PATH AREA as 
1076  * a separate entity.  This allows us to align the beginning of the PATH AREA 
1077  * to a pointer boundary so that the exec_path, env[i], and argv[i] pointers 
1078  * which preceed it on the stack are properly aligned. 
1080  * TODO:        argc copied with suword(), which takes a 64 bit address 
1083 exec_copyout_strings(struct image_params 
*imgp
, user_addr_t 
*stackp
) 
1085         struct proc 
*p 
= vfs_context_proc(imgp
->ip_vfs_context
); 
1086         int     ptr_size 
= (imgp
->ip_flags 
& IMGPF_IS_64BIT
) ? 8 : 4; 
1087         char    *argv 
= imgp
->ip_argv
;  /* modifiable copy of argv */ 
1088         user_addr_t     string_area
;    /* *argv[], *env[] */ 
1089         user_addr_t     path_area
;      /* package launch path */ 
1090         user_addr_t     ptr_area
;       /* argv[], env[], exec_path */ 
1092         int     stringc 
= imgp
->ip_argc 
+ imgp
->ip_envc
; 
1100          * Set up pointers to the beginning of the string area, the beginning 
1101          * of the path area, and the beginning of the pointer area (actually, 
1102          * the location of argc, an int, which may be smaller than a pointer, 
1103          * but we use ptr_size worth of space for it, for alignment). 
1105         string_area 
= stack 
- (((imgp
->ip_strendp 
- imgp
->ip_strings
) + ptr_size
-1) & ~(ptr_size
-1)) - ptr_size
; 
1106         path_area 
= string_area 
- (((imgp
->ip_argv 
- imgp
->ip_strings
) + ptr_size
-1) & ~(ptr_size
-1)); 
1107         ptr_area 
= path_area 
- ((imgp
->ip_argc 
+ imgp
->ip_envc 
+ 4) * ptr_size
) - ptr_size 
/*argc*/; 
1109         /* Return the initial stack address: the location of argc */ 
1113          * Record the size of the arguments area so that sysctl_procargs() 
1114          * can return the argument area without having to parse the arguments. 
1116         p
->p_argc 
= imgp
->ip_argc
; 
1117         p
->p_argslen 
= (int)(stack 
- path_area
); 
1121          * Support for new app package launching for Mac OS X allocates 
1122          * the "path" at the begining of the imgp->ip_strings buffer. 
1123          * copy it just before the string area. 
1126         error 
= copyoutstr(imgp
->ip_strings
, path_area
, 
1127                                 (unsigned)(imgp
->ip_argv 
- imgp
->ip_strings
), 
1133         /* Save a NULL pointer below it */ 
1134         (void)copyoutptr(0LL, path_area 
- ptr_size
, ptr_size
); 
1136         /* Save the pointer to "path" just below it */ 
1137         (void)copyoutptr(path_area
, path_area 
- 2*ptr_size
, ptr_size
); 
1140          * ptr_size for 2 NULL one each ofter arg[argc -1] and env[n] 
1142          * skip over saved path, ptr_size for pointer to path, 
1143          * and ptr_size for the NULL after pointer to path. 
1146         /* argc (int32, stored in a ptr_size area) */ 
1147         (void)suword(ptr_area
, imgp
->ip_argc
); 
1148         ptr_area 
+= sizeof(int); 
1149         /* pad to ptr_size, if 64 bit image, to ensure user stack alignment */ 
1150         if (imgp
->ip_flags 
& IMGPF_IS_64BIT
) { 
1151                 (void)suword(ptr_area
, 0);      /* int, not long: ignored */ 
1152                 ptr_area 
+= sizeof(int); 
1157          * We use (string_area - path_area) here rather than the more 
1158          * intuitive (imgp->ip_argv - imgp->ip_strings) because we are 
1159          * interested in the length of the PATH_AREA in user space, 
1160          * rather than the actual length of the execution path, since 
1161          * it includes alignment padding of the PATH_AREA + STRING_AREA 
1162          * to a ptr_size boundary. 
1164         strspace 
= SIZE_IMG_STRSPACE 
- (string_area 
- path_area
); 
1166                 if (stringc 
== imgp
->ip_envc
) { 
1167                         /* argv[n] = NULL */ 
1168                         (void)copyoutptr(0LL, ptr_area
, ptr_size
); 
1169                         ptr_area 
+= ptr_size
; 
1174                 /* pointer: argv[n]/env[n] */ 
1175                 (void)copyoutptr(string_area
, ptr_area
, ptr_size
); 
1177                 /* string : argv[n][]/env[n][] */ 
1179                         if (strspace 
<= 0) { 
1183                         error 
= copyoutstr(argv
, string_area
, 
1189                 } while (error 
== ENAMETOOLONG
); 
1190                 if (error 
== EFAULT 
|| error 
== E2BIG
) 
1191                         break;  /* bad stack - user's problem */ 
1192                 ptr_area 
+= ptr_size
; 
1195         (void)copyoutptr(0LL, ptr_area
, ptr_size
); 
1203  * exec_extract_strings 
1205  * Copy arguments and environment from user space into work area; we may 
1206  * have already copied some early arguments into the work area, and if 
1207  * so, any arguments opied in are appended to those already there. 
1209  * Parameters:  struct image_params *   the image parameter block 
1211  * Returns:     0                       Success 
1215  *              (imgp->ip_argc)         Count of arguments, updated 
1216  *              (imgp->ip_envc)         Count of environment strings, updated 
1219  * Notes:       The argument and environment vectors are user space pointers 
1220  *              to arrays of user space pointers. 
1223 exec_extract_strings(struct image_params 
*imgp
) 
1226         struct proc 
*p 
= vfs_context_proc(imgp
->ip_vfs_context
); 
1227         int seg 
= (IS_64BIT_PROCESS(p
) ? UIO_USERSPACE64 
: UIO_USERSPACE32
); 
1228         int     ptr_size 
= (imgp
->ip_flags 
& IMGPF_WAS_64BIT
) ? 8 : 4; 
1229         user_addr_t     argv 
= imgp
->ip_user_argv
; 
1230         user_addr_t     envv 
= imgp
->ip_user_envv
; 
1232         /* Now, get rest of arguments */ 
1235          * If we are running an interpreter, replace the av[0] that was 
1236          * passed to execve() with the fully qualified path name that was 
1237          * passed to execve() for interpreters which do not use the PATH 
1238          * to locate their script arguments. 
1240         if((imgp
->ip_flags 
& IMGPF_INTERPRET
) != 0 && argv 
!= 0LL) { 
1243                 error 
= copyinptr(argv
, &arg
, ptr_size
); 
1246                 if (arg 
!= 0LL && arg 
!= (user_addr_t
)-1) { 
1248                         error 
= exec_add_string(imgp
, imgp
->ip_user_fname
, seg
); 
1255         while (argv 
!= 0LL) { 
1258                 error 
= copyinptr(argv
, &arg
, ptr_size
); 
1265                 } else if (arg 
== (user_addr_t
)-1) { 
1266                         /* Um... why would it be -1? */ 
1273                 error 
= exec_add_string(imgp
, arg
, seg
); 
1279         /* Now, get the environment */ 
1280         while (envv 
!= 0LL) { 
1283                 error 
= copyinptr(envv
, &env
, ptr_size
); 
1290                 } else if (env 
== (user_addr_t
)-1) { 
1297                 error 
= exec_add_string(imgp
, env
, seg
); 
1307 #define unix_stack_size(p)      (p->p_rlimit[RLIMIT_STACK].rlim_cur) 
1310 exec_check_permissions(struct image_params 
*imgp
) 
1312         struct vnode 
*vp 
= imgp
->ip_vp
; 
1313         struct vnode_attr 
*vap 
= imgp
->ip_vattr
; 
1314         struct proc 
*p 
= vfs_context_proc(imgp
->ip_vfs_context
); 
1316         kauth_action_t action
; 
1318         /* Only allow execution of regular files */ 
1319         if (!vnode_isreg(vp
)) 
1322         /* Get the file attributes that we will be using here and elsewhere */ 
1324         VATTR_WANTED(vap
, va_uid
); 
1325         VATTR_WANTED(vap
, va_gid
); 
1326         VATTR_WANTED(vap
, va_mode
); 
1327         VATTR_WANTED(vap
, va_fsid
); 
1328         VATTR_WANTED(vap
, va_fileid
); 
1329         VATTR_WANTED(vap
, va_data_size
); 
1330         if ((error 
= vnode_getattr(vp
, vap
, imgp
->ip_vfs_context
)) != 0) 
1334          * Ensure that at least one execute bit is on - otherwise root 
1335          * will always succeed, and we don't want to happen unless the 
1336          * file really is executable. 
1338         if ((vap
->va_mode 
& (S_IXUSR 
| S_IXGRP 
| S_IXOTH
)) == 0) 
1341         /* Disallow zero length files */ 
1342         if (vap
->va_data_size 
== 0) 
1345         imgp
->ip_arch_offset 
= (user_size_t
)0; 
1346         imgp
->ip_arch_size 
= vap
->va_data_size
; 
1348         /* Disable setuid-ness for traced programs or if MNT_NOSUID */ 
1349         if ((vp
->v_mount
->mnt_flag 
& MNT_NOSUID
) || (p
->p_flag 
& P_TRACED
)) 
1350                 vap
->va_mode 
&= ~(VSUID 
| VSGID
); 
1352         /* Check for execute permission */ 
1353         action 
= KAUTH_VNODE_EXECUTE
; 
1354         /* Traced images must also be readable */ 
1355         if (p
->p_flag 
& P_TRACED
) 
1356                 action 
|= KAUTH_VNODE_READ_DATA
; 
1357         if ((error 
= vnode_authorize(vp
, NULL
, action
, imgp
->ip_vfs_context
)) != 0) 
1360         /* Don't let it run if anyone had it open for writing */ 
1361         if (vp
->v_writecount
) 
1365         /* XXX May want to indicate to underlying FS that vnode is open */ 
1373  * Initially clear the P_SUGID in the process flags; if an SUGID process is 
1374  * exec'ing a non-SUGID image, then  this is the point of no return. 
1376  * If the image being activated is SUGI, then replace the credential with a 
1377  * copy, disable tracing (unless the tracing process is root), reset the 
1378  * mach task port to revoke it, set the P_SUGID bit, 
1380  * If the saved user and group ID will be changing, then make sure it happens 
1381  * to a new credential, rather than a shared one. 
1383  * Set the security token (this is probably obsolete, given that the token 
1384  * should not technically be separate from the credential itself). 
1386  * Parameters:  struct image_params *   the image parameter block 
1388  * Returns:     void                    No failure indication 
1391  *              <process credential>    Potentially modified/replaced 
1392  *              <task port>             Potentially revoked 
1393  *              <process flags>         P_SUGID bit potentially modified 
1394  *              <security token>        Potentially modified 
1397 exec_handle_sugid(struct image_params 
*imgp
) 
1399         kauth_cred_t            cred 
= vfs_context_ucred(imgp
->ip_vfs_context
); 
1400         struct proc             
*p 
= vfs_context_proc(imgp
->ip_vfs_context
); 
1403         static struct vnode     
*dev_null 
= NULLVP
; 
1405         p
->p_flag 
&= ~P_SUGID
; 
1407         if (((imgp
->ip_origvattr
->va_mode 
& VSUID
) != 0 && 
1408              kauth_cred_getuid(cred
) != imgp
->ip_origvattr
->va_uid
) || 
1409             ((imgp
->ip_origvattr
->va_mode 
& VSGID
) != 0 && 
1410              cred
->cr_gid 
!= imgp
->ip_origvattr
->va_gid
)) { 
1413                  * If process is being ktraced, turn off - unless 
1416                 if (p
->p_tracep 
&& !(p
->p_traceflag 
& KTRFAC_ROOT
)) { 
1417                         struct vnode 
*tvp 
= p
->p_tracep
; 
1424                  * Replace the credential with a copy of itself if euid or egid change. 
1426                 if (imgp
->ip_origvattr
->va_mode 
& VSUID
) { 
1427                         p
->p_ucred 
= kauth_cred_seteuid(p
->p_ucred
, imgp
->ip_origvattr
->va_uid
); 
1429                 if (imgp
->ip_origvattr
->va_mode 
& VSGID
) { 
1430                         p
->p_ucred 
= kauth_cred_setegid(p
->p_ucred
, imgp
->ip_origvattr
->va_gid
); 
1434                  * Have mach reset the task port.  We don't want 
1435                  * anyone who had the task port before a setuid 
1436                  * exec to be able to access/control the task 
1439                 if (current_task() == p
->task
) 
1440                         ipc_task_reset(p
->task
); 
1442                 p
->p_flag 
|= P_SUGID
; 
1444                 /* Cache the vnode for /dev/null the first time around */ 
1445                 if (dev_null 
== NULLVP
) { 
1446                         struct nameidata nd1
; 
1448                         NDINIT(&nd1
, LOOKUP
, FOLLOW
, UIO_SYSSPACE32
, 
1449                             CAST_USER_ADDR_T("/dev/null"), 
1450                             imgp
->ip_vfs_context
); 
1452                         if ((error 
= vn_open(&nd1
, FREAD
, 0)) == 0) { 
1453                                 dev_null 
= nd1
.ni_vp
; 
1455                                  * vn_open returns with both a use_count 
1456                                  * and an io_count on the found vnode 
1457                                  * drop the io_count, but keep the use_count 
1459                                 vnode_put(nd1
.ni_vp
); 
1463                 /* Radar 2261856; setuid security hole fix */ 
1464                 /* Patch from OpenBSD: A. Ramesh */ 
1466                  * XXX For setuid processes, attempt to ensure that 
1467                  * stdin, stdout, and stderr are already allocated. 
1468                  * We do not want userland to accidentally allocate 
1469                  * descriptors in this range which has implied meaning 
1472                 if (dev_null 
!= NULLVP
) { 
1473                         for (i 
= 0; i 
< 3; i
++) { 
1474                                 struct fileproc 
*fp
; 
1477                                 if (p
->p_fd
->fd_ofiles
[i
] != NULL
) 
1480                                 if ((error 
= falloc(p
, &fp
, &indx
)) != 0) 
1483                                 if ((error 
= vnode_ref_ext(dev_null
, FREAD
)) != 0) { 
1484                                         fp_free(p
, indx
, fp
); 
1488                                 fp
->f_fglob
->fg_flag 
= FREAD
; 
1489                                 fp
->f_fglob
->fg_type 
= DTYPE_VNODE
; 
1490                                 fp
->f_fglob
->fg_ops 
= &vnops
; 
1491                                 fp
->f_fglob
->fg_data 
= (caddr_t
)dev_null
; 
1494                                 *fdflags(p
, indx
) &= ~UF_RESERVED
; 
1495                                 fp_drop(p
, indx
, fp
, 1); 
1499                          * for now we need to drop the reference immediately 
1500                          * since we don't have any mechanism in place to 
1501                          * release it before starting to unmount "/dev" 
1502                          * during a reboot/shutdown 
1504                         vnode_rele(dev_null
); 
1510          * Implement the semantic where the effective user and group become 
1511          * the saved user and group in exec'ed programs. 
1513         p
->p_ucred 
= kauth_cred_setsvuidgid(p
->p_ucred
, kauth_cred_getuid(p
->p_ucred
),  p
->p_ucred
->cr_gid
); 
1515         /* XXX Obsolete; security token should not be separate from cred */ 
1516         set_security_token(p
); 
1521 static kern_return_t
 
1522 create_unix_stack(vm_map_t map
, user_addr_t user_stack
, int customstack
, 
1525         mach_vm_size_t  size
; 
1526         mach_vm_offset_t addr
; 
1528         p
->user_stack 
= user_stack
; 
1530                 size 
= mach_vm_round_page(unix_stack_size(p
)); 
1531                 addr 
= mach_vm_trunc_page(user_stack 
- size
); 
1532                 return (mach_vm_allocate(map
, &addr
, size
, 
1533                                         VM_MAKE_TAG(VM_MEMORY_STACK
) | 
1536                 return(KERN_SUCCESS
); 
1539 #include <sys/reboot.h> 
1541 static char             init_program_name
[128] = "/sbin/launchd"; 
1542 static const char *     other_init 
= "/sbin/mach_init"; 
1544 char            init_args
[128] = ""; 
1546 struct execve_args      init_exec_args
; 
1547 int             init_attempts 
= 0; 
1551 load_init_program(struct proc 
*p
) 
1553         vm_offset_t     init_addr
; 
1556         register_t      retval
[2]; 
1560         /* init_args are copied in string form directly from bootstrap */ 
1563                 if (boothowto 
& RB_INITNAME
) { 
1564                         printf("init program? "); 
1566                         gets(init_program_name
, init_program_name
); 
1567 #endif  /* FIXME ] */ 
1570                 if (error 
&& ((boothowto 
& RB_INITNAME
) == 0) && 
1571                                         (init_attempts 
== 1)) { 
1572                         printf("Load of %s, errno %d, trying %s\n", 
1573                                 init_program_name
, error
, other_init
); 
1575                         bcopy(other_init
, init_program_name
, 
1576                                                         sizeof(other_init
)); 
1582                         printf("Load of %s failed, errno %d\n", 
1583                                         init_program_name
, error
); 
1585                         boothowto 
|= RB_INITNAME
; 
1590                  *      Copy out program name. 
1593                 init_addr 
= VM_MIN_ADDRESS
; 
1594                 (void) vm_allocate(current_map(), &init_addr
, 
1595                                    PAGE_SIZE
, VM_FLAGS_ANYWHERE
); 
1599                 (void) copyout((caddr_t
) init_program_name
, 
1600                                 CAST_USER_ADDR_T(init_addr
), 
1601                                 (unsigned) sizeof(init_program_name
)+1); 
1603                 argv
[0] = (char *) init_addr
; 
1604                 init_addr 
+= sizeof(init_program_name
); 
1605                 init_addr 
= (vm_offset_t
)ROUND_PTR(char, init_addr
); 
1608                  *      Put out first (and only) argument, similarly. 
1609                  *      Assumes everything fits in a page as allocated 
1613                 (void) copyout((caddr_t
) init_args
, 
1614                                 CAST_USER_ADDR_T(init_addr
), 
1615                                 (unsigned) sizeof(init_args
)); 
1617                 argv
[1] = (char *) init_addr
; 
1618                 init_addr 
+= sizeof(init_args
); 
1619                 init_addr 
= (vm_offset_t
)ROUND_PTR(char, init_addr
); 
1622                  *      Null-end the argument list 
1625                 argv
[2] = (char *) 0; 
1628                  *      Copy out the argument list. 
1631                 (void) copyout((caddr_t
) argv
, 
1632                                 CAST_USER_ADDR_T(init_addr
), 
1633                                 (unsigned) sizeof(argv
)); 
1636                  *      Set up argument block for fake call to execve. 
1639                 init_exec_args
.fname 
= CAST_USER_ADDR_T(argv
[0]); 
1640                 init_exec_args
.argp 
= CAST_USER_ADDR_T((char **)init_addr
); 
1641                 init_exec_args
.envp 
= CAST_USER_ADDR_T(0); 
1643                 /* So that mach_init task  
1644                  * is set with uid,gid 0 token  
1646                 set_security_token(p
); 
1648                 error 
= execve(p
,&init_exec_args
,retval
); 
1653  * Convert a load_return_t to an errno. 
1656 load_return_to_errno(load_return_t lrtn
) 
1682 #include <mach/mach_types.h> 
1683 #include <mach/vm_prot.h> 
1684 #include <mach/semaphore.h> 
1685 #include <mach/sync_policy.h> 
1686 #include <kern/clock.h> 
1687 #include <mach/kern_return.h> 
1689 extern semaphore_t execve_semaphore
; 
1692  * The block of memory used by the execve arguments.  At the same time, 
1693  * we allocate a page so that we can read in the first page of the image. 
1696 execargs_alloc(struct image_params 
*imgp
) 
1700         kret 
= semaphore_wait(execve_semaphore
); 
1701         if (kret 
!= KERN_SUCCESS
) 
1705                 case KERN_INVALID_ADDRESS
: 
1706                 case KERN_PROTECTION_FAILURE
: 
1709                 case KERN_OPERATION_TIMED_OUT
: 
1713         kret 
= kmem_alloc_pageable(bsd_pageable_map
, (vm_offset_t 
*)&imgp
->ip_strings
, NCARGS 
+ PAGE_SIZE
); 
1714         imgp
->ip_vdata 
= imgp
->ip_strings 
+ NCARGS
; 
1715         if (kret 
!= KERN_SUCCESS
) { 
1716                 semaphore_signal(execve_semaphore
); 
1723 execargs_free(struct image_params 
*imgp
) 
1727         kmem_free(bsd_pageable_map
, (vm_offset_t
)imgp
->ip_strings
, NCARGS 
+ PAGE_SIZE
); 
1728         imgp
->ip_strings 
= NULL
; 
1730         kret 
= semaphore_signal(execve_semaphore
); 
1732         case KERN_INVALID_ADDRESS
: 
1733         case KERN_PROTECTION_FAILURE
: 
1736         case KERN_OPERATION_TIMED_OUT
: