2 * Copyright (c) 2000-2008 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
28 /* Copyright (c) 1995, 1997 Apple Computer, Inc. All Rights Reserved */
30 * Copyright (c) 1982, 1986, 1991, 1993
31 * The Regents of the University of California. All rights reserved.
32 * (c) UNIX System Laboratories, Inc.
33 * All or some portions of this file are derived from material licensed
34 * to the University of California by American Telephone and Telegraph
35 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
36 * the permission of UNIX System Laboratories, Inc.
38 * Redistribution and use in source and binary forms, with or without
39 * modification, are permitted provided that the following conditions
41 * 1. Redistributions of source code must retain the above copyright
42 * notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 * notice, this list of conditions and the following disclaimer in the
45 * documentation and/or other materials provided with the distribution.
46 * 3. All advertising materials mentioning features or use of this software
47 * must display the following acknowledgement:
48 * This product includes software developed by the University of
49 * California, Berkeley and its contributors.
50 * 4. Neither the name of the University nor the names of its contributors
51 * may be used to endorse or promote products derived from this software
52 * without specific prior written permission.
54 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
55 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
56 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
57 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
58 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
59 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
60 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
61 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
62 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
63 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
66 * @(#)kern_resource.c 8.5 (Berkeley) 1/21/94
69 * NOTICE: This file was modified by SPARTA, Inc. in 2005 to introduce
70 * support for mandatory and extensible security protections. This notice
71 * is included in support of clause 2.2 (b) of the Apple Public License,
75 #include <sys/param.h>
76 #include <sys/systm.h>
77 #include <sys/sysctl.h>
78 #include <sys/kernel.h>
79 #include <sys/file_internal.h>
80 #include <sys/resourcevar.h>
81 #include <sys/malloc.h>
82 #include <sys/proc_internal.h>
83 #include <sys/kauth.h>
84 #include <machine/spl.h>
86 #include <sys/mount_internal.h>
87 #include <sys/sysproto.h>
89 #include <security/audit/audit.h>
91 #include <machine/vmparam.h>
93 #include <mach/mach_types.h>
94 #include <mach/time_value.h>
95 #include <mach/task.h>
96 #include <mach/task_info.h>
97 #include <mach/vm_map.h>
98 #include <mach/mach_vm.h>
99 #include <mach/thread_act.h> /* for thread_policy_set( ) */
100 #include <kern/lock.h>
101 #include <kern/thread.h>
103 #include <kern/task.h>
104 #include <kern/clock.h> /* for absolutetime_to_microtime() */
105 #include <netinet/in.h> /* for TRAFFIC_MGT_SO_* */
106 #include <sys/socketvar.h> /* for struct socket */
108 #include <vm/vm_map.h>
110 int donice(struct proc
*curp
, struct proc
*chgp
, int n
);
111 int dosetrlimit(struct proc
*p
, u_int which
, struct rlimit
*limp
);
112 int uthread_get_background_state(uthread_t
);
113 static void do_background_socket(struct proc
*p
, thread_t thread
, int priority
);
114 static int do_background_thread(struct proc
*curp
, int priority
);
115 static int do_background_task(struct proc
*curp
, int priority
);
117 rlim_t maxdmap
= MAXDSIZ
; /* XXX */
118 rlim_t maxsmap
= MAXSSIZ
- PAGE_SIZE
; /* XXX */
121 * Limits on the number of open files per process, and the number
122 * of child processes per process.
124 * Note: would be in kern/subr_param.c in FreeBSD.
126 __private_extern__
int maxfilesperproc
= OPEN_MAX
; /* per-proc open files limit */
128 SYSCTL_INT( _kern
, KERN_MAXPROCPERUID
, maxprocperuid
, CTLFLAG_RW
,
129 &maxprocperuid
, 0, "Maximum processes allowed per userid" );
131 SYSCTL_INT( _kern
, KERN_MAXFILESPERPROC
, maxfilesperproc
, CTLFLAG_RW
,
132 &maxfilesperproc
, 0, "Maximum files allowed open per process" );
134 /* Args and fn for the proc_iterate callback used by setpriority (PRIO_USER) */
135 struct puser_nice_args
{
142 static int puser_donice_callback(proc_t p
, void * arg
);
145 /* Args and fn for the pgrp_iterate callback used by setpriority (PRIO_PGRP) */
146 struct ppgrp_nice_args
{
152 static int ppgrp_donice_callback(proc_t p
, void * arg
);
155 * Resource controls and accounting.
158 getpriority(struct proc
*curp
, struct getpriority_args
*uap
, int32_t *retval
)
161 int low
= PRIO_MAX
+ 1;
162 kauth_cred_t my_cred
;
164 /* would also test (uap->who < 0), but id_t is unsigned */
165 if (uap
->who
> 0x7fffffff)
168 switch (uap
->which
) {
175 p
= proc_find(uap
->who
);
185 struct pgrp
*pg
= PGRP_NULL
;
188 /* returns the pgrp to ref */
189 pg
= proc_pgrp(curp
);
190 } else if ((pg
= pgfind(uap
->who
)) == PGRP_NULL
) {
193 /* No need for iteration as it is a simple scan */
195 for (p
= pg
->pg_members
.lh_first
; p
!= 0; p
= p
->p_pglist
.le_next
) {
206 uap
->who
= kauth_cred_getuid(kauth_cred_get());
210 for (p
= allproc
.lh_first
; p
!= 0; p
= p
->p_list
.le_next
) {
211 my_cred
= kauth_cred_proc_ref(p
);
212 if (kauth_cred_getuid(my_cred
) == uap
->who
&&
215 kauth_cred_unref(&my_cred
);
222 case PRIO_DARWIN_THREAD
: {
226 /* we currently only support the current thread */
231 thread
= current_thread();
232 ut
= get_bsdthread_info(thread
);
235 if ( (ut
->uu_flag
& UT_BACKGROUND_TRAFFIC_MGT
) != 0 ) {
244 if (low
== PRIO_MAX
+ 1)
250 /* call back function used for proc iteration in PRIO_USER */
252 puser_donice_callback(proc_t p
, void * arg
)
255 struct puser_nice_args
* pun
= (struct puser_nice_args
*)arg
;
256 kauth_cred_t my_cred
;
258 my_cred
= kauth_cred_proc_ref(p
);
259 if (kauth_cred_getuid(my_cred
) == pun
->who
) {
260 error
= donice(pun
->curp
, p
, pun
->prio
);
261 if (pun
->errorp
!= NULL
)
262 *pun
->errorp
= error
;
263 if (pun
->foundp
!= NULL
) {
268 kauth_cred_unref(&my_cred
);
270 return(PROC_RETURNED
);
273 /* call back function used for proc iteration in PRIO_PGRP */
275 ppgrp_donice_callback(proc_t p
, void * arg
)
278 struct ppgrp_nice_args
* pun
= (struct ppgrp_nice_args
*)arg
;
281 error
= donice(pun
->curp
, p
, pun
->prio
);
282 if (pun
->errorp
!= NULL
)
283 *pun
->errorp
= error
;
284 if (pun
->foundp
!= NULL
) {
289 return(PROC_RETURNED
);
301 setpriority(struct proc
*curp
, struct setpriority_args
*uap
, __unused
int32_t *retval
)
304 int found
= 0, error
= 0;
307 AUDIT_ARG(cmd
, uap
->which
);
308 AUDIT_ARG(owner
, uap
->who
, 0);
309 AUDIT_ARG(value32
, uap
->prio
);
311 /* would also test (uap->who < 0), but id_t is unsigned */
312 if (uap
->who
> 0x7fffffff)
315 switch (uap
->which
) {
321 p
= proc_find(uap
->who
);
326 error
= donice(curp
, p
, uap
->prio
);
333 struct pgrp
*pg
= PGRP_NULL
;
334 struct ppgrp_nice_args ppgrp
;
337 pg
= proc_pgrp(curp
);
338 } else if ((pg
= pgfind(uap
->who
)) == PGRP_NULL
)
342 ppgrp
.prio
= uap
->prio
;
343 ppgrp
.foundp
= &found
;
344 ppgrp
.errorp
= &error
;
346 /* PGRP_DROPREF drops the reference on process group */
347 pgrp_iterate(pg
, PGRP_DROPREF
, ppgrp_donice_callback
, (void *)&ppgrp
, NULL
, NULL
);
353 struct puser_nice_args punice
;
356 uap
->who
= kauth_cred_getuid(kauth_cred_get());
359 punice
.prio
= uap
->prio
;
360 punice
.who
= uap
->who
;
361 punice
.foundp
= &found
;
363 punice
.errorp
= &error
;
364 proc_iterate(PROC_ALLPROCLIST
, puser_donice_callback
, (void *)&punice
, NULL
, NULL
);
369 case PRIO_DARWIN_THREAD
: {
370 /* we currently only support the current thread */
374 error
= do_background_thread(curp
, uap
->prio
);
375 (void) do_background_socket(curp
, current_thread(), uap
->prio
);
380 case PRIO_DARWIN_PROCESS
: {
384 p
= proc_find(uap
->who
);
390 error
= do_background_task(p
, uap
->prio
);
391 (void) do_background_socket(p
, NULL
, uap
->prio
);
412 * mac_check_proc_sched:???
415 donice(struct proc
*curp
, struct proc
*chgp
, int n
)
419 kauth_cred_t my_cred
;
421 ucred
= kauth_cred_proc_ref(curp
);
422 my_cred
= kauth_cred_proc_ref(chgp
);
424 if (suser(ucred
, NULL
) && ucred
->cr_ruid
&&
425 kauth_cred_getuid(ucred
) != kauth_cred_getuid(my_cred
) &&
426 ucred
->cr_ruid
!= kauth_cred_getuid(my_cred
)) {
434 if (n
< chgp
->p_nice
&& suser(ucred
, &curp
->p_acflag
)) {
439 error
= mac_proc_check_sched(curp
, chgp
);
446 (void)resetpriority(chgp
);
448 kauth_cred_unref(&ucred
);
449 kauth_cred_unref(&my_cred
);
454 do_background_task(struct proc
*p
, int priority
)
457 task_category_policy_data_t info
;
459 /* set the max scheduling priority on the task */
460 if (priority
& PRIO_DARWIN_BG
) {
461 info
.role
= TASK_THROTTLE_APPLICATION
;
463 info
.role
= TASK_DEFAULT_APPLICATION
;
466 error
= task_policy_set(p
->task
,
467 TASK_CATEGORY_POLICY
,
468 (task_policy_t
) &info
,
469 TASK_CATEGORY_POLICY_COUNT
);
476 /* mark proc structure as backgrounded */
477 if (priority
& PRIO_DARWIN_BG
) {
478 p
->p_lflag
|= P_LBACKGROUND
;
480 p
->p_lflag
&= ~P_LBACKGROUND
;
483 /* set or reset the disk I/O priority */
484 p
->p_iopol_disk
= (priority
== PRIO_DARWIN_BG
?
485 IOPOL_THROTTLE
: IOPOL_DEFAULT
);
494 do_background_socket(struct proc
*p
, thread_t thread
, int priority
)
496 struct filedesc
*fdp
;
500 if (priority
& PRIO_DARWIN_BG
) {
502 * For PRIO_DARWIN_PROCESS (thread is NULL), simply mark
503 * the sockets with the background flag. There's nothing
504 * to do here for the PRIO_DARWIN_THREAD case.
506 if (thread
== NULL
) {
510 for (i
= 0; i
< fdp
->fd_nfiles
; i
++) {
511 struct socket
*sockp
;
513 fp
= fdp
->fd_ofiles
[i
];
514 if (fp
== NULL
|| (fdp
->fd_ofileflags
[i
] & UF_RESERVED
) != 0 ||
515 fp
->f_fglob
->fg_type
!= DTYPE_SOCKET
) {
518 sockp
= (struct socket
*)fp
->f_fglob
->fg_data
;
519 socket_set_traffic_mgt_flags(sockp
, TRAFFIC_MGT_SO_BACKGROUND
);
520 sockp
->so_background_thread
= NULL
;
526 u_int32_t traffic_mgt
;
528 * See comments on do_background_thread(). Deregulate network
529 * traffic only for setpriority(PRIO_DARWIN_THREAD).
531 traffic_mgt
= (thread
== NULL
) ? 0 : TRAFFIC_MGT_SO_BG_REGULATE
;
533 /* disable networking IO throttle.
534 * NOTE - It is a known limitation of the current design that we
535 * could potentially clear TRAFFIC_MGT_SO_BACKGROUND bit for
536 * sockets created by other threads within this process.
540 for ( i
= 0; i
< fdp
->fd_nfiles
; i
++ ) {
541 struct socket
*sockp
;
543 fp
= fdp
->fd_ofiles
[ i
];
544 if ( fp
== NULL
|| (fdp
->fd_ofileflags
[ i
] & UF_RESERVED
) != 0 ||
545 fp
->f_fglob
->fg_type
!= DTYPE_SOCKET
) {
548 sockp
= (struct socket
*)fp
->f_fglob
->fg_data
;
549 /* skip if only clearing this thread's sockets */
550 if ((thread
) && (sockp
->so_background_thread
!= thread
)) {
553 socket_clear_traffic_mgt_flags(sockp
, TRAFFIC_MGT_SO_BACKGROUND
| traffic_mgt
);
554 sockp
->so_background_thread
= NULL
;
562 * do_background_thread
564 * XXX - todo - does this need a MACF hook?
566 * NOTE: To maintain binary compatibility with PRIO_DARWIN_THREAD with respect
567 * to network traffic management, UT_BACKGROUND_TRAFFIC_MGT is set/cleared
568 * along with UT_BACKGROUND flag, as the latter alone no longer implies
569 * any form of traffic regulation (it simply means that the thread is
570 * background.) With PRIO_DARWIN_PROCESS, any form of network traffic
571 * management must be explicitly requested via whatever means appropriate,
572 * and only TRAFFIC_MGT_SO_BACKGROUND is set via do_background_socket().
575 do_background_thread(struct proc
*curp __unused
, int priority
)
579 thread_precedence_policy_data_t policy
;
581 thread
= current_thread();
582 ut
= get_bsdthread_info(thread
);
584 if ( (priority
& PRIO_DARWIN_BG
) == 0 ) {
585 /* turn off backgrounding of thread */
586 if ( (ut
->uu_flag
& UT_BACKGROUND
) == 0 ) {
592 * Clear background bit in thread and disable disk IO
593 * throttle as well as network traffic management.
594 * The corresponding socket flags for sockets created by
595 * this thread will be cleared in do_background_socket().
597 ut
->uu_flag
&= ~(UT_BACKGROUND
| UT_BACKGROUND_TRAFFIC_MGT
);
598 ut
->uu_iopol_disk
= IOPOL_NORMAL
;
600 /* reset thread priority (we did not save previous value) */
601 policy
.importance
= 0;
602 thread_policy_set( thread
, THREAD_PRECEDENCE_POLICY
,
603 (thread_policy_t
)&policy
,
604 THREAD_PRECEDENCE_POLICY_COUNT
);
608 /* background this thread */
609 if ( (ut
->uu_flag
& UT_BACKGROUND
) != 0 ) {
610 /* already backgrounded */
615 * Tag thread as background and throttle disk IO, as well
616 * as regulate network traffic. Future sockets created
617 * by this thread will have their corresponding socket
618 * flags set at socket create time.
620 ut
->uu_flag
|= (UT_BACKGROUND
| UT_BACKGROUND_TRAFFIC_MGT
);
621 ut
->uu_iopol_disk
= IOPOL_THROTTLE
;
623 policy
.importance
= INT_MIN
;
624 thread_policy_set( thread
, THREAD_PRECEDENCE_POLICY
,
625 (thread_policy_t
)&policy
,
626 THREAD_PRECEDENCE_POLICY_COUNT
);
628 /* Throttling of networking IO happens in the socket() syscall.
629 * If UT_{BACKGROUND,BACKGROUND_TRAFFIC_MGT} is set in the current
630 * thread then TRAFFIC_MGT_SO_{BACKGROUND,BG_REGULATE} is set.
631 * Existing sockets are taken care of by do_background_socket().
637 * If the thread or its proc has been put into the background
638 * with setpriority(PRIO_DARWIN_{THREAD,PROCESS}, *, PRIO_DARWIN_BG),
639 * report that status.
641 * Returns: PRIO_DARWIN_BG if background
645 uthread_get_background_state(uthread_t uth
)
647 proc_t p
= uth
->uu_proc
;
648 if (p
&& (p
->p_lflag
& P_LBACKGROUND
))
649 return PRIO_DARWIN_BG
;
651 if (uth
->uu_flag
& UT_BACKGROUND
)
652 return PRIO_DARWIN_BG
;
664 setrlimit(struct proc
*p
, struct setrlimit_args
*uap
, __unused
int32_t *retval
)
669 if ((error
= copyin(uap
->rlp
, (caddr_t
)&alim
,
670 sizeof (struct rlimit
))))
673 return (dosetrlimit(p
, uap
->which
, &alim
));
679 * ENOMEM Cannot copy limit structure
682 * Notes: EINVAL is returned both for invalid arguments, and in the
683 * case that the current usage (e.g. RLIMIT_STACK) is already
684 * in excess of the requested limit.
687 dosetrlimit(struct proc
*p
, u_int which
, struct rlimit
*limp
)
689 struct rlimit
*alimp
;
692 int posix
= (which
& _RLIMIT_POSIX_FLAG
) ? 1 : 0;
694 /* Mask out POSIX flag, saved above */
695 which
&= ~_RLIMIT_POSIX_FLAG
;
697 if (which
>= RLIM_NLIMITS
)
700 alimp
= &p
->p_rlimit
[which
];
701 if (limp
->rlim_cur
> limp
->rlim_max
)
704 if (limp
->rlim_cur
> alimp
->rlim_max
||
705 limp
->rlim_max
> alimp
->rlim_max
)
706 if ((error
= suser(kauth_cred_get(), &p
->p_acflag
))) {
712 if ((error
= proc_limitreplace(p
)) != 0) {
713 proc_limitunblock(p
);
717 alimp
= &p
->p_rlimit
[which
];
722 if (limp
->rlim_cur
== RLIM_INFINITY
) {
723 task_vtimer_clear(p
->task
, TASK_VTIMER_RLIM
);
724 timerclear(&p
->p_rlim_cpu
);
727 task_absolutetime_info_data_t tinfo
;
728 mach_msg_type_number_t count
;
729 struct timeval ttv
, tv
;
731 clock_usec_t tv_usec
;
733 count
= TASK_ABSOLUTETIME_INFO_COUNT
;
734 task_info(p
->task
, TASK_ABSOLUTETIME_INFO
,
735 (task_info_t
)&tinfo
, &count
);
736 absolutetime_to_microtime(tinfo
.total_user
+ tinfo
.total_system
,
739 ttv
.tv_usec
= tv_usec
;
741 tv
.tv_sec
= (limp
->rlim_cur
> __INT_MAX__
? __INT_MAX__
: limp
->rlim_cur
);
743 timersub(&tv
, &ttv
, &p
->p_rlim_cpu
);
746 if (timercmp(&p
->p_rlim_cpu
, &tv
, >))
747 task_vtimer_set(p
->task
, TASK_VTIMER_RLIM
);
749 task_vtimer_clear(p
->task
, TASK_VTIMER_RLIM
);
751 timerclear(&p
->p_rlim_cpu
);
759 if (limp
->rlim_cur
> maxdmap
)
760 limp
->rlim_cur
= maxdmap
;
761 if (limp
->rlim_max
> maxdmap
)
762 limp
->rlim_max
= maxdmap
;
766 /* Disallow illegal stack size instead of clipping */
767 if (limp
->rlim_cur
> maxsmap
||
768 limp
->rlim_max
> maxsmap
) {
775 * 4797860 - workaround poorly written installers by
776 * doing previous implementation (< 10.5) when caller
777 * is non-POSIX conforming.
779 if (limp
->rlim_cur
> maxsmap
)
780 limp
->rlim_cur
= maxsmap
;
781 if (limp
->rlim_max
> maxsmap
)
782 limp
->rlim_max
= maxsmap
;
787 * Stack is allocated to the max at exec time with only
788 * "rlim_cur" bytes accessible. If stack limit is going
789 * up make more accessible, if going down make inaccessible.
791 if (limp
->rlim_cur
> alimp
->rlim_cur
) {
796 size
= round_page_64(limp
->rlim_cur
);
797 size
-= round_page_64(alimp
->rlim_cur
);
800 /* go to top of current stack */
801 addr
= p
->user_stack
+ round_page_64(alimp
->rlim_cur
);
802 #else /* STACK_GROWTH_UP */
803 addr
= p
->user_stack
- round_page_64(limp
->rlim_cur
);
804 #endif /* STACK_GROWTH_UP */
805 kr
= mach_vm_protect(current_map(),
807 FALSE
, VM_PROT_DEFAULT
);
808 if (kr
!= KERN_SUCCESS
) {
812 } else if (limp
->rlim_cur
< alimp
->rlim_cur
) {
820 * First check if new stack limit would agree
821 * with current stack usage.
822 * Get the current thread's stack pointer...
824 cur_sp
= thread_adjuserstack(current_thread(),
827 if (cur_sp
>= p
->user_stack
&&
828 cur_sp
< (p
->user_stack
+
829 round_page_64(alimp
->rlim_cur
))) {
830 /* current stack pointer is in main stack */
831 if (cur_sp
>= (p
->user_stack
+
832 round_page_64(limp
->rlim_cur
))) {
834 * New limit would cause
835 * current usage to be invalid:
842 /* not on the main stack: reject */
847 #else /* STACK_GROWTH_UP */
848 if (cur_sp
<= p
->user_stack
&&
849 cur_sp
> (p
->user_stack
-
850 round_page_64(alimp
->rlim_cur
))) {
851 /* stack pointer is in main stack */
852 if (cur_sp
<= (p
->user_stack
-
853 round_page_64(limp
->rlim_cur
))) {
855 * New limit would cause
856 * current usage to be invalid:
863 /* not on the main stack: reject */
867 #endif /* STACK_GROWTH_UP */
869 size
= round_page_64(alimp
->rlim_cur
);
870 size
-= round_page_64(limp
->rlim_cur
);
873 addr
= p
->user_stack
+ round_page_64(limp
->rlim_cur
);
874 #else /* STACK_GROWTH_UP */
875 addr
= p
->user_stack
- round_page_64(alimp
->rlim_cur
);
876 #endif /* STACK_GROWTH_UP */
878 kr
= mach_vm_protect(current_map(),
880 FALSE
, VM_PROT_NONE
);
881 if (kr
!= KERN_SUCCESS
) {
892 * Only root can set the maxfiles limits, as it is a
893 * systemwide resource. If we are expecting POSIX behavior,
894 * instead of clamping the value, return EINVAL. We do this
895 * because historically, people have been able to attempt to
896 * set RLIM_INFINITY to get "whatever the maximum is".
899 if (limp
->rlim_cur
!= alimp
->rlim_cur
&&
900 limp
->rlim_cur
> (rlim_t
)maxfiles
) {
905 limp
->rlim_cur
= maxfiles
;
907 if (limp
->rlim_max
!= alimp
->rlim_max
&&
908 limp
->rlim_max
> (rlim_t
)maxfiles
)
909 limp
->rlim_max
= maxfiles
;
912 if (limp
->rlim_cur
!= alimp
->rlim_cur
&&
913 limp
->rlim_cur
> (rlim_t
)maxfilesperproc
) {
918 limp
->rlim_cur
= maxfilesperproc
;
920 if (limp
->rlim_max
!= alimp
->rlim_max
&&
921 limp
->rlim_max
> (rlim_t
)maxfilesperproc
)
922 limp
->rlim_max
= maxfilesperproc
;
928 * Only root can set the maxproc limits, as it is a
929 * systemwide resource; all others are limited to
930 * maxprocperuid (presumably less than maxproc).
933 if (limp
->rlim_cur
> (rlim_t
)maxproc
)
934 limp
->rlim_cur
= maxproc
;
935 if (limp
->rlim_max
> (rlim_t
)maxproc
)
936 limp
->rlim_max
= maxproc
;
939 if (limp
->rlim_cur
> (rlim_t
)maxprocperuid
)
940 limp
->rlim_cur
= maxprocperuid
;
941 if (limp
->rlim_max
> (rlim_t
)maxprocperuid
)
942 limp
->rlim_max
= maxprocperuid
;
948 * Tell the Mach VM layer about the new limit value.
951 vm_map_set_user_wire_limit(current_map(), limp
->rlim_cur
);
960 proc_limitunblock(p
);
966 getrlimit(struct proc
*p
, struct getrlimit_args
*uap
, __unused
int32_t *retval
)
971 * Take out flag now in case we need to use it to trigger variant
974 uap
->which
&= ~_RLIMIT_POSIX_FLAG
;
976 if (uap
->which
>= RLIM_NLIMITS
)
978 proc_limitget(p
, uap
->which
, &lim
);
979 return (copyout((caddr_t
)&lim
,
980 uap
->rlp
, sizeof (struct rlimit
)));
984 * Transform the running time and tick information in proc p into user,
985 * system, and interrupt time usage.
987 /* No lock on proc is held for this.. */
989 calcru(struct proc
*p
, struct timeval
*up
, struct timeval
*sp
, struct timeval
*ip
)
1000 task_basic_info_32_data_t tinfo
;
1001 task_thread_times_info_data_t ttimesinfo
;
1002 task_events_info_data_t teventsinfo
;
1003 mach_msg_type_number_t task_info_count
, task_ttimes_count
;
1004 mach_msg_type_number_t task_events_count
;
1005 struct timeval ut
,st
;
1007 task_info_count
= TASK_BASIC_INFO_32_COUNT
;
1008 task_info(task
, TASK_BASIC2_INFO_32
,
1009 (task_info_t
)&tinfo
, &task_info_count
);
1010 ut
.tv_sec
= tinfo
.user_time
.seconds
;
1011 ut
.tv_usec
= tinfo
.user_time
.microseconds
;
1012 st
.tv_sec
= tinfo
.system_time
.seconds
;
1013 st
.tv_usec
= tinfo
.system_time
.microseconds
;
1014 timeradd(&ut
, up
, up
);
1015 timeradd(&st
, sp
, sp
);
1017 task_ttimes_count
= TASK_THREAD_TIMES_INFO_COUNT
;
1018 task_info(task
, TASK_THREAD_TIMES_INFO
,
1019 (task_info_t
)&ttimesinfo
, &task_ttimes_count
);
1021 ut
.tv_sec
= ttimesinfo
.user_time
.seconds
;
1022 ut
.tv_usec
= ttimesinfo
.user_time
.microseconds
;
1023 st
.tv_sec
= ttimesinfo
.system_time
.seconds
;
1024 st
.tv_usec
= ttimesinfo
.system_time
.microseconds
;
1025 timeradd(&ut
, up
, up
);
1026 timeradd(&st
, sp
, sp
);
1028 task_events_count
= TASK_EVENTS_INFO_COUNT
;
1029 task_info(task
, TASK_EVENTS_INFO
,
1030 (task_info_t
)&teventsinfo
, &task_events_count
);
1033 * No need to lock "p": this does not need to be
1034 * completely consistent, right ?
1036 p
->p_stats
->p_ru
.ru_minflt
= (teventsinfo
.faults
-
1037 teventsinfo
.pageins
);
1038 p
->p_stats
->p_ru
.ru_majflt
= teventsinfo
.pageins
;
1039 p
->p_stats
->p_ru
.ru_nivcsw
= (teventsinfo
.csw
-
1040 p
->p_stats
->p_ru
.ru_nvcsw
);
1041 if (p
->p_stats
->p_ru
.ru_nivcsw
< 0)
1042 p
->p_stats
->p_ru
.ru_nivcsw
= 0;
1044 p
->p_stats
->p_ru
.ru_maxrss
= tinfo
.resident_size
;
1048 __private_extern__
void munge_user64_rusage(struct rusage
*a_rusage_p
, struct user64_rusage
*a_user_rusage_p
);
1049 __private_extern__
void munge_user32_rusage(struct rusage
*a_rusage_p
, struct user32_rusage
*a_user_rusage_p
);
1053 getrusage(struct proc
*p
, struct getrusage_args
*uap
, __unused
int32_t *retval
)
1055 struct rusage
*rup
, rubuf
;
1056 struct user64_rusage rubuf64
;
1057 struct user32_rusage rubuf32
;
1058 size_t retsize
= sizeof(rubuf
); /* default: 32 bits */
1059 caddr_t retbuf
= (caddr_t
)&rubuf
; /* default: 32 bits */
1060 struct timeval utime
;
1061 struct timeval stime
;
1066 calcru(p
, &utime
, &stime
, NULL
);
1068 rup
= &p
->p_stats
->p_ru
;
1069 rup
->ru_utime
= utime
;
1070 rup
->ru_stime
= stime
;
1077 case RUSAGE_CHILDREN
:
1079 rup
= &p
->p_stats
->p_cru
;
1087 if (IS_64BIT_PROCESS(p
)) {
1088 retsize
= sizeof(rubuf64
);
1089 retbuf
= (caddr_t
)&rubuf64
;
1090 munge_user64_rusage(&rubuf
, &rubuf64
);
1092 retsize
= sizeof(rubuf32
);
1093 retbuf
= (caddr_t
)&rubuf32
;
1094 munge_user32_rusage(&rubuf
, &rubuf32
);
1097 return (copyout(retbuf
, uap
->rusage
, retsize
));
1101 ruadd(struct rusage
*ru
, struct rusage
*ru2
)
1106 timeradd(&ru
->ru_utime
, &ru2
->ru_utime
, &ru
->ru_utime
);
1107 timeradd(&ru
->ru_stime
, &ru2
->ru_stime
, &ru
->ru_stime
);
1108 if (ru
->ru_maxrss
< ru2
->ru_maxrss
)
1109 ru
->ru_maxrss
= ru2
->ru_maxrss
;
1110 ip
= &ru
->ru_first
; ip2
= &ru2
->ru_first
;
1111 for (i
= &ru
->ru_last
- &ru
->ru_first
; i
>= 0; i
--)
1116 proc_limitget(proc_t p
, int which
, struct rlimit
* limp
)
1119 limp
->rlim_cur
= p
->p_rlimit
[which
].rlim_cur
;
1120 limp
->rlim_max
= p
->p_rlimit
[which
].rlim_max
;
1126 proc_limitdrop(proc_t p
, int exiting
)
1128 struct plimit
* freelim
= NULL
;
1129 struct plimit
* freeoldlim
= NULL
;
1133 if (--p
->p_limit
->pl_refcnt
== 0) {
1134 freelim
= p
->p_limit
;
1137 if ((exiting
!= 0) && (p
->p_olimit
!= NULL
) && (--p
->p_olimit
->pl_refcnt
== 0)) {
1138 freeoldlim
= p
->p_olimit
;
1143 if (freelim
!= NULL
)
1144 FREE_ZONE(freelim
, sizeof *p
->p_limit
, M_PLIMIT
);
1145 if (freeoldlim
!= NULL
)
1146 FREE_ZONE(freeoldlim
, sizeof *p
->p_olimit
, M_PLIMIT
);
1151 proc_limitfork(proc_t parent
, proc_t child
)
1154 child
->p_limit
= parent
->p_limit
;
1155 child
->p_limit
->pl_refcnt
++;
1156 child
->p_olimit
= NULL
;
1161 proc_limitblock(proc_t p
)
1164 while (p
->p_lflag
& P_LLIMCHANGE
) {
1165 p
->p_lflag
|= P_LLIMWAIT
;
1166 msleep(&p
->p_olimit
, &p
->p_mlock
, 0, "proc_limitblock", NULL
);
1168 p
->p_lflag
|= P_LLIMCHANGE
;
1175 proc_limitunblock(proc_t p
)
1178 p
->p_lflag
&= ~P_LLIMCHANGE
;
1179 if (p
->p_lflag
& P_LLIMWAIT
) {
1180 p
->p_lflag
&= ~P_LLIMWAIT
;
1181 wakeup(&p
->p_olimit
);
1186 /* This is called behind the serialization provided by proc_limitblock/proc_limitunblock */
1188 proc_limitreplace(proc_t p
)
1190 struct plimit
*copy
;
1195 if (p
->p_limit
->pl_refcnt
== 1) {
1202 MALLOC_ZONE(copy
, struct plimit
*,
1203 sizeof(struct plimit
), M_PLIMIT
, M_WAITOK
);
1209 bcopy(p
->p_limit
->pl_rlimit
, copy
->pl_rlimit
,
1210 sizeof(struct rlimit
) * RLIM_NLIMITS
);
1211 copy
->pl_refcnt
= 1;
1212 /* hang on to reference to old till process exits */
1213 p
->p_olimit
= p
->p_limit
;
1224 * Description: System call MUX for use in manipulating I/O policy attributes of the current process or thread
1226 * Parameters: cmd Policy command
1227 * arg Pointer to policy arguments
1229 * Returns: 0 Success
1230 * EINVAL Invalid command or invalid policy arguments
1234 iopolicysys(__unused
struct proc
*p
, __unused
struct iopolicysys_args
*uap
, __unused
int32_t *retval
)
1237 thread_t thread
= THREAD_NULL
;
1239 struct uthread
*ut
= NULL
;
1240 struct _iopol_param_t iop_param
;
1242 if ((error
= copyin(uap
->arg
, &iop_param
, sizeof(iop_param
))) != 0)
1245 if (iop_param
.iop_iotype
!= IOPOL_TYPE_DISK
) {
1250 switch (iop_param
.iop_scope
) {
1251 case IOPOL_SCOPE_PROCESS
:
1252 policy
= &p
->p_iopol_disk
;
1254 case IOPOL_SCOPE_THREAD
:
1255 thread
= current_thread();
1256 ut
= get_bsdthread_info(thread
);
1257 policy
= &ut
->uu_iopol_disk
;
1266 switch (iop_param
.iop_policy
) {
1269 case IOPOL_THROTTLE
:
1272 *policy
= iop_param
.iop_policy
;
1284 case IOPOL_THROTTLE
:
1286 iop_param
.iop_policy
= *policy
;
1288 default: // in-kernel
1289 // this should never happen
1290 printf("%s: unknown I/O policy %d\n", __func__
, *policy
);
1291 // restore to default value
1292 *policy
= IOPOL_DEFAULT
;
1293 iop_param
.iop_policy
= *policy
;
1296 error
= copyout((caddr_t
)&iop_param
, uap
->arg
, sizeof(iop_param
));
1299 error
= EINVAL
; // unknown command
1309 boolean_t
thread_is_io_throttled(void);
1312 thread_is_io_throttled(void) {
1317 ut
= get_bsdthread_info(current_thread());
1320 policy
= current_proc()->p_iopol_disk
;
1322 if (ut
->uu_iopol_disk
!= IOPOL_DEFAULT
)
1323 policy
= ut
->uu_iopol_disk
;
1325 if (policy
== IOPOL_THROTTLE
)