2 * Copyright (c) 2000-2007 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
32 * Mach Operating System
33 * Copyright (c) 1991,1990,1989,1988,1987 Carnegie Mellon University
34 * All Rights Reserved.
36 * Permission to use, copy, modify and distribute this software and its
37 * documentation is hereby granted, provided that both the copyright
38 * notice and this permission notice appear in all copies of the
39 * software, derivative works or modified versions, and any portions
40 * thereof, and that both notices appear in supporting documentation.
42 * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
43 * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND FOR
44 * ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
46 * Carnegie Mellon requests users of this software to return to
48 * Software Distribution Coordinator or Software.Distribution@CS.CMU.EDU
49 * School of Computer Science
50 * Carnegie Mellon University
51 * Pittsburgh PA 15213-3890
53 * any improvements or extensions that they make and grant Carnegie Mellon
54 * the rights to redistribute these changes.
56 #include <mach_ldebug.h>
59 #include <mach/kern_return.h>
60 #include <mach/mach_host_server.h>
61 #include <mach_debug/lockgroup_info.h>
63 #include <kern/locks.h>
64 #include <kern/misc_protos.h>
65 #include <kern/kalloc.h>
66 #include <kern/thread.h>
67 #include <kern/processor.h>
68 #include <kern/sched_prim.h>
69 #include <kern/debug.h>
73 #include <sys/kdebug.h>
77 * We need only enough declarations from the BSD-side to be able to
78 * test if our probe is active, and to call __dtrace_probe(). Setting
79 * NEED_DTRACE_DEFS gets a local copy of those definitions pulled in.
81 #define NEED_DTRACE_DEFS
82 #include <../bsd/sys/lockstat.h>
85 #define LCK_MTX_SLEEP_CODE 0
86 #define LCK_MTX_SLEEP_DEADLINE_CODE 1
87 #define LCK_MTX_LCK_WAIT_CODE 2
88 #define LCK_MTX_UNLCK_WAKEUP_CODE 3
91 static queue_head_t lck_grp_queue
;
92 static unsigned int lck_grp_cnt
;
94 decl_lck_mtx_data(static,lck_grp_lock
)
95 static lck_mtx_ext_t lck_grp_lock_ext
;
97 lck_grp_attr_t LockDefaultGroupAttr
;
98 lck_grp_t LockCompatGroup
;
99 lck_attr_t LockDefaultLckAttr
;
102 * Routine: lck_mod_init
110 * Obtain "lcks" options:this currently controls lock statistics
112 if (!PE_parse_boot_argn("lcks", &LcksOpts
, sizeof (LcksOpts
)))
115 queue_init(&lck_grp_queue
);
118 * Need to bootstrap the LockCompatGroup instead of calling lck_grp_init() here. This avoids
119 * grabbing the lck_grp_lock before it is initialized.
122 bzero(&LockCompatGroup
, sizeof(lck_grp_t
));
123 (void) strncpy(LockCompatGroup
.lck_grp_name
, "Compatibility APIs", LCK_GRP_MAX_NAME
);
125 if (LcksOpts
& enaLkStat
)
126 LockCompatGroup
.lck_grp_attr
= LCK_GRP_ATTR_STAT
;
128 LockCompatGroup
.lck_grp_attr
= LCK_ATTR_NONE
;
130 LockCompatGroup
.lck_grp_refcnt
= 1;
132 enqueue_tail(&lck_grp_queue
, (queue_entry_t
)&LockCompatGroup
);
135 lck_grp_attr_setdefault(&LockDefaultGroupAttr
);
136 lck_attr_setdefault(&LockDefaultLckAttr
);
138 lck_mtx_init_ext(&lck_grp_lock
, &lck_grp_lock_ext
, &LockCompatGroup
, &LockDefaultLckAttr
);
143 * Routine: lck_grp_attr_alloc_init
147 lck_grp_attr_alloc_init(
150 lck_grp_attr_t
*attr
;
152 if ((attr
= (lck_grp_attr_t
*)kalloc(sizeof(lck_grp_attr_t
))) != 0)
153 lck_grp_attr_setdefault(attr
);
160 * Routine: lck_grp_attr_setdefault
164 lck_grp_attr_setdefault(
165 lck_grp_attr_t
*attr
)
167 if (LcksOpts
& enaLkStat
)
168 attr
->grp_attr_val
= LCK_GRP_ATTR_STAT
;
170 attr
->grp_attr_val
= 0;
175 * Routine: lck_grp_attr_setstat
179 lck_grp_attr_setstat(
180 lck_grp_attr_t
*attr
)
182 (void)hw_atomic_or(&attr
->grp_attr_val
, LCK_GRP_ATTR_STAT
);
187 * Routine: lck_grp_attr_free
192 lck_grp_attr_t
*attr
)
194 kfree(attr
, sizeof(lck_grp_attr_t
));
199 * Routine: lck_grp_alloc_init
204 const char* grp_name
,
205 lck_grp_attr_t
*attr
)
209 if ((grp
= (lck_grp_t
*)kalloc(sizeof(lck_grp_t
))) != 0)
210 lck_grp_init(grp
, grp_name
, attr
);
217 * Routine: lck_grp_init
223 const char* grp_name
,
224 lck_grp_attr_t
*attr
)
226 bzero((void *)grp
, sizeof(lck_grp_t
));
228 (void) strncpy(grp
->lck_grp_name
, grp_name
, LCK_GRP_MAX_NAME
);
230 if (attr
!= LCK_GRP_ATTR_NULL
)
231 grp
->lck_grp_attr
= attr
->grp_attr_val
;
232 else if (LcksOpts
& enaLkStat
)
233 grp
->lck_grp_attr
= LCK_GRP_ATTR_STAT
;
235 grp
->lck_grp_attr
= LCK_ATTR_NONE
;
237 grp
->lck_grp_refcnt
= 1;
239 lck_mtx_lock(&lck_grp_lock
);
240 enqueue_tail(&lck_grp_queue
, (queue_entry_t
)grp
);
242 lck_mtx_unlock(&lck_grp_lock
);
248 * Routine: lck_grp_free
255 lck_mtx_lock(&lck_grp_lock
);
257 (void)remque((queue_entry_t
)grp
);
258 lck_mtx_unlock(&lck_grp_lock
);
259 lck_grp_deallocate(grp
);
264 * Routine: lck_grp_reference
271 (void)hw_atomic_add(&grp
->lck_grp_refcnt
, 1);
276 * Routine: lck_grp_deallocate
283 if (hw_atomic_sub(&grp
->lck_grp_refcnt
, 1) == 0)
284 kfree(grp
, sizeof(lck_grp_t
));
288 * Routine: lck_grp_lckcnt_incr
296 unsigned int *lckcnt
;
300 lckcnt
= &grp
->lck_grp_spincnt
;
303 lckcnt
= &grp
->lck_grp_mtxcnt
;
306 lckcnt
= &grp
->lck_grp_rwcnt
;
309 return panic("lck_grp_lckcnt_incr(): invalid lock type: %d\n", lck_type
);
312 (void)hw_atomic_add(lckcnt
, 1);
316 * Routine: lck_grp_lckcnt_decr
324 unsigned int *lckcnt
;
328 lckcnt
= &grp
->lck_grp_spincnt
;
331 lckcnt
= &grp
->lck_grp_mtxcnt
;
334 lckcnt
= &grp
->lck_grp_rwcnt
;
337 return panic("lck_grp_lckcnt_decr(): invalid lock type: %d\n", lck_type
);
340 (void)hw_atomic_sub(lckcnt
, 1);
344 * Routine: lck_attr_alloc_init
353 if ((attr
= (lck_attr_t
*)kalloc(sizeof(lck_attr_t
))) != 0)
354 lck_attr_setdefault(attr
);
361 * Routine: lck_attr_setdefault
368 #if __i386__ || __x86_64__
370 if (LcksOpts
& enaLkDeb
)
371 attr
->lck_attr_val
= LCK_ATTR_DEBUG
;
373 attr
->lck_attr_val
= LCK_ATTR_NONE
;
375 attr
->lck_attr_val
= LCK_ATTR_DEBUG
;
378 #error Unknown architecture.
384 * Routine: lck_attr_setdebug
390 (void)hw_atomic_or(&attr
->lck_attr_val
, LCK_ATTR_DEBUG
);
394 * Routine: lck_attr_setdebug
400 (void)hw_atomic_and(&attr
->lck_attr_val
, ~LCK_ATTR_DEBUG
);
405 * Routine: lck_attr_rw_shared_priority
408 lck_attr_rw_shared_priority(
411 (void)hw_atomic_or(&attr
->lck_attr_val
, LCK_ATTR_RW_SHARED_PRIORITY
);
416 * Routine: lck_attr_free
422 kfree(attr
, sizeof(lck_attr_t
));
427 * Routine: lck_spin_sleep
432 lck_sleep_action_t lck_sleep_action
,
434 wait_interrupt_t interruptible
)
438 if ((lck_sleep_action
& ~LCK_SLEEP_MASK
) != 0)
439 panic("Invalid lock sleep action %x\n", lck_sleep_action
);
441 res
= assert_wait(event
, interruptible
);
442 if (res
== THREAD_WAITING
) {
443 lck_spin_unlock(lck
);
444 res
= thread_block(THREAD_CONTINUE_NULL
);
445 if (!(lck_sleep_action
& LCK_SLEEP_UNLOCK
))
449 if (lck_sleep_action
& LCK_SLEEP_UNLOCK
)
450 lck_spin_unlock(lck
);
457 * Routine: lck_spin_sleep_deadline
460 lck_spin_sleep_deadline(
462 lck_sleep_action_t lck_sleep_action
,
464 wait_interrupt_t interruptible
,
469 if ((lck_sleep_action
& ~LCK_SLEEP_MASK
) != 0)
470 panic("Invalid lock sleep action %x\n", lck_sleep_action
);
472 res
= assert_wait_deadline(event
, interruptible
, deadline
);
473 if (res
== THREAD_WAITING
) {
474 lck_spin_unlock(lck
);
475 res
= thread_block(THREAD_CONTINUE_NULL
);
476 if (!(lck_sleep_action
& LCK_SLEEP_UNLOCK
))
480 if (lck_sleep_action
& LCK_SLEEP_UNLOCK
)
481 lck_spin_unlock(lck
);
488 * Routine: lck_mtx_sleep
493 lck_sleep_action_t lck_sleep_action
,
495 wait_interrupt_t interruptible
)
498 thread_t thread
= current_thread();
500 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_SLEEP_CODE
) | DBG_FUNC_START
,
501 (int)lck
, (int)lck_sleep_action
, (int)event
, (int)interruptible
, 0);
503 if ((lck_sleep_action
& ~LCK_SLEEP_MASK
) != 0)
504 panic("Invalid lock sleep action %x\n", lck_sleep_action
);
506 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
508 * We overload the RW lock promotion to give us a priority ceiling
509 * during the time that this thread is asleep, so that when it
510 * is re-awakened (and not yet contending on the mutex), it is
511 * runnable at a reasonably high priority.
513 thread
->rwlock_count
++;
516 res
= assert_wait(event
, interruptible
);
517 if (res
== THREAD_WAITING
) {
519 res
= thread_block(THREAD_CONTINUE_NULL
);
520 if (!(lck_sleep_action
& LCK_SLEEP_UNLOCK
)) {
521 if ((lck_sleep_action
& LCK_SLEEP_SPIN
))
522 lck_mtx_lock_spin(lck
);
528 if (lck_sleep_action
& LCK_SLEEP_UNLOCK
)
531 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
532 if ((thread
->rwlock_count
-- == 1 /* field now 0 */) && (thread
->sched_flags
& TH_SFLAG_RW_PROMOTED
)) {
533 /* sched_flags checked without lock, but will be rechecked while clearing */
534 lck_rw_clear_promotion(thread
);
538 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_SLEEP_CODE
) | DBG_FUNC_END
, (int)res
, 0, 0, 0, 0);
545 * Routine: lck_mtx_sleep_deadline
548 lck_mtx_sleep_deadline(
550 lck_sleep_action_t lck_sleep_action
,
552 wait_interrupt_t interruptible
,
556 thread_t thread
= current_thread();
558 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_SLEEP_DEADLINE_CODE
) | DBG_FUNC_START
,
559 (int)lck
, (int)lck_sleep_action
, (int)event
, (int)interruptible
, 0);
561 if ((lck_sleep_action
& ~LCK_SLEEP_MASK
) != 0)
562 panic("Invalid lock sleep action %x\n", lck_sleep_action
);
564 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
566 * See lck_mtx_sleep().
568 thread
->rwlock_count
++;
571 res
= assert_wait_deadline(event
, interruptible
, deadline
);
572 if (res
== THREAD_WAITING
) {
574 res
= thread_block(THREAD_CONTINUE_NULL
);
575 if (!(lck_sleep_action
& LCK_SLEEP_UNLOCK
)) {
576 if ((lck_sleep_action
& LCK_SLEEP_SPIN
))
577 lck_mtx_lock_spin(lck
);
583 if (lck_sleep_action
& LCK_SLEEP_UNLOCK
)
586 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
587 if ((thread
->rwlock_count
-- == 1 /* field now 0 */) && (thread
->sched_flags
& TH_SFLAG_RW_PROMOTED
)) {
588 /* sched_flags checked without lock, but will be rechecked while clearing */
589 lck_rw_clear_promotion(thread
);
593 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_SLEEP_DEADLINE_CODE
) | DBG_FUNC_END
, (int)res
, 0, 0, 0, 0);
599 * Routine: lck_mtx_lock_wait
601 * Invoked in order to wait on contention.
603 * Called with the interlock locked and
604 * returns it unlocked.
611 thread_t self
= current_thread();
614 spl_t s
= splsched();
616 uint64_t sleep_start
= 0;
618 if (lockstat_probemap
[LS_LCK_MTX_LOCK_BLOCK
] || lockstat_probemap
[LS_LCK_MTX_EXT_LOCK_BLOCK
]) {
619 sleep_start
= mach_absolute_time();
623 if (lck
->lck_mtx_tag
!= LCK_MTX_TAG_INDIRECT
)
626 mutex
= &lck
->lck_mtx_ptr
->lck_mtx
;
628 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_LCK_WAIT_CODE
) | DBG_FUNC_START
, (int)lck
, (int)holder
, 0, 0, 0);
630 priority
= self
->sched_pri
;
631 if (priority
< self
->priority
)
632 priority
= self
->priority
;
633 if (priority
< BASEPRI_DEFAULT
)
634 priority
= BASEPRI_DEFAULT
;
636 /* Do not promote past promotion ceiling */
637 priority
= MIN(priority
, MAXPRI_PROMOTE
);
640 if (mutex
->lck_mtx_pri
== 0)
641 holder
->promotions
++;
642 holder
->sched_flags
|= TH_SFLAG_PROMOTED
;
643 if ( mutex
->lck_mtx_pri
< priority
&&
644 holder
->sched_pri
< priority
) {
645 KERNEL_DEBUG_CONSTANT(
646 MACHDBG_CODE(DBG_MACH_SCHED
,MACH_PROMOTE
) | DBG_FUNC_NONE
,
647 holder
->sched_pri
, priority
, holder
, lck
, 0);
648 set_sched_pri(holder
, priority
);
650 thread_unlock(holder
);
653 if (mutex
->lck_mtx_pri
< priority
)
654 mutex
->lck_mtx_pri
= priority
;
655 if (self
->pending_promoter
[self
->pending_promoter_index
] == NULL
) {
656 self
->pending_promoter
[self
->pending_promoter_index
] = mutex
;
657 mutex
->lck_mtx_waiters
++;
660 if (self
->pending_promoter
[self
->pending_promoter_index
] != mutex
) {
661 self
->pending_promoter
[++self
->pending_promoter_index
] = mutex
;
662 mutex
->lck_mtx_waiters
++;
665 assert_wait((event_t
)(((unsigned int*)lck
)+((sizeof(lck_mtx_t
)-1)/sizeof(unsigned int))), THREAD_UNINT
);
666 lck_mtx_ilk_unlock(mutex
);
668 thread_block(THREAD_CONTINUE_NULL
);
670 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_LCK_WAIT_CODE
) | DBG_FUNC_END
, 0, 0, 0, 0, 0);
673 * Record the Dtrace lockstat probe for blocking, block time
674 * measured from when we were entered.
677 if (lck
->lck_mtx_tag
!= LCK_MTX_TAG_INDIRECT
) {
678 LOCKSTAT_RECORD(LS_LCK_MTX_LOCK_BLOCK
, lck
,
679 mach_absolute_time() - sleep_start
);
681 LOCKSTAT_RECORD(LS_LCK_MTX_EXT_LOCK_BLOCK
, lck
,
682 mach_absolute_time() - sleep_start
);
689 * Routine: lck_mtx_lock_acquire
691 * Invoked on acquiring the mutex when there is contention.
694 * Returns the current number of waiters.
696 * Called with the interlock locked.
699 lck_mtx_lock_acquire(
702 thread_t thread
= current_thread();
705 if (lck
->lck_mtx_tag
!= LCK_MTX_TAG_INDIRECT
)
708 mutex
= &lck
->lck_mtx_ptr
->lck_mtx
;
710 if (thread
->pending_promoter
[thread
->pending_promoter_index
] == mutex
) {
711 thread
->pending_promoter
[thread
->pending_promoter_index
] = NULL
;
712 if (thread
->pending_promoter_index
> 0)
713 thread
->pending_promoter_index
--;
714 mutex
->lck_mtx_waiters
--;
717 if (mutex
->lck_mtx_waiters
> 0) {
718 integer_t priority
= mutex
->lck_mtx_pri
;
719 spl_t s
= splsched();
722 thread
->promotions
++;
723 thread
->sched_flags
|= TH_SFLAG_PROMOTED
;
724 if (thread
->sched_pri
< priority
) {
725 KERNEL_DEBUG_CONSTANT(
726 MACHDBG_CODE(DBG_MACH_SCHED
,MACH_PROMOTE
) | DBG_FUNC_NONE
,
727 thread
->sched_pri
, priority
, 0, lck
, 0);
728 /* Do not promote past promotion ceiling */
729 assert(priority
<= MAXPRI_PROMOTE
);
730 set_sched_pri(thread
, priority
);
732 thread_unlock(thread
);
736 mutex
->lck_mtx_pri
= 0;
739 if (lockstat_probemap
[LS_LCK_MTX_LOCK_ACQUIRE
] || lockstat_probemap
[LS_LCK_MTX_EXT_LOCK_ACQUIRE
]) {
740 if (lck
->lck_mtx_tag
!= LCK_MTX_TAG_INDIRECT
) {
741 LOCKSTAT_RECORD(LS_LCK_MTX_LOCK_ACQUIRE
, lck
, 0);
743 LOCKSTAT_RECORD(LS_LCK_MTX_EXT_LOCK_ACQUIRE
, lck
, 0);
747 return (mutex
->lck_mtx_waiters
);
751 * Routine: lck_mtx_unlock_wakeup
753 * Invoked on unlock when there is contention.
755 * Called with the interlock locked.
758 lck_mtx_unlock_wakeup (
762 thread_t thread
= current_thread();
765 if (lck
->lck_mtx_tag
!= LCK_MTX_TAG_INDIRECT
)
768 mutex
= &lck
->lck_mtx_ptr
->lck_mtx
;
770 if (thread
!= holder
)
771 panic("lck_mtx_unlock_wakeup: mutex %p holder %p\n", mutex
, holder
);
773 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_UNLCK_WAKEUP_CODE
) | DBG_FUNC_START
, (int)lck
, (int)holder
, 0, 0, 0);
775 assert(mutex
->lck_mtx_waiters
> 0);
776 thread_wakeup_one((event_t
)(((unsigned int*)lck
)+(sizeof(lck_mtx_t
)-1)/sizeof(unsigned int)));
778 if (thread
->promotions
> 0) {
779 spl_t s
= splsched();
782 if ( --thread
->promotions
== 0 &&
783 (thread
->sched_flags
& TH_SFLAG_PROMOTED
) ) {
784 thread
->sched_flags
&= ~TH_SFLAG_PROMOTED
;
786 if (thread
->sched_flags
& TH_SFLAG_RW_PROMOTED
) {
787 /* Thread still has a RW lock promotion */
788 } else if (thread
->sched_flags
& TH_SFLAG_DEPRESSED_MASK
) {
789 KERNEL_DEBUG_CONSTANT(
790 MACHDBG_CODE(DBG_MACH_SCHED
,MACH_DEMOTE
) | DBG_FUNC_NONE
,
791 thread
->sched_pri
, DEPRESSPRI
, 0, lck
, 0);
793 set_sched_pri(thread
, DEPRESSPRI
);
796 if (thread
->priority
< thread
->sched_pri
) {
797 KERNEL_DEBUG_CONSTANT(
798 MACHDBG_CODE(DBG_MACH_SCHED
,MACH_DEMOTE
) |
800 thread
->sched_pri
, thread
->priority
,
804 SCHED(compute_priority
)(thread
, FALSE
);
807 thread_unlock(thread
);
811 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_UNLCK_WAKEUP_CODE
) | DBG_FUNC_END
, 0, 0, 0, 0, 0);
815 lck_mtx_unlockspin_wakeup (
818 assert(lck
->lck_mtx_waiters
> 0);
819 thread_wakeup_one((event_t
)(((unsigned int*)lck
)+(sizeof(lck_mtx_t
)-1)/sizeof(unsigned int)));
821 KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS
, LCK_MTX_UNLCK_WAKEUP_CODE
) | DBG_FUNC_NONE
, (int)lck
, 0, 0, 1, 0);
824 * When there are waiters, we skip the hot-patch spot in the
825 * fastpath, so we record it here.
827 LOCKSTAT_RECORD(LS_LCK_MTX_UNLOCK_RELEASE
, lck
, 0);
833 * Routine: mutex_pause
835 * Called by former callers of simple_lock_pause().
837 #define MAX_COLLISION_COUNTS 32
838 #define MAX_COLLISION 8
840 unsigned int max_collision_count
[MAX_COLLISION_COUNTS
];
842 uint32_t collision_backoffs
[MAX_COLLISION
] = {
843 10, 50, 100, 200, 400, 600, 800, 1000
848 mutex_pause(uint32_t collisions
)
850 wait_result_t wait_result
;
853 if (collisions
>= MAX_COLLISION_COUNTS
)
854 collisions
= MAX_COLLISION_COUNTS
- 1;
855 max_collision_count
[collisions
]++;
857 if (collisions
>= MAX_COLLISION
)
858 collisions
= MAX_COLLISION
- 1;
859 back_off
= collision_backoffs
[collisions
];
861 wait_result
= assert_wait_timeout((event_t
)mutex_pause
, THREAD_UNINT
, back_off
, NSEC_PER_USEC
);
862 assert(wait_result
== THREAD_WAITING
);
864 wait_result
= thread_block(THREAD_CONTINUE_NULL
);
865 assert(wait_result
== THREAD_TIMED_OUT
);
869 unsigned int mutex_yield_wait
= 0;
870 unsigned int mutex_yield_no_wait
= 0;
879 lck_mtx_assert(lck
, LCK_MTX_ASSERT_OWNED
);
882 if (lck
->lck_mtx_tag
== LCK_MTX_TAG_INDIRECT
)
883 waiters
= lck
->lck_mtx_ptr
->lck_mtx
.lck_mtx_waiters
;
885 waiters
= lck
->lck_mtx_waiters
;
888 mutex_yield_no_wait
++;
899 * Routine: lck_rw_sleep
904 lck_sleep_action_t lck_sleep_action
,
906 wait_interrupt_t interruptible
)
909 lck_rw_type_t lck_rw_type
;
910 thread_t thread
= current_thread();
912 if ((lck_sleep_action
& ~LCK_SLEEP_MASK
) != 0)
913 panic("Invalid lock sleep action %x\n", lck_sleep_action
);
915 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
917 * Although we are dropping the RW lock, the intent in most cases
918 * is that this thread remains as an observer, since it may hold
919 * some secondary resource, but must yield to avoid deadlock. In
920 * this situation, make sure that the thread is boosted to the
921 * RW lock ceiling while blocked, so that it can re-acquire the
922 * RW lock at that priority.
924 thread
->rwlock_count
++;
927 res
= assert_wait(event
, interruptible
);
928 if (res
== THREAD_WAITING
) {
929 lck_rw_type
= lck_rw_done(lck
);
930 res
= thread_block(THREAD_CONTINUE_NULL
);
931 if (!(lck_sleep_action
& LCK_SLEEP_UNLOCK
)) {
932 if (!(lck_sleep_action
& (LCK_SLEEP_SHARED
|LCK_SLEEP_EXCLUSIVE
)))
933 lck_rw_lock(lck
, lck_rw_type
);
934 else if (lck_sleep_action
& LCK_SLEEP_EXCLUSIVE
)
935 lck_rw_lock_exclusive(lck
);
937 lck_rw_lock_shared(lck
);
941 if (lck_sleep_action
& LCK_SLEEP_UNLOCK
)
942 (void)lck_rw_done(lck
);
944 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
945 if ((thread
->rwlock_count
-- == 1 /* field now 0 */) && (thread
->sched_flags
& TH_SFLAG_RW_PROMOTED
)) {
946 /* sched_flags checked without lock, but will be rechecked while clearing */
948 /* Only if the caller wanted the lck_rw_t returned unlocked should we drop to 0 */
949 assert(lck_sleep_action
& LCK_SLEEP_UNLOCK
);
951 lck_rw_clear_promotion(thread
);
960 * Routine: lck_rw_sleep_deadline
963 lck_rw_sleep_deadline(
965 lck_sleep_action_t lck_sleep_action
,
967 wait_interrupt_t interruptible
,
971 lck_rw_type_t lck_rw_type
;
972 thread_t thread
= current_thread();
974 if ((lck_sleep_action
& ~LCK_SLEEP_MASK
) != 0)
975 panic("Invalid lock sleep action %x\n", lck_sleep_action
);
977 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
978 thread
->rwlock_count
++;
981 res
= assert_wait_deadline(event
, interruptible
, deadline
);
982 if (res
== THREAD_WAITING
) {
983 lck_rw_type
= lck_rw_done(lck
);
984 res
= thread_block(THREAD_CONTINUE_NULL
);
985 if (!(lck_sleep_action
& LCK_SLEEP_UNLOCK
)) {
986 if (!(lck_sleep_action
& (LCK_SLEEP_SHARED
|LCK_SLEEP_EXCLUSIVE
)))
987 lck_rw_lock(lck
, lck_rw_type
);
988 else if (lck_sleep_action
& LCK_SLEEP_EXCLUSIVE
)
989 lck_rw_lock_exclusive(lck
);
991 lck_rw_lock_shared(lck
);
995 if (lck_sleep_action
& LCK_SLEEP_UNLOCK
)
996 (void)lck_rw_done(lck
);
998 if (lck_sleep_action
& LCK_SLEEP_PROMOTED_PRI
) {
999 if ((thread
->rwlock_count
-- == 1 /* field now 0 */) && (thread
->sched_flags
& TH_SFLAG_RW_PROMOTED
)) {
1000 /* sched_flags checked without lock, but will be rechecked while clearing */
1002 /* Only if the caller wanted the lck_rw_t returned unlocked should we drop to 0 */
1003 assert(lck_sleep_action
& LCK_SLEEP_UNLOCK
);
1005 lck_rw_clear_promotion(thread
);
1013 * Reader-writer lock promotion
1015 * We support a limited form of reader-writer
1016 * lock promotion whose effects are:
1018 * * Qualifying threads have decay disabled
1019 * * Scheduler priority is reset to a floor of
1020 * their statically assigned priority
1021 * or BASEPRI_BACKGROUND
1023 * The rationale is that lck_rw_ts do not have
1024 * a single owner, so we cannot apply a directed
1025 * priority boost from all waiting threads
1026 * to all holding threads without maintaining
1027 * lists of all shared owners and all waiting
1028 * threads for every lock.
1030 * Instead (and to preserve the uncontended fast-
1031 * path), acquiring (or attempting to acquire)
1032 * a RW lock in shared or exclusive lock increments
1033 * a per-thread counter. Only if that thread stops
1034 * making forward progress (for instance blocking
1035 * on a mutex, or being preempted) do we consult
1036 * the counter and apply the priority floor.
1037 * When the thread becomes runnable again (or in
1038 * the case of preemption it never stopped being
1039 * runnable), it has the priority boost and should
1040 * be in a good position to run on the CPU and
1041 * release all RW locks (at which point the priority
1042 * boost is cleared).
1044 * Care must be taken to ensure that priority
1045 * boosts are not retained indefinitely, since unlike
1046 * mutex priority boosts (where the boost is tied
1047 * to the mutex lifecycle), the boost is tied
1048 * to the thread and independent of any particular
1049 * lck_rw_t. Assertions are in place on return
1050 * to userspace so that the boost is not held longer than necessary.
1053 * The routines that increment/decrement the
1054 * per-thread counter should err on the side of
1055 * incrementing any time a preemption is possible
1056 * and the lock would be visible to the rest of the
1057 * system as held (so it should be incremented before
1058 * interlocks are dropped/preemption is enabled, or
1059 * before a CAS is executed to acquire the lock).
1064 * lck_rw_clear_promotion: Undo priority promotions when the last RW
1065 * lock is released by a thread (if a promotion was active)
1067 void lck_rw_clear_promotion(thread_t thread
)
1069 assert(thread
->rwlock_count
== 0);
1071 /* Cancel any promotions if the thread had actually blocked while holding a RW lock */
1072 spl_t s
= splsched();
1074 thread_lock(thread
);
1076 if (thread
->sched_flags
& TH_SFLAG_RW_PROMOTED
) {
1077 thread
->sched_flags
&= ~TH_SFLAG_RW_PROMOTED
;
1079 if (thread
->sched_flags
& TH_SFLAG_PROMOTED
) {
1080 /* Thread still has a mutex promotion */
1081 } else if (thread
->sched_flags
& TH_SFLAG_DEPRESSED_MASK
) {
1082 KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED
, MACH_RW_DEMOTE
) | DBG_FUNC_NONE
,
1083 thread
->sched_pri
, DEPRESSPRI
, 0, 0, 0);
1085 set_sched_pri(thread
, DEPRESSPRI
);
1087 KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED
, MACH_RW_DEMOTE
) | DBG_FUNC_NONE
,
1088 thread
->sched_pri
, thread
->priority
, 0, 0, 0);
1090 SCHED(compute_priority
)(thread
, FALSE
);
1094 thread_unlock(thread
);
1099 host_lockgroup_info(
1101 lockgroup_info_array_t
*lockgroup_infop
,
1102 mach_msg_type_number_t
*lockgroup_infoCntp
)
1104 lockgroup_info_t
*lockgroup_info_base
;
1105 lockgroup_info_t
*lockgroup_info
;
1106 vm_offset_t lockgroup_info_addr
;
1107 vm_size_t lockgroup_info_size
;
1114 if (host
== HOST_NULL
)
1115 return KERN_INVALID_HOST
;
1117 lck_mtx_lock(&lck_grp_lock
);
1119 lockgroup_info_size
= round_page(lck_grp_cnt
* sizeof *lockgroup_info
);
1120 kr
= kmem_alloc_pageable(ipc_kernel_map
,
1121 &lockgroup_info_addr
, lockgroup_info_size
);
1122 if (kr
!= KERN_SUCCESS
) {
1123 lck_mtx_unlock(&lck_grp_lock
);
1127 lockgroup_info_base
= (lockgroup_info_t
*) lockgroup_info_addr
;
1128 lck_grp
= (lck_grp_t
*)queue_first(&lck_grp_queue
);
1129 lockgroup_info
= lockgroup_info_base
;
1131 for (i
= 0; i
< lck_grp_cnt
; i
++) {
1133 lockgroup_info
->lock_spin_cnt
= lck_grp
->lck_grp_spincnt
;
1134 lockgroup_info
->lock_spin_util_cnt
= lck_grp
->lck_grp_stat
.lck_grp_spin_stat
.lck_grp_spin_util_cnt
;
1135 lockgroup_info
->lock_spin_held_cnt
= lck_grp
->lck_grp_stat
.lck_grp_spin_stat
.lck_grp_spin_held_cnt
;
1136 lockgroup_info
->lock_spin_miss_cnt
= lck_grp
->lck_grp_stat
.lck_grp_spin_stat
.lck_grp_spin_miss_cnt
;
1137 lockgroup_info
->lock_spin_held_max
= lck_grp
->lck_grp_stat
.lck_grp_spin_stat
.lck_grp_spin_held_max
;
1138 lockgroup_info
->lock_spin_held_cum
= lck_grp
->lck_grp_stat
.lck_grp_spin_stat
.lck_grp_spin_held_cum
;
1140 lockgroup_info
->lock_mtx_cnt
= lck_grp
->lck_grp_mtxcnt
;
1141 lockgroup_info
->lock_mtx_util_cnt
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_util_cnt
;
1142 lockgroup_info
->lock_mtx_held_cnt
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_held_cnt
;
1143 lockgroup_info
->lock_mtx_miss_cnt
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_miss_cnt
;
1144 lockgroup_info
->lock_mtx_wait_cnt
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_wait_cnt
;
1145 lockgroup_info
->lock_mtx_held_max
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_held_max
;
1146 lockgroup_info
->lock_mtx_held_cum
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_held_cum
;
1147 lockgroup_info
->lock_mtx_wait_max
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_wait_max
;
1148 lockgroup_info
->lock_mtx_wait_cum
= lck_grp
->lck_grp_stat
.lck_grp_mtx_stat
.lck_grp_mtx_wait_cum
;
1150 lockgroup_info
->lock_rw_cnt
= lck_grp
->lck_grp_rwcnt
;
1151 lockgroup_info
->lock_rw_util_cnt
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_util_cnt
;
1152 lockgroup_info
->lock_rw_held_cnt
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_held_cnt
;
1153 lockgroup_info
->lock_rw_miss_cnt
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_miss_cnt
;
1154 lockgroup_info
->lock_rw_wait_cnt
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_wait_cnt
;
1155 lockgroup_info
->lock_rw_held_max
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_held_max
;
1156 lockgroup_info
->lock_rw_held_cum
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_held_cum
;
1157 lockgroup_info
->lock_rw_wait_max
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_wait_max
;
1158 lockgroup_info
->lock_rw_wait_cum
= lck_grp
->lck_grp_stat
.lck_grp_rw_stat
.lck_grp_rw_wait_cum
;
1160 (void) strncpy(lockgroup_info
->lockgroup_name
,lck_grp
->lck_grp_name
, LOCKGROUP_MAX_NAME
);
1162 lck_grp
= (lck_grp_t
*)(queue_next((queue_entry_t
)(lck_grp
)));
1166 *lockgroup_infoCntp
= lck_grp_cnt
;
1167 lck_mtx_unlock(&lck_grp_lock
);
1169 used
= (*lockgroup_infoCntp
) * sizeof *lockgroup_info
;
1171 if (used
!= lockgroup_info_size
)
1172 bzero((char *) lockgroup_info
, lockgroup_info_size
- used
);
1174 kr
= vm_map_copyin(ipc_kernel_map
, (vm_map_address_t
)lockgroup_info_addr
,
1175 (vm_map_size_t
)lockgroup_info_size
, TRUE
, ©
);
1176 assert(kr
== KERN_SUCCESS
);
1178 *lockgroup_infop
= (lockgroup_info_t
*) copy
;
1180 return(KERN_SUCCESS
);