X-Git-Url: https://git.saurik.com/apple/xnu.git/blobdiff_plain/3e170ce000f1506b7b5d2c5c7faec85ceabb573d..eb6b6ca394357805f2bdba989abae309f718b4d8:/osfmk/kern/locks.c diff --git a/osfmk/kern/locks.c b/osfmk/kern/locks.c index 4a498b214..78aee369c 100644 --- a/osfmk/kern/locks.c +++ b/osfmk/kern/locks.c @@ -1,8 +1,8 @@ /* - * Copyright (c) 2000-2007 Apple Inc. All rights reserved. + * Copyright (c) 2000-2019 Apple Inc. All rights reserved. * * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ - * + * * This file contains Original Code and/or Modifications of Original Code * as defined in and that are subject to the Apple Public Source License * Version 2.0 (the 'License'). You may not use this file except in @@ -11,10 +11,10 @@ * unlawful or unlicensed copies of an Apple operating system, or to * circumvent, violate, or enable the circumvention or violation of, any * terms of an Apple operating system software license agreement. - * + * * Please obtain a copy of the License at * http://www.opensource.apple.com/apsl/ and read it before using this file. - * + * * The Original Code and all software distributed under the License are * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, @@ -22,37 +22,40 @@ * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. * Please see the License for the specific language governing rights and * limitations under the License. - * + * * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ */ /* * @OSF_COPYRIGHT@ */ -/* +/* * Mach Operating System * Copyright (c) 1991,1990,1989,1988,1987 Carnegie Mellon University * All Rights Reserved. - * + * * Permission to use, copy, modify and distribute this software and its * documentation is hereby granted, provided that both the copyright * notice and this permission notice appear in all copies of the * software, derivative works or modified versions, and any portions * thereof, and that both notices appear in supporting documentation. - * + * * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS" * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND FOR * ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE. - * + * * Carnegie Mellon requests users of this software to return to - * + * * Software Distribution Coordinator or Software.Distribution@CS.CMU.EDU * School of Computer Science * Carnegie Mellon University * Pittsburgh PA 15213-3890 - * + * * any improvements or extensions that they make and grant Carnegie Mellon * the rights to redistribute these changes. */ + +#define LOCK_PRIVATE 1 + #include #include @@ -60,6 +63,7 @@ #include #include +#include #include #include #include @@ -67,35 +71,59 @@ #include #include #include +#include +#include +#include #include - #include -#if CONFIG_DTRACE -/* - * We need only enough declarations from the BSD-side to be able to - * test if our probe is active, and to call __dtrace_probe(). Setting - * NEED_DTRACE_DEFS gets a local copy of those definitions pulled in. 
- */ -#define NEED_DTRACE_DEFS -#include <../bsd/sys/lockstat.h> +#define LCK_MTX_SLEEP_CODE 0 +#define LCK_MTX_SLEEP_DEADLINE_CODE 1 +#define LCK_MTX_LCK_WAIT_CODE 2 +#define LCK_MTX_UNLCK_WAKEUP_CODE 3 + +#if MACH_LDEBUG +#define ALIGN_TEST(p, t) do{if((uintptr_t)p&(sizeof(t)-1)) __builtin_trap();}while(0) +#else +#define ALIGN_TEST(p, t) do{}while(0) #endif -#define LCK_MTX_SLEEP_CODE 0 -#define LCK_MTX_SLEEP_DEADLINE_CODE 1 -#define LCK_MTX_LCK_WAIT_CODE 2 -#define LCK_MTX_UNLCK_WAKEUP_CODE 3 +#define NOINLINE __attribute__((noinline)) + +#define ordered_load_hw(lock) os_atomic_load(&(lock)->lock_data, compiler_acq_rel) +#define ordered_store_hw(lock, value) os_atomic_store(&(lock)->lock_data, (value), compiler_acq_rel) -static queue_head_t lck_grp_queue; -static unsigned int lck_grp_cnt; -decl_lck_mtx_data(static,lck_grp_lock) +queue_head_t lck_grp_queue; +unsigned int lck_grp_cnt; + +decl_lck_mtx_data(, lck_grp_lock); static lck_mtx_ext_t lck_grp_lock_ext; -lck_grp_attr_t LockDefaultGroupAttr; -lck_grp_t LockCompatGroup; -lck_attr_t LockDefaultLckAttr; +SECURITY_READ_ONLY_LATE(boolean_t) spinlock_timeout_panic = TRUE; + +lck_grp_attr_t LockDefaultGroupAttr; +lck_grp_t LockCompatGroup; +lck_attr_t LockDefaultLckAttr; + +#if CONFIG_DTRACE && __SMP__ +#if defined (__x86_64__) +uint64_t dtrace_spin_threshold = 500; // 500ns +#elif defined(__arm__) || defined(__arm64__) +uint64_t dtrace_spin_threshold = LOCK_PANIC_TIMEOUT / 1000000; // 500ns +#endif +#endif + +uintptr_t +unslide_for_kdebug(void* object) +{ + if (__improbable(kdebug_enable)) { + return VM_KERNEL_UNSLIDE_OR_PERM(object); + } else { + return 0; + } +} /* * Routine: lck_mod_init @@ -108,50 +136,61 @@ lck_mod_init( /* * Obtain "lcks" options:this currently controls lock statistics */ - if (!PE_parse_boot_argn("lcks", &LcksOpts, sizeof (LcksOpts))) + if (!PE_parse_boot_argn("lcks", &LcksOpts, sizeof(LcksOpts))) { LcksOpts = 0; + } + + +#if (DEVELOPMENT || DEBUG) && defined(__x86_64__) + if (!PE_parse_boot_argn("-disable_mtx_chk", &LckDisablePreemptCheck, sizeof(LckDisablePreemptCheck))) { + LckDisablePreemptCheck = 0; + } +#endif /* (DEVELOPMENT || DEBUG) && defined(__x86_64__) */ queue_init(&lck_grp_queue); - - /* + + /* * Need to bootstrap the LockCompatGroup instead of calling lck_grp_init() here. This avoids * grabbing the lck_grp_lock before it is initialized. 
*/ - + bzero(&LockCompatGroup, sizeof(lck_grp_t)); (void) strncpy(LockCompatGroup.lck_grp_name, "Compatibility APIs", LCK_GRP_MAX_NAME); - - if (LcksOpts & enaLkStat) - LockCompatGroup.lck_grp_attr = LCK_GRP_ATTR_STAT; - else - LockCompatGroup.lck_grp_attr = LCK_ATTR_NONE; - - LockCompatGroup.lck_grp_refcnt = 1; - + + LockCompatGroup.lck_grp_attr = LCK_ATTR_NONE; + if (LcksOpts & enaLkStat) { + LockCompatGroup.lck_grp_attr |= LCK_GRP_ATTR_STAT; + } + if (LcksOpts & enaLkTimeStat) { + LockCompatGroup.lck_grp_attr |= LCK_GRP_ATTR_TIME_STAT; + } + + os_ref_init(&LockCompatGroup.lck_grp_refcnt, NULL); + enqueue_tail(&lck_grp_queue, (queue_entry_t)&LockCompatGroup); lck_grp_cnt = 1; - + lck_grp_attr_setdefault(&LockDefaultGroupAttr); lck_attr_setdefault(&LockDefaultLckAttr); - + lck_mtx_init_ext(&lck_grp_lock, &lck_grp_lock_ext, &LockCompatGroup, &LockDefaultLckAttr); - } /* * Routine: lck_grp_attr_alloc_init */ -lck_grp_attr_t * +lck_grp_attr_t * lck_grp_attr_alloc_init( void) { - lck_grp_attr_t *attr; + lck_grp_attr_t *attr; - if ((attr = (lck_grp_attr_t *)kalloc(sizeof(lck_grp_attr_t))) != 0) + if ((attr = (lck_grp_attr_t *)kalloc(sizeof(lck_grp_attr_t))) != 0) { lck_grp_attr_setdefault(attr); + } - return(attr); + return attr; } @@ -161,34 +200,35 @@ lck_grp_attr_alloc_init( void lck_grp_attr_setdefault( - lck_grp_attr_t *attr) + lck_grp_attr_t *attr) { - if (LcksOpts & enaLkStat) + if (LcksOpts & enaLkStat) { attr->grp_attr_val = LCK_GRP_ATTR_STAT; - else + } else { attr->grp_attr_val = 0; + } } /* - * Routine: lck_grp_attr_setstat + * Routine: lck_grp_attr_setstat */ void lck_grp_attr_setstat( - lck_grp_attr_t *attr) + lck_grp_attr_t *attr) { - (void)hw_atomic_or(&attr->grp_attr_val, LCK_GRP_ATTR_STAT); + os_atomic_or(&attr->grp_attr_val, LCK_GRP_ATTR_STAT, relaxed); } /* - * Routine: lck_grp_attr_free + * Routine: lck_grp_attr_free */ void lck_grp_attr_free( - lck_grp_attr_t *attr) + lck_grp_attr_t *attr) { kfree(attr, sizeof(lck_grp_attr_t)); } @@ -200,15 +240,16 @@ lck_grp_attr_free( lck_grp_t * lck_grp_alloc_init( - const char* grp_name, - lck_grp_attr_t *attr) + const char* grp_name, + lck_grp_attr_t *attr) { - lck_grp_t *grp; + lck_grp_t *grp; - if ((grp = (lck_grp_t *)kalloc(sizeof(lck_grp_t))) != 0) + if ((grp = (lck_grp_t *)kalloc(sizeof(lck_grp_t))) != 0) { lck_grp_init(grp, grp_name, attr); + } - return(grp); + return grp; } /* @@ -218,18 +259,45 @@ lck_grp_alloc_init( void lck_grp_init(lck_grp_t * grp, const char * grp_name, lck_grp_attr_t * attr) { + /* make sure locking infrastructure has been initialized */ + assert(lck_grp_cnt > 0); + bzero((void *)grp, sizeof(lck_grp_t)); (void)strlcpy(grp->lck_grp_name, grp_name, LCK_GRP_MAX_NAME); - if (attr != LCK_GRP_ATTR_NULL) + if (attr != LCK_GRP_ATTR_NULL) { grp->lck_grp_attr = attr->grp_attr_val; - else if (LcksOpts & enaLkStat) - grp->lck_grp_attr = LCK_GRP_ATTR_STAT; - else - grp->lck_grp_attr = LCK_ATTR_NONE; + } else { + grp->lck_grp_attr = 0; + if (LcksOpts & enaLkStat) { + grp->lck_grp_attr |= LCK_GRP_ATTR_STAT; + } + if (LcksOpts & enaLkTimeStat) { + grp->lck_grp_attr |= LCK_GRP_ATTR_TIME_STAT; + } + } + + if (grp->lck_grp_attr & LCK_GRP_ATTR_STAT) { + lck_grp_stats_t *stats = &grp->lck_grp_stats; + +#if LOCK_STATS + lck_grp_stat_enable(&stats->lgss_spin_held); + lck_grp_stat_enable(&stats->lgss_spin_miss); +#endif /* LOCK_STATS */ + + lck_grp_stat_enable(&stats->lgss_mtx_held); + lck_grp_stat_enable(&stats->lgss_mtx_miss); + lck_grp_stat_enable(&stats->lgss_mtx_direct_wait); + } + if (grp->lck_grp_attr * 
LCK_GRP_ATTR_TIME_STAT) { +#if LOCK_STATS + lck_grp_stats_t *stats = &grp->lck_grp_stats; + lck_grp_stat_enable(&stats->lgss_spin_spin); +#endif /* LOCK_STATS */ + } - grp->lck_grp_refcnt = 1; + os_ref_init(&grp->lck_grp_refcnt, NULL); lck_mtx_lock(&lck_grp_lock); enqueue_tail(&lck_grp_queue, (queue_entry_t)grp); @@ -238,12 +306,12 @@ lck_grp_init(lck_grp_t * grp, const char * grp_name, lck_grp_attr_t * attr) } /* - * Routine: lck_grp_free + * Routine: lck_grp_free */ void lck_grp_free( - lck_grp_t *grp) + lck_grp_t *grp) { lck_mtx_lock(&lck_grp_lock); lck_grp_cnt--; @@ -254,27 +322,30 @@ lck_grp_free( /* - * Routine: lck_grp_reference + * Routine: lck_grp_reference */ void lck_grp_reference( - lck_grp_t *grp) + lck_grp_t *grp) { - (void)hw_atomic_add(&grp->lck_grp_refcnt, 1); + os_ref_retain(&grp->lck_grp_refcnt); } /* - * Routine: lck_grp_deallocate + * Routine: lck_grp_deallocate */ void lck_grp_deallocate( - lck_grp_t *grp) + lck_grp_t *grp) { - if (hw_atomic_sub(&grp->lck_grp_refcnt, 1) == 0) - kfree(grp, sizeof(lck_grp_t)); + if (os_ref_release(&grp->lck_grp_refcnt) != 0) { + return; + } + + kfree(grp, sizeof(lck_grp_t)); } /* @@ -283,10 +354,10 @@ lck_grp_deallocate( void lck_grp_lckcnt_incr( - lck_grp_t *grp, - lck_type_t lck_type) + lck_grp_t *grp, + lck_type_t lck_type) { - unsigned int *lckcnt; + unsigned int *lckcnt; switch (lck_type) { case LCK_TYPE_SPIN: @@ -302,7 +373,7 @@ lck_grp_lckcnt_incr( return panic("lck_grp_lckcnt_incr(): invalid lock type: %d\n", lck_type); } - (void)hw_atomic_add(lckcnt, 1); + os_atomic_inc(lckcnt, relaxed); } /* @@ -311,10 +382,11 @@ lck_grp_lckcnt_incr( void lck_grp_lckcnt_decr( - lck_grp_t *grp, - lck_type_t lck_type) + lck_grp_t *grp, + lck_type_t lck_type) { - unsigned int *lckcnt; + unsigned int *lckcnt; + int updated; switch (lck_type) { case LCK_TYPE_SPIN: @@ -327,10 +399,12 @@ lck_grp_lckcnt_decr( lckcnt = &grp->lck_grp_rwcnt; break; default: - return panic("lck_grp_lckcnt_decr(): invalid lock type: %d\n", lck_type); + panic("lck_grp_lckcnt_decr(): invalid lock type: %d\n", lck_type); + return; } - (void)hw_atomic_sub(lckcnt, 1); + updated = os_atomic_dec(lckcnt, relaxed); + assert(updated >= 0); } /* @@ -341,12 +415,13 @@ lck_attr_t * lck_attr_alloc_init( void) { - lck_attr_t *attr; + lck_attr_t *attr; - if ((attr = (lck_attr_t *)kalloc(sizeof(lck_attr_t))) != 0) + if ((attr = (lck_attr_t *)kalloc(sizeof(lck_attr_t))) != 0) { lck_attr_setdefault(attr); + } - return(attr); + return attr; } @@ -356,20 +431,24 @@ lck_attr_alloc_init( void lck_attr_setdefault( - lck_attr_t *attr) + lck_attr_t *attr) { -#if __i386__ || __x86_64__ +#if __arm__ || __arm64__ + /* : Using LCK_ATTR_DEBUG here causes panic at boot time for arm */ + attr->lck_attr_val = LCK_ATTR_NONE; +#elif __i386__ || __x86_64__ #if !DEBUG - if (LcksOpts & enaLkDeb) - attr->lck_attr_val = LCK_ATTR_DEBUG; - else - attr->lck_attr_val = LCK_ATTR_NONE; + if (LcksOpts & enaLkDeb) { + attr->lck_attr_val = LCK_ATTR_DEBUG; + } else { + attr->lck_attr_val = LCK_ATTR_NONE; + } #else - attr->lck_attr_val = LCK_ATTR_DEBUG; -#endif /* !DEBUG */ + attr->lck_attr_val = LCK_ATTR_DEBUG; +#endif /* !DEBUG */ #else #error Unknown architecture. 
-#endif /* __arm__ */ +#endif /* __arm__ */ } @@ -378,9 +457,9 @@ lck_attr_setdefault( */ void lck_attr_setdebug( - lck_attr_t *attr) + lck_attr_t *attr) { - (void)hw_atomic_or(&attr->lck_attr_val, LCK_ATTR_DEBUG); + os_atomic_or(&attr->lck_attr_val, LCK_ATTR_DEBUG, relaxed); } /* @@ -388,9 +467,9 @@ lck_attr_setdebug( */ void lck_attr_cleardebug( - lck_attr_t *attr) + lck_attr_t *attr) { - (void)hw_atomic_and(&attr->lck_attr_val, ~LCK_ATTR_DEBUG); + os_atomic_andnot(&attr->lck_attr_val, LCK_ATTR_DEBUG, relaxed); } @@ -399,9 +478,9 @@ lck_attr_cleardebug( */ void lck_attr_rw_shared_priority( - lck_attr_t *attr) + lck_attr_t *attr) { - (void)hw_atomic_or(&attr->lck_attr_val, LCK_ATTR_RW_SHARED_PRIORITY); + os_atomic_or(&attr->lck_attr_val, LCK_ATTR_RW_SHARED_PRIORITY, relaxed); } @@ -410,796 +489,2765 @@ lck_attr_rw_shared_priority( */ void lck_attr_free( - lck_attr_t *attr) + lck_attr_t *attr) { kfree(attr, sizeof(lck_attr_t)); } - /* - * Routine: lck_spin_sleep + * Routine: hw_lock_init + * + * Initialize a hardware lock. */ -wait_result_t -lck_spin_sleep( - lck_spin_t *lck, - lck_sleep_action_t lck_sleep_action, - event_t event, - wait_interrupt_t interruptible) -{ - wait_result_t res; - - if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) - panic("Invalid lock sleep action %x\n", lck_sleep_action); +void +hw_lock_init(hw_lock_t lock) +{ + ordered_store_hw(lock, 0); +} - res = assert_wait(event, interruptible); - if (res == THREAD_WAITING) { - lck_spin_unlock(lck); - res = thread_block(THREAD_CONTINUE_NULL); - if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) - lck_spin_lock(lck); +#if __SMP__ +static inline bool +hw_lock_trylock_contended(hw_lock_t lock, uintptr_t newval) +{ +#if OS_ATOMIC_USE_LLSC + uintptr_t oldval; + os_atomic_rmw_loop(&lock->lock_data, oldval, newval, acquire, { + if (oldval != 0) { + wait_for_event(); // clears the monitor so we don't need give_up() + return false; + } + }); + return true; +#else // !OS_ATOMIC_USE_LLSC +#if OS_ATOMIC_HAS_LLSC + uintptr_t oldval = os_atomic_load_exclusive(&lock->lock_data, relaxed); + if (oldval != 0) { + wait_for_event(); // clears the monitor so we don't need give_up() + return false; } - else - if (lck_sleep_action & LCK_SLEEP_UNLOCK) - lck_spin_unlock(lck); - - return res; +#endif // OS_ATOMIC_HAS_LLSC + return os_atomic_cmpxchg(&lock->lock_data, 0, newval, acquire); +#endif // !OS_ATOMIC_USE_LLSC } - /* - * Routine: lck_spin_sleep_deadline + * Routine: hw_lock_lock_contended + * + * Spin until lock is acquired or timeout expires. + * timeout is in mach_absolute_time ticks. Called with + * preemption disabled. 
*/ -wait_result_t -lck_spin_sleep_deadline( - lck_spin_t *lck, - lck_sleep_action_t lck_sleep_action, - event_t event, - wait_interrupt_t interruptible, - uint64_t deadline) +static unsigned int NOINLINE +hw_lock_lock_contended(hw_lock_t lock, uintptr_t data, uint64_t timeout, boolean_t do_panic LCK_GRP_ARG(lck_grp_t *grp)) { - wait_result_t res; - - if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) - panic("Invalid lock sleep action %x\n", lck_sleep_action); + uint64_t end = 0; + uintptr_t holder = lock->lock_data; + int i; - res = assert_wait_deadline(event, interruptible, deadline); - if (res == THREAD_WAITING) { - lck_spin_unlock(lck); - res = thread_block(THREAD_CONTINUE_NULL); - if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) - lck_spin_lock(lck); + if (timeout == 0) { + timeout = LOCK_PANIC_TIMEOUT; } - else - if (lck_sleep_action & LCK_SLEEP_UNLOCK) - lck_spin_unlock(lck); +#if CONFIG_DTRACE || LOCK_STATS + uint64_t begin = 0; + boolean_t stat_enabled = lck_grp_spin_spin_enabled(lock LCK_GRP_ARG(grp)); +#endif /* CONFIG_DTRACE || LOCK_STATS */ + +#if LOCK_STATS || CONFIG_DTRACE + if (__improbable(stat_enabled)) { + begin = mach_absolute_time(); + } +#endif /* LOCK_STATS || CONFIG_DTRACE */ + for (;;) { + for (i = 0; i < LOCK_SNOOP_SPINS; i++) { + cpu_pause(); +#if (!__ARM_ENABLE_WFE_) || (LOCK_PRETEST) + holder = ordered_load_hw(lock); + if (holder != 0) { + continue; + } +#endif + if (hw_lock_trylock_contended(lock, data)) { +#if CONFIG_DTRACE || LOCK_STATS + if (__improbable(stat_enabled)) { + lck_grp_spin_update_spin(lock LCK_GRP_ARG(grp), mach_absolute_time() - begin); + } + lck_grp_spin_update_miss(lock LCK_GRP_ARG(grp)); +#endif /* CONFIG_DTRACE || LOCK_STATS */ + return 1; + } + } + if (end == 0) { + end = ml_get_timebase() + timeout; + } else if (ml_get_timebase() >= end) { + break; + } + } + if (do_panic) { + // Capture the actual time spent blocked, which may be higher than the timeout + // if a misbehaving interrupt stole this thread's CPU time. 
+ panic("Spinlock timeout after %llu ticks, %p = %lx", + (ml_get_timebase() - end + timeout), lock, holder); + } + return 0; +} +#endif // __SMP__ - return res; +void * +hw_wait_while_equals(void **address, void *current) +{ +#if __SMP__ + void *v; + uint64_t end = 0; + + for (;;) { + for (int i = 0; i < LOCK_SNOOP_SPINS; i++) { + cpu_pause(); +#if OS_ATOMIC_HAS_LLSC + v = os_atomic_load_exclusive(address, relaxed); + if (__probable(v != current)) { + os_atomic_clear_exclusive(); + return v; + } + wait_for_event(); +#else + v = os_atomic_load(address, relaxed); + if (__probable(v != current)) { + return v; + } +#endif // OS_ATOMIC_HAS_LLSC + } + if (end == 0) { + end = ml_get_timebase() + LOCK_PANIC_TIMEOUT; + } else if (ml_get_timebase() >= end) { + panic("Wait while equals timeout @ *%p == %p", address, v); + } + } +#else // !__SMP__ + panic("Value at %p is %p", address, current); + __builtin_unreachable(); +#endif // !__SMP__ } +static inline void +hw_lock_lock_internal(hw_lock_t lock, thread_t thread LCK_GRP_ARG(lck_grp_t *grp)) +{ + uintptr_t state; + + state = LCK_MTX_THREAD_TO_STATE(thread) | PLATFORM_LCK_ILOCK; +#if __SMP__ +#if LOCK_PRETEST + if (ordered_load_hw(lock)) { + goto contended; + } +#endif // LOCK_PRETEST + if (hw_lock_trylock_contended(lock, state)) { + goto end; + } +#if LOCK_PRETEST +contended: +#endif // LOCK_PRETEST + hw_lock_lock_contended(lock, state, 0, spinlock_timeout_panic LCK_GRP_ARG(grp)); +end: +#else // __SMP__ + if (lock->lock_data) { + panic("Spinlock held %p", lock); + } + lock->lock_data = state; +#endif // __SMP__ + lck_grp_spin_update_held(lock LCK_GRP_ARG(grp)); + + return; +} /* - * Routine: lck_mtx_clear_promoted + * Routine: hw_lock_lock * - * Handle clearing of TH_SFLAG_PROMOTED, - * adjusting thread priority as needed. - * - * Called with thread lock held + * Acquire lock, spinning until it becomes available, + * return with preemption disabled. */ -static void -lck_mtx_clear_promoted ( - thread_t thread, - __kdebug_only uintptr_t trace_lck) +void +(hw_lock_lock)(hw_lock_t lock LCK_GRP_ARG(lck_grp_t *grp)) { - thread->sched_flags &= ~TH_SFLAG_PROMOTED; + thread_t thread = current_thread(); + disable_preemption_for_thread(thread); + hw_lock_lock_internal(lock, thread LCK_GRP_ARG(grp)); +} - if (thread->sched_flags & TH_SFLAG_RW_PROMOTED) { - /* Thread still has a RW lock promotion */ - } else if (thread->sched_flags & TH_SFLAG_DEPRESSED_MASK) { - KERNEL_DEBUG_CONSTANT( - MACHDBG_CODE(DBG_MACH_SCHED,MACH_DEMOTE) | DBG_FUNC_NONE, - thread->sched_pri, DEPRESSPRI, 0, trace_lck, 0); - set_sched_pri(thread, DEPRESSPRI); - } else { - if (thread->base_pri < thread->sched_pri) { - KERNEL_DEBUG_CONSTANT( - MACHDBG_CODE(DBG_MACH_SCHED,MACH_DEMOTE) | DBG_FUNC_NONE, - thread->sched_pri, thread->base_pri, 0, trace_lck, 0); - } - thread_recompute_sched_pri(thread, FALSE); +/* + * Routine: hw_lock_lock_nopreempt + * + * Acquire lock, spinning until it becomes available. + */ +void +(hw_lock_lock_nopreempt)(hw_lock_t lock LCK_GRP_ARG(lck_grp_t *grp)) +{ + thread_t thread = current_thread(); + if (__improbable(!preemption_disabled_for_thread(thread))) { + panic("Attempt to take no-preempt spinlock %p in preemptible context", lock); } + hw_lock_lock_internal(lock, thread LCK_GRP_ARG(grp)); } - /* - * Routine: lck_mtx_sleep + * Routine: hw_lock_to + * + * Acquire lock, spinning until it becomes available or timeout. + * Timeout is in mach_absolute_time ticks, return with + * preemption disabled. 
*/ -wait_result_t -lck_mtx_sleep( - lck_mtx_t *lck, - lck_sleep_action_t lck_sleep_action, - event_t event, - wait_interrupt_t interruptible) -{ - wait_result_t res; - thread_t thread = current_thread(); - - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_CODE) | DBG_FUNC_START, - VM_KERNEL_UNSLIDE_OR_PERM(lck), (int)lck_sleep_action, VM_KERNEL_UNSLIDE_OR_PERM(event), (int)interruptible, 0); - - if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) - panic("Invalid lock sleep action %x\n", lck_sleep_action); - - if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { - /* - * We overload the RW lock promotion to give us a priority ceiling - * during the time that this thread is asleep, so that when it - * is re-awakened (and not yet contending on the mutex), it is - * runnable at a reasonably high priority. - */ - thread->rwlock_count++; +unsigned +int +(hw_lock_to)(hw_lock_t lock, uint64_t timeout LCK_GRP_ARG(lck_grp_t *grp)) +{ + thread_t thread; + uintptr_t state; + unsigned int success = 0; + + thread = current_thread(); + disable_preemption_for_thread(thread); + state = LCK_MTX_THREAD_TO_STATE(thread) | PLATFORM_LCK_ILOCK; +#if __SMP__ +#if LOCK_PRETEST + if (ordered_load_hw(lock)) { + goto contended; } - - res = assert_wait(event, interruptible); - if (res == THREAD_WAITING) { - lck_mtx_unlock(lck); - res = thread_block(THREAD_CONTINUE_NULL); - if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { - if ((lck_sleep_action & LCK_SLEEP_SPIN)) - lck_mtx_lock_spin(lck); - else - lck_mtx_lock(lck); - } +#endif // LOCK_PRETEST + if (hw_lock_trylock_contended(lock, state)) { + success = 1; + goto end; } - else - if (lck_sleep_action & LCK_SLEEP_UNLOCK) - lck_mtx_unlock(lck); - - if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { - if ((thread->rwlock_count-- == 1 /* field now 0 */) && (thread->sched_flags & TH_SFLAG_RW_PROMOTED)) { - /* sched_flags checked without lock, but will be rechecked while clearing */ - lck_rw_clear_promotion(thread); - } +#if LOCK_PRETEST +contended: +#endif // LOCK_PRETEST + success = hw_lock_lock_contended(lock, state, timeout, FALSE LCK_GRP_ARG(grp)); +end: +#else // __SMP__ + (void)timeout; + if (ordered_load_hw(lock) == 0) { + ordered_store_hw(lock, state); + success = 1; } - - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_CODE) | DBG_FUNC_END, (int)res, 0, 0, 0, 0); - - return res; +#endif // __SMP__ + if (success) { + lck_grp_spin_update_held(lock LCK_GRP_ARG(grp)); + } + return success; } - /* - * Routine: lck_mtx_sleep_deadline + * Routine: hw_lock_try + * + * returns with preemption disabled on success. */ -wait_result_t -lck_mtx_sleep_deadline( - lck_mtx_t *lck, - lck_sleep_action_t lck_sleep_action, - event_t event, - wait_interrupt_t interruptible, - uint64_t deadline) +static inline unsigned int +hw_lock_try_internal(hw_lock_t lock, thread_t thread LCK_GRP_ARG(lck_grp_t *grp)) { - wait_result_t res; - thread_t thread = current_thread(); - - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_DEADLINE_CODE) | DBG_FUNC_START, - VM_KERNEL_UNSLIDE_OR_PERM(lck), (int)lck_sleep_action, VM_KERNEL_UNSLIDE_OR_PERM(event), (int)interruptible, 0); - - if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) - panic("Invalid lock sleep action %x\n", lck_sleep_action); + int success = 0; - if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { - /* - * See lck_mtx_sleep(). 
- */ - thread->rwlock_count++; +#if __SMP__ +#if LOCK_PRETEST + if (ordered_load_hw(lock)) { + goto failed; } - - res = assert_wait_deadline(event, interruptible, deadline); - if (res == THREAD_WAITING) { - lck_mtx_unlock(lck); - res = thread_block(THREAD_CONTINUE_NULL); - if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { - if ((lck_sleep_action & LCK_SLEEP_SPIN)) - lck_mtx_lock_spin(lck); - else - lck_mtx_lock(lck); - } +#endif // LOCK_PRETEST + success = os_atomic_cmpxchg(&lock->lock_data, 0, + LCK_MTX_THREAD_TO_STATE(thread) | PLATFORM_LCK_ILOCK, acquire); +#else + if (lock->lock_data == 0) { + lock->lock_data = LCK_MTX_THREAD_TO_STATE(thread) | PLATFORM_LCK_ILOCK; + success = 1; } - else - if (lck_sleep_action & LCK_SLEEP_UNLOCK) - lck_mtx_unlock(lck); +#endif // __SMP__ - if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { - if ((thread->rwlock_count-- == 1 /* field now 0 */) && (thread->sched_flags & TH_SFLAG_RW_PROMOTED)) { - /* sched_flags checked without lock, but will be rechecked while clearing */ - lck_rw_clear_promotion(thread); - } +#if LOCK_PRETEST +failed: +#endif // LOCK_PRETEST + if (success) { + lck_grp_spin_update_held(lock LCK_GRP_ARG(grp)); } + return success; +} - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_DEADLINE_CODE) | DBG_FUNC_END, (int)res, 0, 0, 0, 0); +unsigned +int +(hw_lock_try)(hw_lock_t lock LCK_GRP_ARG(lck_grp_t *grp)) +{ + thread_t thread = current_thread(); + disable_preemption_for_thread(thread); + unsigned int success = hw_lock_try_internal(lock, thread LCK_GRP_ARG(grp)); + if (!success) { + enable_preemption(); + } + return success; +} - return res; +unsigned +int +(hw_lock_try_nopreempt)(hw_lock_t lock LCK_GRP_ARG(lck_grp_t *grp)) +{ + thread_t thread = current_thread(); + if (__improbable(!preemption_disabled_for_thread(thread))) { + panic("Attempt to test no-preempt spinlock %p in preemptible context", lock); + } + return hw_lock_try_internal(lock, thread LCK_GRP_ARG(grp)); } /* - * Routine: lck_mtx_lock_wait - * - * Invoked in order to wait on contention. + * Routine: hw_lock_unlock * - * Called with the interlock locked and - * returns it unlocked. + * Unconditionally release lock, release preemption level. 
*/ +static inline void +hw_lock_unlock_internal(hw_lock_t lock) +{ + os_atomic_store(&lock->lock_data, 0, release); +#if __arm__ || __arm64__ + // ARM tests are only for open-source exclusion + set_event(); +#endif // __arm__ || __arm64__ +#if CONFIG_DTRACE + LOCKSTAT_RECORD(LS_LCK_SPIN_UNLOCK_RELEASE, lock, 0); +#endif /* CONFIG_DTRACE */ +} + void -lck_mtx_lock_wait ( - lck_mtx_t *lck, - thread_t holder) -{ - thread_t self = current_thread(); - lck_mtx_t *mutex; - __kdebug_only uintptr_t trace_lck = VM_KERNEL_UNSLIDE_OR_PERM(lck); - __kdebug_only uintptr_t trace_holder = VM_KERNEL_UNSLIDE_OR_PERM(holder); - integer_t priority; - spl_t s = splsched(); -#if CONFIG_DTRACE - uint64_t sleep_start = 0; +(hw_lock_unlock)(hw_lock_t lock) +{ + hw_lock_unlock_internal(lock); + enable_preemption(); +} - if (lockstat_probemap[LS_LCK_MTX_LOCK_BLOCK] || lockstat_probemap[LS_LCK_MTX_EXT_LOCK_BLOCK]) { - sleep_start = mach_absolute_time(); +void +(hw_lock_unlock_nopreempt)(hw_lock_t lock) +{ + if (__improbable(!preemption_disabled_for_thread(current_thread()))) { + panic("Attempt to release no-preempt spinlock %p in preemptible context", lock); } -#endif + hw_lock_unlock_internal(lock); +} - if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) - mutex = lck; - else - mutex = &lck->lck_mtx_ptr->lck_mtx; +/* + * Routine hw_lock_held, doesn't change preemption state. + * N.B. Racy, of course. + */ +unsigned int +hw_lock_held(hw_lock_t lock) +{ + return ordered_load_hw(lock) != 0; +} - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_LCK_WAIT_CODE) | DBG_FUNC_START, trace_lck, trace_holder, 0, 0, 0); +#if __SMP__ +static unsigned int +hw_lock_bit_to_contended(hw_lock_bit_t *lock, uint32_t mask, uint32_t timeout LCK_GRP_ARG(lck_grp_t *grp)); +#endif - priority = self->sched_pri; - if (priority < self->base_pri) - priority = self->base_pri; - if (priority < BASEPRI_DEFAULT) - priority = BASEPRI_DEFAULT; +static inline unsigned int +hw_lock_bit_to_internal(hw_lock_bit_t *lock, unsigned int bit, uint32_t timeout LCK_GRP_ARG(lck_grp_t *grp)) +{ + unsigned int success = 0; + uint32_t mask = (1 << bit); +#if !__SMP__ + uint32_t state; +#endif - /* Do not promote past promotion ceiling */ - priority = MIN(priority, MAXPRI_PROMOTE); +#if __SMP__ + if (__improbable(!hw_atomic_test_and_set32(lock, mask, mask, memory_order_acquire, FALSE))) { + success = hw_lock_bit_to_contended(lock, mask, timeout LCK_GRP_ARG(grp)); + } else { + success = 1; + } +#else // __SMP__ + (void)timeout; + state = ordered_load_bit(lock); + if (!(mask & state)) { + ordered_store_bit(lock, state | mask); + success = 1; + } +#endif // __SMP__ - thread_lock(holder); - if (mutex->lck_mtx_pri == 0) - holder->promotions++; - holder->sched_flags |= TH_SFLAG_PROMOTED; - if (mutex->lck_mtx_pri < priority && holder->sched_pri < priority) { - KERNEL_DEBUG_CONSTANT( - MACHDBG_CODE(DBG_MACH_SCHED,MACH_PROMOTE) | DBG_FUNC_NONE, - holder->sched_pri, priority, trace_holder, trace_lck, 0); - set_sched_pri(holder, priority); + if (success) { + lck_grp_spin_update_held(lock LCK_GRP_ARG(grp)); } - thread_unlock(holder); - splx(s); - if (mutex->lck_mtx_pri < priority) - mutex->lck_mtx_pri = priority; - if (self->pending_promoter[self->pending_promoter_index] == NULL) { - self->pending_promoter[self->pending_promoter_index] = mutex; - mutex->lck_mtx_waiters++; + return success; +} + +unsigned +int +(hw_lock_bit_to)(hw_lock_bit_t * lock, unsigned int bit, uint32_t timeout LCK_GRP_ARG(lck_grp_t *grp)) +{ + _disable_preemption(); + return hw_lock_bit_to_internal(lock, bit, 
timeout LCK_GRP_ARG(grp)); +} + +#if __SMP__ +static unsigned int NOINLINE +hw_lock_bit_to_contended(hw_lock_bit_t *lock, uint32_t mask, uint32_t timeout LCK_GRP_ARG(lck_grp_t *grp)) +{ + uint64_t end = 0; + int i; +#if CONFIG_DTRACE || LOCK_STATS + uint64_t begin = 0; + boolean_t stat_enabled = lck_grp_spin_spin_enabled(lock LCK_GRP_ARG(grp)); +#endif /* CONFIG_DTRACE || LOCK_STATS */ + +#if LOCK_STATS || CONFIG_DTRACE + if (__improbable(stat_enabled)) { + begin = mach_absolute_time(); } - else - if (self->pending_promoter[self->pending_promoter_index] != mutex) { - self->pending_promoter[++self->pending_promoter_index] = mutex; - mutex->lck_mtx_waiters++; +#endif /* LOCK_STATS || CONFIG_DTRACE */ + for (;;) { + for (i = 0; i < LOCK_SNOOP_SPINS; i++) { + // Always load-exclusive before wfe + // This grabs the monitor and wakes up on a release event + if (hw_atomic_test_and_set32(lock, mask, mask, memory_order_acquire, TRUE)) { + goto end; + } + } + if (end == 0) { + end = ml_get_timebase() + timeout; + } else if (ml_get_timebase() >= end) { + break; + } } + return 0; +end: +#if CONFIG_DTRACE || LOCK_STATS + if (__improbable(stat_enabled)) { + lck_grp_spin_update_spin(lock LCK_GRP_ARG(grp), mach_absolute_time() - begin); + } + lck_grp_spin_update_miss(lock LCK_GRP_ARG(grp)); +#endif /* CONFIG_DTRACE || LCK_GRP_STAT */ - assert_wait(LCK_MTX_EVENT(mutex), THREAD_UNINT); - lck_mtx_ilk_unlock(mutex); - - thread_block(THREAD_CONTINUE_NULL); + return 1; +} +#endif // __SMP__ - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_LCK_WAIT_CODE) | DBG_FUNC_END, 0, 0, 0, 0, 0); -#if CONFIG_DTRACE - /* - * Record the Dtrace lockstat probe for blocking, block time - * measured from when we were entered. - */ - if (sleep_start) { - if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) { - LOCKSTAT_RECORD(LS_LCK_MTX_LOCK_BLOCK, lck, - mach_absolute_time() - sleep_start); - } else { - LOCKSTAT_RECORD(LS_LCK_MTX_EXT_LOCK_BLOCK, lck, - mach_absolute_time() - sleep_start); - } +void +(hw_lock_bit)(hw_lock_bit_t * lock, unsigned int bit LCK_GRP_ARG(lck_grp_t *grp)) +{ + if (hw_lock_bit_to(lock, bit, LOCK_PANIC_TIMEOUT, LCK_GRP_PROBEARG(grp))) { + return; } +#if __SMP__ + panic("hw_lock_bit(): timed out (%p)", lock); +#else + panic("hw_lock_bit(): interlock held (%p)", lock); #endif } -/* - * Routine: lck_mtx_lock_acquire - * - * Invoked on acquiring the mutex when there is - * contention. - * - * Returns the current number of waiters. - * - * Called with the interlock locked. 
- */ -int -lck_mtx_lock_acquire( - lck_mtx_t *lck) +void +(hw_lock_bit_nopreempt)(hw_lock_bit_t * lock, unsigned int bit LCK_GRP_ARG(lck_grp_t *grp)) { - thread_t thread = current_thread(); - lck_mtx_t *mutex; - integer_t priority; - spl_t s; - __kdebug_only uintptr_t trace_lck = VM_KERNEL_UNSLIDE_OR_PERM(lck); - - if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) - mutex = lck; - else - mutex = &lck->lck_mtx_ptr->lck_mtx; - - if (thread->pending_promoter[thread->pending_promoter_index] == mutex) { - thread->pending_promoter[thread->pending_promoter_index] = NULL; - if (thread->pending_promoter_index > 0) - thread->pending_promoter_index--; - mutex->lck_mtx_waiters--; - } - - if (mutex->lck_mtx_waiters) - priority = mutex->lck_mtx_pri; - else { - mutex->lck_mtx_pri = 0; - priority = 0; - } - - if (priority || thread->was_promoted_on_wakeup) { - s = splsched(); - thread_lock(thread); - - if (priority) { - thread->promotions++; - thread->sched_flags |= TH_SFLAG_PROMOTED; - if (thread->sched_pri < priority) { - KERNEL_DEBUG_CONSTANT( - MACHDBG_CODE(DBG_MACH_SCHED,MACH_PROMOTE) | DBG_FUNC_NONE, - thread->sched_pri, priority, 0, trace_lck, 0); - /* Do not promote past promotion ceiling */ - assert(priority <= MAXPRI_PROMOTE); - set_sched_pri(thread, priority); - } - } - if (thread->was_promoted_on_wakeup) { - thread->was_promoted_on_wakeup = 0; - if (thread->promotions == 0) - lck_mtx_clear_promoted(thread, trace_lck); - } - - thread_unlock(thread); - splx(s); + if (__improbable(get_preemption_level() == 0)) { + panic("Attempt to take no-preempt bitlock %p in preemptible context", lock); } - -#if CONFIG_DTRACE - if (lockstat_probemap[LS_LCK_MTX_LOCK_ACQUIRE] || lockstat_probemap[LS_LCK_MTX_EXT_LOCK_ACQUIRE]) { - if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) { - LOCKSTAT_RECORD(LS_LCK_MTX_LOCK_ACQUIRE, lck, 0); - } else { - LOCKSTAT_RECORD(LS_LCK_MTX_EXT_LOCK_ACQUIRE, lck, 0); - } + if (hw_lock_bit_to_internal(lock, bit, LOCK_PANIC_TIMEOUT LCK_GRP_ARG(grp))) { + return; } -#endif - return (mutex->lck_mtx_waiters); +#if __SMP__ + panic("hw_lock_bit_nopreempt(): timed out (%p)", lock); +#else + panic("hw_lock_bit_nopreempt(): interlock held (%p)", lock); +#endif } -/* - * Routine: lck_mtx_unlock_wakeup - * - * Invoked on unlock when there is contention. - * - * Called with the interlock locked. 
- */ -void -lck_mtx_unlock_wakeup ( - lck_mtx_t *lck, - thread_t holder) +unsigned +int +(hw_lock_bit_try)(hw_lock_bit_t * lock, unsigned int bit LCK_GRP_ARG(lck_grp_t *grp)) { - thread_t thread = current_thread(); - lck_mtx_t *mutex; - __kdebug_only uintptr_t trace_lck = VM_KERNEL_UNSLIDE_OR_PERM(lck); - - if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) - mutex = lck; - else - mutex = &lck->lck_mtx_ptr->lck_mtx; - - if (thread != holder) - panic("lck_mtx_unlock_wakeup: mutex %p holder %p\n", mutex, holder); - - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_UNLCK_WAKEUP_CODE) | DBG_FUNC_START, trace_lck, VM_KERNEL_UNSLIDE_OR_PERM(holder), 0, 0, 0); - - assert(mutex->lck_mtx_waiters > 0); - if (mutex->lck_mtx_waiters > 1) - thread_wakeup_one_with_pri(LCK_MTX_EVENT(lck), lck->lck_mtx_pri); - else - thread_wakeup_one(LCK_MTX_EVENT(lck)); + uint32_t mask = (1 << bit); +#if !__SMP__ + uint32_t state; +#endif + boolean_t success = FALSE; - if (thread->promotions > 0) { - spl_t s = splsched(); + _disable_preemption(); +#if __SMP__ + // TODO: consider weak (non-looping) atomic test-and-set + success = hw_atomic_test_and_set32(lock, mask, mask, memory_order_acquire, FALSE); +#else + state = ordered_load_bit(lock); + if (!(mask & state)) { + ordered_store_bit(lock, state | mask); + success = TRUE; + } +#endif // __SMP__ + if (!success) { + _enable_preemption(); + } - thread_lock(thread); - if (--thread->promotions == 0 && (thread->sched_flags & TH_SFLAG_PROMOTED)) - lck_mtx_clear_promoted(thread, trace_lck); - thread_unlock(thread); - splx(s); + if (success) { + lck_grp_spin_update_held(lock LCK_GRP_ARG(grp)); } - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_UNLCK_WAKEUP_CODE) | DBG_FUNC_END, 0, 0, 0, 0, 0); + return success; } -void -lck_mtx_unlockspin_wakeup ( - lck_mtx_t *lck) +static inline void +hw_unlock_bit_internal(hw_lock_bit_t *lock, unsigned int bit) { - assert(lck->lck_mtx_waiters > 0); - thread_wakeup_one(LCK_MTX_EVENT(lck)); + uint32_t mask = (1 << bit); +#if !__SMP__ + uint32_t state; +#endif - KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_UNLCK_WAKEUP_CODE) | DBG_FUNC_NONE, VM_KERNEL_UNSLIDE_OR_PERM(lck), 0, 0, 1, 0); +#if __SMP__ + os_atomic_andnot(lock, mask, release); +#if __arm__ + set_event(); +#endif +#else // __SMP__ + state = ordered_load_bit(lock); + ordered_store_bit(lock, state & ~mask); +#endif // __SMP__ #if CONFIG_DTRACE - /* - * When there are waiters, we skip the hot-patch spot in the - * fastpath, so we record it here. - */ - LOCKSTAT_RECORD(LS_LCK_MTX_UNLOCK_RELEASE, lck, 0); + LOCKSTAT_RECORD(LS_LCK_SPIN_UNLOCK_RELEASE, lock, bit); #endif } - /* - * Routine: mutex_pause + * Routine: hw_unlock_bit * - * Called by former callers of simple_lock_pause(). + * Release spin-lock. The second parameter is the bit number to test and set. + * Decrement the preemption level. 
*/ -#define MAX_COLLISION_COUNTS 32 -#define MAX_COLLISION 8 - -unsigned int max_collision_count[MAX_COLLISION_COUNTS]; - -uint32_t collision_backoffs[MAX_COLLISION] = { - 10, 50, 100, 200, 400, 600, 800, 1000 -}; - +void +hw_unlock_bit(hw_lock_bit_t * lock, unsigned int bit) +{ + hw_unlock_bit_internal(lock, bit); + _enable_preemption(); +} void -mutex_pause(uint32_t collisions) +hw_unlock_bit_nopreempt(hw_lock_bit_t * lock, unsigned int bit) { - wait_result_t wait_result; - uint32_t back_off; + if (__improbable(get_preemption_level() == 0)) { + panic("Attempt to release no-preempt bitlock %p in preemptible context", lock); + } + hw_unlock_bit_internal(lock, bit); +} - if (collisions >= MAX_COLLISION_COUNTS) - collisions = MAX_COLLISION_COUNTS - 1; - max_collision_count[collisions]++; +/* + * Routine: lck_spin_sleep + */ +wait_result_t +lck_spin_sleep_grp( + lck_spin_t *lck, + lck_sleep_action_t lck_sleep_action, + event_t event, + wait_interrupt_t interruptible, + lck_grp_t *grp) +{ + wait_result_t res; - if (collisions >= MAX_COLLISION) - collisions = MAX_COLLISION - 1; - back_off = collision_backoffs[collisions]; + if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) { + panic("Invalid lock sleep action %x\n", lck_sleep_action); + } - wait_result = assert_wait_timeout((event_t)mutex_pause, THREAD_UNINT, back_off, NSEC_PER_USEC); - assert(wait_result == THREAD_WAITING); + res = assert_wait(event, interruptible); + if (res == THREAD_WAITING) { + lck_spin_unlock(lck); + res = thread_block(THREAD_CONTINUE_NULL); + if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { + lck_spin_lock_grp(lck, grp); + } + } else if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + lck_spin_unlock(lck); + } - wait_result = thread_block(THREAD_CONTINUE_NULL); - assert(wait_result == THREAD_TIMED_OUT); + return res; } +wait_result_t +lck_spin_sleep( + lck_spin_t *lck, + lck_sleep_action_t lck_sleep_action, + event_t event, + wait_interrupt_t interruptible) +{ + return lck_spin_sleep_grp(lck, lck_sleep_action, event, interruptible, LCK_GRP_NULL); +} -unsigned int mutex_yield_wait = 0; -unsigned int mutex_yield_no_wait = 0; - -void -lck_mtx_yield( - lck_mtx_t *lck) +/* + * Routine: lck_spin_sleep_deadline + */ +wait_result_t +lck_spin_sleep_deadline( + lck_spin_t *lck, + lck_sleep_action_t lck_sleep_action, + event_t event, + wait_interrupt_t interruptible, + uint64_t deadline) { - int waiters; - -#if DEBUG - lck_mtx_assert(lck, LCK_MTX_ASSERT_OWNED); -#endif /* DEBUG */ - - if (lck->lck_mtx_tag == LCK_MTX_TAG_INDIRECT) - waiters = lck->lck_mtx_ptr->lck_mtx.lck_mtx_waiters; - else - waiters = lck->lck_mtx_waiters; - - if ( !waiters) { - mutex_yield_no_wait++; - } else { - mutex_yield_wait++; - lck_mtx_unlock(lck); - mutex_pause(0); - lck_mtx_lock(lck); + wait_result_t res; + + if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) { + panic("Invalid lock sleep action %x\n", lck_sleep_action); + } + + res = assert_wait_deadline(event, interruptible, deadline); + if (res == THREAD_WAITING) { + lck_spin_unlock(lck); + res = thread_block(THREAD_CONTINUE_NULL); + if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { + lck_spin_lock(lck); + } + } else if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + lck_spin_unlock(lck); } -} + return res; +} /* - * Routine: lck_rw_sleep + * Routine: lck_mtx_sleep */ wait_result_t -lck_rw_sleep( - lck_rw_t *lck, - lck_sleep_action_t lck_sleep_action, - event_t event, - wait_interrupt_t interruptible) +lck_mtx_sleep( + lck_mtx_t *lck, + lck_sleep_action_t lck_sleep_action, + event_t event, + wait_interrupt_t interruptible) { - 
wait_result_t res; - lck_rw_type_t lck_rw_type; - thread_t thread = current_thread(); + wait_result_t res; + thread_t thread = current_thread(); - if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_CODE) | DBG_FUNC_START, + VM_KERNEL_UNSLIDE_OR_PERM(lck), (int)lck_sleep_action, VM_KERNEL_UNSLIDE_OR_PERM(event), (int)interruptible, 0); + + if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) { panic("Invalid lock sleep action %x\n", lck_sleep_action); + } if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { /* - * Although we are dropping the RW lock, the intent in most cases - * is that this thread remains as an observer, since it may hold - * some secondary resource, but must yield to avoid deadlock. In - * this situation, make sure that the thread is boosted to the - * RW lock ceiling while blocked, so that it can re-acquire the - * RW lock at that priority. + * We overload the RW lock promotion to give us a priority ceiling + * during the time that this thread is asleep, so that when it + * is re-awakened (and not yet contending on the mutex), it is + * runnable at a reasonably high priority. */ thread->rwlock_count++; } res = assert_wait(event, interruptible); if (res == THREAD_WAITING) { - lck_rw_type = lck_rw_done(lck); + lck_mtx_unlock(lck); res = thread_block(THREAD_CONTINUE_NULL); if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { - if (!(lck_sleep_action & (LCK_SLEEP_SHARED|LCK_SLEEP_EXCLUSIVE))) - lck_rw_lock(lck, lck_rw_type); - else if (lck_sleep_action & LCK_SLEEP_EXCLUSIVE) - lck_rw_lock_exclusive(lck); - else - lck_rw_lock_shared(lck); + if ((lck_sleep_action & LCK_SLEEP_SPIN)) { + lck_mtx_lock_spin(lck); + } else if ((lck_sleep_action & LCK_SLEEP_SPIN_ALWAYS)) { + lck_mtx_lock_spin_always(lck); + } else { + lck_mtx_lock(lck); + } } + } else if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + lck_mtx_unlock(lck); } - else - if (lck_sleep_action & LCK_SLEEP_UNLOCK) - (void)lck_rw_done(lck); if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { if ((thread->rwlock_count-- == 1 /* field now 0 */) && (thread->sched_flags & TH_SFLAG_RW_PROMOTED)) { /* sched_flags checked without lock, but will be rechecked while clearing */ - - /* Only if the caller wanted the lck_rw_t returned unlocked should we drop to 0 */ - assert(lck_sleep_action & LCK_SLEEP_UNLOCK); - - lck_rw_clear_promotion(thread); + lck_rw_clear_promotion(thread, unslide_for_kdebug(event)); } } + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_CODE) | DBG_FUNC_END, (int)res, 0, 0, 0, 0); + return res; } /* - * Routine: lck_rw_sleep_deadline + * Routine: lck_mtx_sleep_deadline */ wait_result_t -lck_rw_sleep_deadline( - lck_rw_t *lck, - lck_sleep_action_t lck_sleep_action, - event_t event, - wait_interrupt_t interruptible, - uint64_t deadline) +lck_mtx_sleep_deadline( + lck_mtx_t *lck, + lck_sleep_action_t lck_sleep_action, + event_t event, + wait_interrupt_t interruptible, + uint64_t deadline) { wait_result_t res; - lck_rw_type_t lck_rw_type; - thread_t thread = current_thread(); + thread_t thread = current_thread(); + + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_DEADLINE_CODE) | DBG_FUNC_START, + VM_KERNEL_UNSLIDE_OR_PERM(lck), (int)lck_sleep_action, VM_KERNEL_UNSLIDE_OR_PERM(event), (int)interruptible, 0); - if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) + if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) { panic("Invalid lock sleep action %x\n", lck_sleep_action); + } if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { + /* + * See lck_mtx_sleep(). 
+ */ thread->rwlock_count++; } res = assert_wait_deadline(event, interruptible, deadline); if (res == THREAD_WAITING) { - lck_rw_type = lck_rw_done(lck); + lck_mtx_unlock(lck); res = thread_block(THREAD_CONTINUE_NULL); if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { - if (!(lck_sleep_action & (LCK_SLEEP_SHARED|LCK_SLEEP_EXCLUSIVE))) - lck_rw_lock(lck, lck_rw_type); - else if (lck_sleep_action & LCK_SLEEP_EXCLUSIVE) - lck_rw_lock_exclusive(lck); - else - lck_rw_lock_shared(lck); + if ((lck_sleep_action & LCK_SLEEP_SPIN)) { + lck_mtx_lock_spin(lck); + } else { + lck_mtx_lock(lck); + } } + } else if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + lck_mtx_unlock(lck); } - else - if (lck_sleep_action & LCK_SLEEP_UNLOCK) - (void)lck_rw_done(lck); if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { if ((thread->rwlock_count-- == 1 /* field now 0 */) && (thread->sched_flags & TH_SFLAG_RW_PROMOTED)) { /* sched_flags checked without lock, but will be rechecked while clearing */ - - /* Only if the caller wanted the lck_rw_t returned unlocked should we drop to 0 */ - assert(lck_sleep_action & LCK_SLEEP_UNLOCK); - - lck_rw_clear_promotion(thread); + lck_rw_clear_promotion(thread, unslide_for_kdebug(event)); } } + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_SLEEP_DEADLINE_CODE) | DBG_FUNC_END, (int)res, 0, 0, 0, 0); + return res; } /* - * Reader-writer lock promotion + * Lock Boosting Invariants: * - * We support a limited form of reader-writer - * lock promotion whose effects are: - * - * * Qualifying threads have decay disabled - * * Scheduler priority is reset to a floor of - * of their statically assigned priority - * or BASEPRI_BACKGROUND + * The lock owner is always promoted to the max priority of all its waiters. + * Max priority is capped at MAXPRI_PROMOTE. * - * The rationale is that lck_rw_ts do not have - * a single owner, so we cannot apply a directed - * priority boost from all waiting threads - * to all holding threads without maintaining - * lists of all shared owners and all waiting - * threads for every lock. + * The last waiter is not given a promotion when it wakes up or acquires the lock. + * When the last waiter is waking up, a new contender can always come in and + * steal the lock without having to wait for the last waiter to make forward progress. + */ + +/* + * Routine: lck_mtx_lock_wait * - * Instead (and to preserve the uncontended fast- - * path), acquiring (or attempting to acquire) - * a RW lock in shared or exclusive lock increments - * a per-thread counter. Only if that thread stops - * making forward progress (for instance blocking - * on a mutex, or being preempted) do we consult - * the counter and apply the priority floor. - * When the thread becomes runnable again (or in - * the case of preemption it never stopped being - * runnable), it has the priority boost and should - * be in a good position to run on the CPU and - * release all RW locks (at which point the priority - * boost is cleared). + * Invoked in order to wait on contention. * - * Care must be taken to ensure that priority - * boosts are not retained indefinitely, since unlike - * mutex priority boosts (where the boost is tied - * to the mutex lifecycle), the boost is tied - * to the thread and independent of any particular - * lck_rw_t. Assertions are in place on return - * to userspace so that the boost is not held - * indefinitely. + * Called with the interlock locked and + * returns it unlocked. 
* - * The routines that increment/decrement the - * per-thread counter should err on the side of - * incrementing any time a preemption is possible - * and the lock would be visible to the rest of the - * system as held (so it should be incremented before - * interlocks are dropped/preemption is enabled, or - * before a CAS is executed to acquire the lock). + * Always aggressively sets the owning thread to promoted, + * even if it's the same or higher priority + * This prevents it from lowering its own priority while holding a lock * + * TODO: Come up with a more efficient way to handle same-priority promotions + * ARM mutex contention logic could avoid taking the thread lock */ - -/* - * lck_rw_clear_promotion: Undo priority promotions when the last RW - * lock is released by a thread (if a promotion was active) - */ -void lck_rw_clear_promotion(thread_t thread) +void +lck_mtx_lock_wait( + lck_mtx_t *lck, + thread_t holder, + struct turnstile **ts) { - assert(thread->rwlock_count == 0); + thread_t thread = current_thread(); + lck_mtx_t *mutex; + __kdebug_only uintptr_t trace_lck = unslide_for_kdebug(lck); - /* Cancel any promotions if the thread had actually blocked while holding a RW lock */ - spl_t s = splsched(); - - thread_lock(thread); +#if CONFIG_DTRACE + uint64_t sleep_start = 0; + + if (lockstat_probemap[LS_LCK_MTX_LOCK_BLOCK] || lockstat_probemap[LS_LCK_MTX_EXT_LOCK_BLOCK]) { + sleep_start = mach_absolute_time(); + } +#endif + + if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) { + mutex = lck; + } else { + mutex = &lck->lck_mtx_ptr->lck_mtx; + } + + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_LCK_WAIT_CODE) | DBG_FUNC_START, + trace_lck, (uintptr_t)thread_tid(thread), 0, 0, 0); + + assert(thread->waiting_for_mutex == NULL); + thread->waiting_for_mutex = mutex; + mutex->lck_mtx_waiters++; + + if (*ts == NULL) { + *ts = turnstile_prepare((uintptr_t)mutex, NULL, TURNSTILE_NULL, TURNSTILE_KERNEL_MUTEX); + } + + struct turnstile *turnstile = *ts; + thread_set_pending_block_hint(thread, kThreadWaitKernelMutex); + turnstile_update_inheritor(turnstile, holder, (TURNSTILE_DELAYED_UPDATE | TURNSTILE_INHERITOR_THREAD)); + + waitq_assert_wait64(&turnstile->ts_waitq, CAST_EVENT64_T(LCK_MTX_EVENT(mutex)), THREAD_UNINT | THREAD_WAIT_NOREPORT_USER, TIMEOUT_WAIT_FOREVER); + + lck_mtx_ilk_unlock(mutex); + + turnstile_update_inheritor_complete(turnstile, TURNSTILE_INTERLOCK_NOT_HELD); + + thread_block(THREAD_CONTINUE_NULL); + + thread->waiting_for_mutex = NULL; + + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_LCK_WAIT_CODE) | DBG_FUNC_END, 0, 0, 0, 0, 0); +#if CONFIG_DTRACE + /* + * Record the DTrace lockstat probe for blocking, block time + * measured from when we were entered. + */ + if (sleep_start) { + if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) { + LOCKSTAT_RECORD(LS_LCK_MTX_LOCK_BLOCK, lck, + mach_absolute_time() - sleep_start); + } else { + LOCKSTAT_RECORD(LS_LCK_MTX_EXT_LOCK_BLOCK, lck, + mach_absolute_time() - sleep_start); + } + } +#endif +} + +/* + * Routine: lck_mtx_lock_acquire + * + * Invoked on acquiring the mutex when there is + * contention. + * + * Returns the current number of waiters. + * + * Called with the interlock locked. 
+ */ +int +lck_mtx_lock_acquire( + lck_mtx_t *lck, + struct turnstile *ts) +{ + thread_t thread = current_thread(); + lck_mtx_t *mutex; + + if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) { + mutex = lck; + } else { + mutex = &lck->lck_mtx_ptr->lck_mtx; + } + + assert(thread->waiting_for_mutex == NULL); + + if (mutex->lck_mtx_waiters > 0) { + if (ts == NULL) { + ts = turnstile_prepare((uintptr_t)mutex, NULL, TURNSTILE_NULL, TURNSTILE_KERNEL_MUTEX); + } + + turnstile_update_inheritor(ts, thread, (TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_THREAD)); + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_HELD); + } + + if (ts != NULL) { + turnstile_complete((uintptr_t)mutex, NULL, NULL, TURNSTILE_KERNEL_MUTEX); + } + + return mutex->lck_mtx_waiters; +} + +/* + * Routine: lck_mtx_unlock_wakeup + * + * Invoked on unlock when there is contention. + * + * Called with the interlock locked. + * + * NOTE: callers should call turnstile_clenup after + * dropping the interlock. + */ +boolean_t +lck_mtx_unlock_wakeup( + lck_mtx_t *lck, + thread_t holder) +{ + thread_t thread = current_thread(); + lck_mtx_t *mutex; + __kdebug_only uintptr_t trace_lck = unslide_for_kdebug(lck); + struct turnstile *ts; + kern_return_t did_wake; + + if (lck->lck_mtx_tag != LCK_MTX_TAG_INDIRECT) { + mutex = lck; + } else { + mutex = &lck->lck_mtx_ptr->lck_mtx; + } + + if (thread != holder) { + panic("lck_mtx_unlock_wakeup: mutex %p holder %p\n", mutex, holder); + } + + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_UNLCK_WAKEUP_CODE) | DBG_FUNC_START, + trace_lck, (uintptr_t)thread_tid(thread), 0, 0, 0); + + assert(mutex->lck_mtx_waiters > 0); + assert(thread->waiting_for_mutex == NULL); + + ts = turnstile_prepare((uintptr_t)mutex, NULL, TURNSTILE_NULL, TURNSTILE_KERNEL_MUTEX); + + if (mutex->lck_mtx_waiters > 1) { + /* WAITQ_PROMOTE_ON_WAKE will call turnstile_update_inheritor on the wokenup thread */ + did_wake = waitq_wakeup64_one(&ts->ts_waitq, CAST_EVENT64_T(LCK_MTX_EVENT(mutex)), THREAD_AWAKENED, WAITQ_PROMOTE_ON_WAKE); + } else { + did_wake = waitq_wakeup64_one(&ts->ts_waitq, CAST_EVENT64_T(LCK_MTX_EVENT(mutex)), THREAD_AWAKENED, WAITQ_ALL_PRIORITIES); + turnstile_update_inheritor(ts, NULL, TURNSTILE_IMMEDIATE_UPDATE); + } + assert(did_wake == KERN_SUCCESS); + + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_HELD); + turnstile_complete((uintptr_t)mutex, NULL, NULL, TURNSTILE_KERNEL_MUTEX); + + mutex->lck_mtx_waiters--; + + KERNEL_DEBUG(MACHDBG_CODE(DBG_MACH_LOCKS, LCK_MTX_UNLCK_WAKEUP_CODE) | DBG_FUNC_END, 0, 0, 0, 0, 0); + + return mutex->lck_mtx_waiters > 0; +} + +/* + * Routine: mutex_pause + * + * Called by former callers of simple_lock_pause(). 
+ */ +#define MAX_COLLISION_COUNTS 32 +#define MAX_COLLISION 8 + +unsigned int max_collision_count[MAX_COLLISION_COUNTS]; + +uint32_t collision_backoffs[MAX_COLLISION] = { + 10, 50, 100, 200, 400, 600, 800, 1000 +}; + + +void +mutex_pause(uint32_t collisions) +{ + wait_result_t wait_result; + uint32_t back_off; + + if (collisions >= MAX_COLLISION_COUNTS) { + collisions = MAX_COLLISION_COUNTS - 1; + } + max_collision_count[collisions]++; + + if (collisions >= MAX_COLLISION) { + collisions = MAX_COLLISION - 1; + } + back_off = collision_backoffs[collisions]; + + wait_result = assert_wait_timeout((event_t)mutex_pause, THREAD_UNINT, back_off, NSEC_PER_USEC); + assert(wait_result == THREAD_WAITING); + + wait_result = thread_block(THREAD_CONTINUE_NULL); + assert(wait_result == THREAD_TIMED_OUT); +} + + +unsigned int mutex_yield_wait = 0; +unsigned int mutex_yield_no_wait = 0; + +void +lck_mtx_yield( + lck_mtx_t *lck) +{ + int waiters; + +#if DEBUG + lck_mtx_assert(lck, LCK_MTX_ASSERT_OWNED); +#endif /* DEBUG */ + + if (lck->lck_mtx_tag == LCK_MTX_TAG_INDIRECT) { + waiters = lck->lck_mtx_ptr->lck_mtx.lck_mtx_waiters; + } else { + waiters = lck->lck_mtx_waiters; + } + + if (!waiters) { + mutex_yield_no_wait++; + } else { + mutex_yield_wait++; + lck_mtx_unlock(lck); + mutex_pause(0); + lck_mtx_lock(lck); + } +} + + +/* + * Routine: lck_rw_sleep + */ +wait_result_t +lck_rw_sleep( + lck_rw_t *lck, + lck_sleep_action_t lck_sleep_action, + event_t event, + wait_interrupt_t interruptible) +{ + wait_result_t res; + lck_rw_type_t lck_rw_type; + thread_t thread = current_thread(); + + if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) { + panic("Invalid lock sleep action %x\n", lck_sleep_action); + } + + if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { + /* + * Although we are dropping the RW lock, the intent in most cases + * is that this thread remains as an observer, since it may hold + * some secondary resource, but must yield to avoid deadlock. In + * this situation, make sure that the thread is boosted to the + * RW lock ceiling while blocked, so that it can re-acquire the + * RW lock at that priority. 
+ */ + thread->rwlock_count++; + } + + res = assert_wait(event, interruptible); + if (res == THREAD_WAITING) { + lck_rw_type = lck_rw_done(lck); + res = thread_block(THREAD_CONTINUE_NULL); + if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { + if (!(lck_sleep_action & (LCK_SLEEP_SHARED | LCK_SLEEP_EXCLUSIVE))) { + lck_rw_lock(lck, lck_rw_type); + } else if (lck_sleep_action & LCK_SLEEP_EXCLUSIVE) { + lck_rw_lock_exclusive(lck); + } else { + lck_rw_lock_shared(lck); + } + } + } else if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + (void)lck_rw_done(lck); + } + + if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { + if ((thread->rwlock_count-- == 1 /* field now 0 */) && (thread->sched_flags & TH_SFLAG_RW_PROMOTED)) { + /* sched_flags checked without lock, but will be rechecked while clearing */ + + /* Only if the caller wanted the lck_rw_t returned unlocked should we drop to 0 */ + assert(lck_sleep_action & LCK_SLEEP_UNLOCK); + + lck_rw_clear_promotion(thread, unslide_for_kdebug(event)); + } + } + + return res; +} + + +/* + * Routine: lck_rw_sleep_deadline + */ +wait_result_t +lck_rw_sleep_deadline( + lck_rw_t *lck, + lck_sleep_action_t lck_sleep_action, + event_t event, + wait_interrupt_t interruptible, + uint64_t deadline) +{ + wait_result_t res; + lck_rw_type_t lck_rw_type; + thread_t thread = current_thread(); + + if ((lck_sleep_action & ~LCK_SLEEP_MASK) != 0) { + panic("Invalid lock sleep action %x\n", lck_sleep_action); + } + + if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { + thread->rwlock_count++; + } + + res = assert_wait_deadline(event, interruptible, deadline); + if (res == THREAD_WAITING) { + lck_rw_type = lck_rw_done(lck); + res = thread_block(THREAD_CONTINUE_NULL); + if (!(lck_sleep_action & LCK_SLEEP_UNLOCK)) { + if (!(lck_sleep_action & (LCK_SLEEP_SHARED | LCK_SLEEP_EXCLUSIVE))) { + lck_rw_lock(lck, lck_rw_type); + } else if (lck_sleep_action & LCK_SLEEP_EXCLUSIVE) { + lck_rw_lock_exclusive(lck); + } else { + lck_rw_lock_shared(lck); + } + } + } else if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + (void)lck_rw_done(lck); + } + + if (lck_sleep_action & LCK_SLEEP_PROMOTED_PRI) { + if ((thread->rwlock_count-- == 1 /* field now 0 */) && (thread->sched_flags & TH_SFLAG_RW_PROMOTED)) { + /* sched_flags checked without lock, but will be rechecked while clearing */ + + /* Only if the caller wanted the lck_rw_t returned unlocked should we drop to 0 */ + assert(lck_sleep_action & LCK_SLEEP_UNLOCK); + + lck_rw_clear_promotion(thread, unslide_for_kdebug(event)); + } + } + + return res; +} + +/* + * Reader-writer lock promotion + * + * We support a limited form of reader-writer + * lock promotion whose effects are: + * + * * Qualifying threads have decay disabled + * * Scheduler priority is reset to a floor of + * of their statically assigned priority + * or MINPRI_RWLOCK + * + * The rationale is that lck_rw_ts do not have + * a single owner, so we cannot apply a directed + * priority boost from all waiting threads + * to all holding threads without maintaining + * lists of all shared owners and all waiting + * threads for every lock. + * + * Instead (and to preserve the uncontended fast- + * path), acquiring (or attempting to acquire) + * a RW lock in shared or exclusive lock increments + * a per-thread counter. Only if that thread stops + * making forward progress (for instance blocking + * on a mutex, or being preempted) do we consult + * the counter and apply the priority floor. 
+ * When the thread becomes runnable again (or in + * the case of preemption it never stopped being + * runnable), it has the priority boost and should + * be in a good position to run on the CPU and + * release all RW locks (at which point the priority + * boost is cleared). + * + * Care must be taken to ensure that priority + * boosts are not retained indefinitely, since unlike + * mutex priority boosts (where the boost is tied + * to the mutex lifecycle), the boost is tied + * to the thread and independent of any particular + * lck_rw_t. Assertions are in place on return + * to userspace so that the boost is not held + * indefinitely. + * + * The routines that increment/decrement the + * per-thread counter should err on the side of + * incrementing any time a preemption is possible + * and the lock would be visible to the rest of the + * system as held (so it should be incremented before + * interlocks are dropped/preemption is enabled, or + * before a CAS is executed to acquire the lock). + * + */ + +/* + * lck_rw_clear_promotion: Undo priority promotions when the last RW + * lock is released by a thread (if a promotion was active) + */ +void +lck_rw_clear_promotion(thread_t thread, uintptr_t trace_obj) +{ + assert(thread->rwlock_count == 0); + + /* Cancel any promotions if the thread had actually blocked while holding a RW lock */ + spl_t s = splsched(); + thread_lock(thread); if (thread->sched_flags & TH_SFLAG_RW_PROMOTED) { - thread->sched_flags &= ~TH_SFLAG_RW_PROMOTED; - - if (thread->sched_flags & TH_SFLAG_PROMOTED) { - /* Thread still has a mutex promotion */ - } else if (thread->sched_flags & TH_SFLAG_DEPRESSED_MASK) { - KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED, MACH_RW_DEMOTE) | DBG_FUNC_NONE, - thread->sched_pri, DEPRESSPRI, 0, 0, 0); - - set_sched_pri(thread, DEPRESSPRI); + sched_thread_unpromote_reason(thread, TH_SFLAG_RW_PROMOTED, trace_obj); + } + + thread_unlock(thread); + splx(s); +} + +/* + * Callout from context switch if the thread goes + * off core with a positive rwlock_count + * + * Called at splsched with the thread locked + */ +void +lck_rw_set_promotion_locked(thread_t thread) +{ + if (LcksOpts & disLkRWPrio) { + return; + } + + assert(thread->rwlock_count > 0); + + if (!(thread->sched_flags & TH_SFLAG_RW_PROMOTED)) { + sched_thread_promote_reason(thread, TH_SFLAG_RW_PROMOTED, 0); + } +} + +kern_return_t +host_lockgroup_info( + host_t host, + lockgroup_info_array_t *lockgroup_infop, + mach_msg_type_number_t *lockgroup_infoCntp) +{ + lockgroup_info_t *lockgroup_info_base; + lockgroup_info_t *lockgroup_info; + vm_offset_t lockgroup_info_addr; + vm_size_t lockgroup_info_size; + vm_size_t lockgroup_info_vmsize; + lck_grp_t *lck_grp; + unsigned int i; + vm_map_copy_t copy; + kern_return_t kr; + + if (host == HOST_NULL) { + return KERN_INVALID_HOST; + } + + lck_mtx_lock(&lck_grp_lock); + + lockgroup_info_size = lck_grp_cnt * sizeof(*lockgroup_info); + lockgroup_info_vmsize = round_page(lockgroup_info_size); + kr = kmem_alloc_pageable(ipc_kernel_map, + &lockgroup_info_addr, lockgroup_info_vmsize, VM_KERN_MEMORY_IPC); + if (kr != KERN_SUCCESS) { + lck_mtx_unlock(&lck_grp_lock); + return kr; + } + + lockgroup_info_base = (lockgroup_info_t *) lockgroup_info_addr; + lck_grp = (lck_grp_t *)queue_first(&lck_grp_queue); + lockgroup_info = lockgroup_info_base; + + for (i = 0; i < lck_grp_cnt; i++) { + lockgroup_info->lock_spin_cnt = lck_grp->lck_grp_spincnt; + lockgroup_info->lock_rw_cnt = lck_grp->lck_grp_rwcnt; + lockgroup_info->lock_mtx_cnt = 
lck_grp->lck_grp_mtxcnt;
+
+#if LOCK_STATS
+ lockgroup_info->lock_spin_held_cnt = lck_grp->lck_grp_stats.lgss_spin_held.lgs_count;
+ lockgroup_info->lock_spin_miss_cnt = lck_grp->lck_grp_stats.lgss_spin_miss.lgs_count;
+#endif /* LOCK_STATS */
+
+ // Historically on x86, held was used for "direct wait" and util for "held"
+ lockgroup_info->lock_mtx_util_cnt = lck_grp->lck_grp_stats.lgss_mtx_held.lgs_count;
+ lockgroup_info->lock_mtx_held_cnt = lck_grp->lck_grp_stats.lgss_mtx_direct_wait.lgs_count;
+ lockgroup_info->lock_mtx_miss_cnt = lck_grp->lck_grp_stats.lgss_mtx_miss.lgs_count;
+ lockgroup_info->lock_mtx_wait_cnt = lck_grp->lck_grp_stats.lgss_mtx_wait.lgs_count;
+
+ (void) strncpy(lockgroup_info->lockgroup_name, lck_grp->lck_grp_name, LOCKGROUP_MAX_NAME);
+
+ lck_grp = (lck_grp_t *)(queue_next((queue_entry_t)(lck_grp)));
+ lockgroup_info++;
+ }
+
+ *lockgroup_infoCntp = lck_grp_cnt;
+ lck_mtx_unlock(&lck_grp_lock);
+
+ if (lockgroup_info_size != lockgroup_info_vmsize) {
+ bzero((char *)lockgroup_info, lockgroup_info_vmsize - lockgroup_info_size);
+ }
+
+ kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)lockgroup_info_addr,
+ (vm_map_size_t)lockgroup_info_size, TRUE, &copy);
+ assert(kr == KERN_SUCCESS);
+
+ *lockgroup_infop = (lockgroup_info_t *) copy;
+
+ return KERN_SUCCESS;
+}
+
+/*
+ * sleep_with_inheritor and wakeup_with_inheritor KPI
+ *
+ * Functions that allow sleeping on an event and using a turnstile to propagate the priority of the sleeping threads to
+ * the latest thread specified as inheritor.
+ *
+ * Inheritor management is delegated to the caller: the caller needs to store a thread identifier to provide to these functions to specify upon whom to
+ * direct the push. The inheritor cannot run in user space while holding a push from an event. Therefore it is the caller's responsibility to call
+ * wakeup_with_inheritor from the inheritor before it runs in userspace, or to specify another inheritor before letting the old inheritor run in userspace.
+ *
+ * sleep_with_inheritor requires holding a locking primitive while invoked, but wakeup_with_inheritor and change_sleep_inheritor don't require it.
+ *
+ * Turnstiles require a non-blocking primitive as interlock to synchronize the turnstile data structure manipulation, therefore sleep_with_inheritor, change_sleep_inheritor and
+ * wakeup_with_inheritor will require the same interlock to manipulate turnstiles.
+ * If sleep_with_inheritor is associated with a locking primitive that can block (like lck_mtx_t or lck_rw_t), a handoff to a non-blocking primitive is required before
+ * invoking any turnstile operation.
+ *
+ * All functions will save the turnstile associated with the event on the turnstile kernel hash table and will use the turnstile kernel hash table bucket
+ * spinlock as the turnstile interlock. Because we do not want to keep interrupts disabled while holding the bucket interlock, a new turnstile kernel hash table
+ * is instantiated for this KPI to manage the hash without interrupts disabled.
+ * Also:
+ * - all events on the system that hash on the same bucket will contend on the same spinlock.
+ * - every event will have a dedicated wait_queue.
+ *
+ * Different locking primitives can be associated with sleep_with_inheritor as long as the primitive_lock() and primitive_unlock() functions are provided to
+ * sleep_with_inheritor_turnstile to perform the handoff with the bucket spinlock.
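+ *
+ * Illustrative usage sketch (object, field and thread names are hypothetical;
+ * TIMEOUT_WAIT_FOREVER means no deadline):
+ *
+ *   // Waiter: obj->owner currently holds the resource, push our priority to it.
+ *   lck_mtx_lock(&obj->lock);
+ *   while (obj->busy) {
+ *       lck_mtx_sleep_with_inheritor(&obj->lock, LCK_SLEEP_DEFAULT,
+ *           (event_t) obj, obj->owner, THREAD_UNINT, TIMEOUT_WAIT_FOREVER);
+ *   }
+ *   obj->busy = TRUE;
+ *   obj->owner = current_thread();
+ *   lck_mtx_unlock(&obj->lock);
+ *
+ *   // Owner, when done: wake one waiter and transfer the push to it.
+ *   lck_mtx_lock(&obj->lock);
+ *   obj->busy = FALSE;
+ *   obj->owner = THREAD_NULL;
+ *   wakeup_one_with_inheritor((event_t) obj, THREAD_AWAKENED,
+ *       LCK_WAKE_DEFAULT, NULL);
+ *   lck_mtx_unlock(&obj->lock);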
+ */ + +kern_return_t +wakeup_with_inheritor_and_turnstile_type(event_t event, turnstile_type_t type, wait_result_t result, bool wake_one, lck_wake_action_t action, thread_t *thread_wokenup) +{ + uint32_t index; + struct turnstile *ts = NULL; + kern_return_t ret = KERN_NOT_WAITING; + int priority; + thread_t wokeup; + + /* + * the hash bucket spinlock is used as turnstile interlock + */ + turnstile_hash_bucket_lock((uintptr_t)event, &index, type); + + ts = turnstile_prepare((uintptr_t)event, NULL, TURNSTILE_NULL, type); + + if (wake_one) { + if (action == LCK_WAKE_DEFAULT) { + priority = WAITQ_PROMOTE_ON_WAKE; + } else { + assert(action == LCK_WAKE_DO_NOT_TRANSFER_PUSH); + priority = WAITQ_ALL_PRIORITIES; + } + + /* + * WAITQ_PROMOTE_ON_WAKE will call turnstile_update_inheritor + * if it finds a thread + */ + wokeup = waitq_wakeup64_identify(&ts->ts_waitq, CAST_EVENT64_T(event), result, priority); + if (wokeup != NULL) { + if (thread_wokenup != NULL) { + *thread_wokenup = wokeup; + } else { + thread_deallocate_safe(wokeup); + } + ret = KERN_SUCCESS; + if (action == LCK_WAKE_DO_NOT_TRANSFER_PUSH) { + goto complete; + } + } else { + if (thread_wokenup != NULL) { + *thread_wokenup = NULL; + } + turnstile_update_inheritor(ts, TURNSTILE_INHERITOR_NULL, TURNSTILE_IMMEDIATE_UPDATE); + ret = KERN_NOT_WAITING; + } + } else { + ret = waitq_wakeup64_all(&ts->ts_waitq, CAST_EVENT64_T(event), result, WAITQ_ALL_PRIORITIES); + turnstile_update_inheritor(ts, TURNSTILE_INHERITOR_NULL, TURNSTILE_IMMEDIATE_UPDATE); + } + + /* + * turnstile_update_inheritor_complete could be called while holding the interlock. + * In this case the new inheritor or is null, or is a thread that is just been woken up + * and have not blocked because it is racing with the same interlock used here + * after the wait. + * So there is no chain to update for the new inheritor. + * + * However unless the current thread is the old inheritor, + * old inheritor can be blocked and requires a chain update. + * + * The chain should be short because kernel turnstiles cannot have user turnstiles + * chained after them. + * + * We can anyway optimize this by asking turnstile to tell us + * if old inheritor needs an update and drop the lock + * just in that case. + */ + turnstile_hash_bucket_unlock((uintptr_t)NULL, &index, type, 0); + + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_NOT_HELD); + + turnstile_hash_bucket_lock((uintptr_t)NULL, &index, type); + +complete: + turnstile_complete((uintptr_t)event, NULL, NULL, type); + + turnstile_hash_bucket_unlock((uintptr_t)NULL, &index, type, 0); + + turnstile_cleanup(); + + return ret; +} + +static wait_result_t +sleep_with_inheritor_and_turnstile_type(event_t event, + thread_t inheritor, + wait_interrupt_t interruptible, + uint64_t deadline, + turnstile_type_t type, + void (^primitive_lock)(void), + void (^primitive_unlock)(void)) +{ + wait_result_t ret; + uint32_t index; + struct turnstile *ts = NULL; + + /* + * the hash bucket spinlock is used as turnstile interlock, + * lock it before releasing the primitive lock + */ + turnstile_hash_bucket_lock((uintptr_t)event, &index, type); + + primitive_unlock(); + + ts = turnstile_prepare((uintptr_t)event, NULL, TURNSTILE_NULL, type); + + thread_set_pending_block_hint(current_thread(), kThreadWaitSleepWithInheritor); + /* + * We need TURNSTILE_DELAYED_UPDATE because we will call + * waitq_assert_wait64 after. 
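+ * The actual priority propagation is performed by the
+ * turnstile_update_inheritor_complete() call below, once the hash bucket
+ * spinlock has been dropped.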
+ */ + turnstile_update_inheritor(ts, inheritor, (TURNSTILE_DELAYED_UPDATE | TURNSTILE_INHERITOR_THREAD)); + + ret = waitq_assert_wait64(&ts->ts_waitq, CAST_EVENT64_T(event), interruptible, deadline); + + turnstile_hash_bucket_unlock((uintptr_t)NULL, &index, type, 0); + + /* + * Update new and old inheritor chains outside the interlock; + */ + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_NOT_HELD); + + if (ret == THREAD_WAITING) { + ret = thread_block(THREAD_CONTINUE_NULL); + } + + turnstile_hash_bucket_lock((uintptr_t)NULL, &index, type); + + turnstile_complete((uintptr_t)event, NULL, NULL, type); + + turnstile_hash_bucket_unlock((uintptr_t)NULL, &index, type, 0); + + turnstile_cleanup(); + + primitive_lock(); + + return ret; +} + +kern_return_t +change_sleep_inheritor_and_turnstile_type(event_t event, + thread_t inheritor, + turnstile_type_t type) +{ + uint32_t index; + struct turnstile *ts = NULL; + kern_return_t ret = KERN_SUCCESS; + /* + * the hash bucket spinlock is used as turnstile interlock + */ + turnstile_hash_bucket_lock((uintptr_t)event, &index, type); + + ts = turnstile_prepare((uintptr_t)event, NULL, TURNSTILE_NULL, type); + + if (!turnstile_has_waiters(ts)) { + ret = KERN_NOT_WAITING; + } + + /* + * We will not call an assert_wait later so use TURNSTILE_IMMEDIATE_UPDATE + */ + turnstile_update_inheritor(ts, inheritor, (TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_THREAD)); + + turnstile_hash_bucket_unlock((uintptr_t)NULL, &index, type, 0); + + /* + * update the chains outside the interlock + */ + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_NOT_HELD); + + turnstile_hash_bucket_lock((uintptr_t)NULL, &index, type); + + turnstile_complete((uintptr_t)event, NULL, NULL, type); + + turnstile_hash_bucket_unlock((uintptr_t)NULL, &index, type, 0); + + turnstile_cleanup(); + + return ret; +} + +typedef void (^void_block_void)(void); + +/* + * sleep_with_inheritor functions with lck_mtx_t as locking primitive. + */ + +wait_result_t +lck_mtx_sleep_with_inheritor_and_turnstile_type(lck_mtx_t *lock, lck_sleep_action_t lck_sleep_action, event_t event, thread_t inheritor, wait_interrupt_t interruptible, uint64_t deadline, turnstile_type_t type) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); + + if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{;}, + ^{lck_mtx_unlock(lock);}); + } else if (lck_sleep_action & LCK_SLEEP_SPIN) { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{lck_mtx_lock_spin(lock);}, + ^{lck_mtx_unlock(lock);}); + } else if (lck_sleep_action & LCK_SLEEP_SPIN_ALWAYS) { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{lck_mtx_lock_spin_always(lock);}, + ^{lck_mtx_unlock(lock);}); + } else { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{lck_mtx_lock(lock);}, + ^{lck_mtx_unlock(lock);}); + } +} + +/* + * Name: lck_spin_sleep_with_inheritor + * + * Description: deschedule the current thread and wait on the waitq associated with event to be woken up. + * While waiting, the sched priority of the waiting thread will contribute to the push of the event that will + * be directed to the inheritor specified. + * An interruptible mode and deadline can be specified to return earlier from the wait. + * + * Args: + * Arg1: lck_spin_t lock used to protect the sleep. 
The lock will be dropped while sleeping and reacquired before returning according to the sleep action specified.
+ * Arg2: sleep action. LCK_SLEEP_DEFAULT, LCK_SLEEP_UNLOCK.
+ * Arg3: event to wait on.
+ * Arg4: thread to propagate the event push to.
+ * Arg5: interruptible flag for wait.
+ * Arg6: deadline for wait.
+ *
+ * Conditions: Lock must be held. Returns with the lock held according to the sleep action specified.
+ * Lock will be dropped while waiting.
+ * The inheritor specified cannot run in user space until another inheritor is specified for the event or a
+ * wakeup for the event is called.
+ *
+ * Returns: result of the wait.
+ */
+wait_result_t
+lck_spin_sleep_with_inheritor(
+ lck_spin_t *lock,
+ lck_sleep_action_t lck_sleep_action,
+ event_t event,
+ thread_t inheritor,
+ wait_interrupt_t interruptible,
+ uint64_t deadline)
+{
+ if (lck_sleep_action & LCK_SLEEP_UNLOCK) {
+ return sleep_with_inheritor_and_turnstile_type(event, inheritor,
+ interruptible, deadline, TURNSTILE_SLEEP_INHERITOR,
+ ^{}, ^{ lck_spin_unlock(lock); });
+ } else {
+ return sleep_with_inheritor_and_turnstile_type(event, inheritor,
+ interruptible, deadline, TURNSTILE_SLEEP_INHERITOR,
+ ^{ lck_spin_lock(lock); }, ^{ lck_spin_unlock(lock); });
+ }
+}
+
+/*
+ * Name: lck_mtx_sleep_with_inheritor
+ *
+ * Description: deschedule the current thread and wait on the waitq associated with event to be woken up.
+ * While waiting, the sched priority of the waiting thread will contribute to the push of the event that will
+ * be directed to the inheritor specified.
+ * An interruptible mode and deadline can be specified to return earlier from the wait.
+ *
+ * Args:
+ * Arg1: lck_mtx_t lock used to protect the sleep. The lock will be dropped while sleeping and reacquired before returning according to the sleep action specified.
+ * Arg2: sleep action. LCK_SLEEP_DEFAULT, LCK_SLEEP_UNLOCK, LCK_SLEEP_SPIN, LCK_SLEEP_SPIN_ALWAYS.
+ * Arg3: event to wait on.
+ * Arg4: thread to propagate the event push to.
+ * Arg5: interruptible flag for wait.
+ * Arg6: deadline for wait.
+ *
+ * Conditions: Lock must be held. Returns with the lock held according to the sleep action specified.
+ * Lock will be dropped while waiting.
+ * The inheritor specified cannot run in user space until another inheritor is specified for the event or a
+ * wakeup for the event is called.
+ *
+ * Returns: result of the wait.
+ */
+wait_result_t
+lck_mtx_sleep_with_inheritor(lck_mtx_t *lock, lck_sleep_action_t lck_sleep_action, event_t event, thread_t inheritor, wait_interrupt_t interruptible, uint64_t deadline)
+{
+ return lck_mtx_sleep_with_inheritor_and_turnstile_type(lock, lck_sleep_action, event, inheritor, interruptible, deadline, TURNSTILE_SLEEP_INHERITOR);
+}
+
+/*
+ * sleep_with_inheritor functions with lck_rw_t as locking primitive.
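+ *
+ * With LCK_SLEEP_DEFAULT the lock is re-taken in the mode it was held before
+ * the wait (as reported by lck_rw_done()); LCK_SLEEP_SHARED or
+ * LCK_SLEEP_EXCLUSIVE force the re-acquisition mode. Illustrative call
+ * (hypothetical names):
+ *
+ *   lck_rw_sleep_with_inheritor(&obj->rw_lock, LCK_SLEEP_SHARED,
+ *       (event_t) obj, obj->owner, THREAD_UNINT, TIMEOUT_WAIT_FOREVER);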
+ */ + +wait_result_t +lck_rw_sleep_with_inheritor_and_turnstile_type(lck_rw_t *lock, lck_sleep_action_t lck_sleep_action, event_t event, thread_t inheritor, wait_interrupt_t interruptible, uint64_t deadline, turnstile_type_t type) +{ + __block lck_rw_type_t lck_rw_type = LCK_RW_TYPE_EXCLUSIVE; + + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); + + if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{;}, + ^{lck_rw_type = lck_rw_done(lock);}); + } else if (!(lck_sleep_action & (LCK_SLEEP_SHARED | LCK_SLEEP_EXCLUSIVE))) { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{lck_rw_lock(lock, lck_rw_type);}, + ^{lck_rw_type = lck_rw_done(lock);}); + } else if (lck_sleep_action & LCK_SLEEP_EXCLUSIVE) { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{lck_rw_lock_exclusive(lock);}, + ^{lck_rw_type = lck_rw_done(lock);}); + } else { + return sleep_with_inheritor_and_turnstile_type(event, + inheritor, + interruptible, + deadline, + type, + ^{lck_rw_lock_shared(lock);}, + ^{lck_rw_type = lck_rw_done(lock);}); + } +} + +/* + * Name: lck_rw_sleep_with_inheritor + * + * Description: deschedule the current thread and wait on the waitq associated with event to be woken up. + * While waiting, the sched priority of the waiting thread will contribute to the push of the event that will + * be directed to the inheritor specified. + * An interruptible mode and deadline can be specified to return earlier from the wait. + * + * Args: + * Arg1: lck_rw_t lock used to protect the sleep. The lock will be dropped while sleeping and reaquired before returning according to the sleep action specified. + * Arg2: sleep action. LCK_SLEEP_DEFAULT, LCK_SLEEP_SHARED, LCK_SLEEP_EXCLUSIVE. + * Arg3: event to wait on. + * Arg4: thread to propagate the event push to. + * Arg5: interruptible flag for wait. + * Arg6: deadline for wait. + * + * Conditions: Lock must be held. Returns with the lock held according to the sleep action specified. + * Lock will be dropped while waiting. + * The inheritor specified cannot run in user space until another inheritor is specified for the event or a + * wakeup for the event is called. + * + * Returns: result of the wait. + */ +wait_result_t +lck_rw_sleep_with_inheritor(lck_rw_t *lock, lck_sleep_action_t lck_sleep_action, event_t event, thread_t inheritor, wait_interrupt_t interruptible, uint64_t deadline) +{ + return lck_rw_sleep_with_inheritor_and_turnstile_type(lock, lck_sleep_action, event, inheritor, interruptible, deadline, TURNSTILE_SLEEP_INHERITOR); +} + +/* + * wakeup_with_inheritor functions are independent from the locking primitive. + */ + +/* + * Name: wakeup_one_with_inheritor + * + * Description: wake up one waiter for event if any. The thread woken up will be the one with the higher sched priority waiting on event. + * The push for the event will be transferred from the last inheritor to the woken up thread if LCK_WAKE_DEFAULT is specified. + * If LCK_WAKE_DO_NOT_TRANSFER_PUSH is specified the push will not be transferred. + * + * Args: + * Arg1: event to wake from. + * Arg2: wait result to pass to the woken up thread. + * Arg3: wake flag. LCK_WAKE_DEFAULT or LCK_WAKE_DO_NOT_TRANSFER_PUSH. + * Arg4: pointer for storing the thread wokenup. + * + * Returns: KERN_NOT_WAITING if no threads were waiting, KERN_SUCCESS otherwise. 
+ * + * Conditions: The new inheritor wokenup cannot run in user space until another inheritor is specified for the event or a + * wakeup for the event is called. + * A reference for the wokenup thread is acquired. + * NOTE: this cannot be called from interrupt context. + */ +kern_return_t +wakeup_one_with_inheritor(event_t event, wait_result_t result, lck_wake_action_t action, thread_t *thread_wokenup) +{ + return wakeup_with_inheritor_and_turnstile_type(event, + TURNSTILE_SLEEP_INHERITOR, + result, + TRUE, + action, + thread_wokenup); +} + +/* + * Name: wakeup_all_with_inheritor + * + * Description: wake up all waiters waiting for event. The old inheritor will lose the push. + * + * Args: + * Arg1: event to wake from. + * Arg2: wait result to pass to the woken up threads. + * + * Returns: KERN_NOT_WAITING if no threads were waiting, KERN_SUCCESS otherwise. + * + * Conditions: NOTE: this cannot be called from interrupt context. + */ +kern_return_t +wakeup_all_with_inheritor(event_t event, wait_result_t result) +{ + return wakeup_with_inheritor_and_turnstile_type(event, + TURNSTILE_SLEEP_INHERITOR, + result, + FALSE, + 0, + NULL); +} + +/* + * change_sleep_inheritor is independent from the locking primitive. + */ + +/* + * Name: change_sleep_inheritor + * + * Description: Redirect the push of the waiting threads of event to the new inheritor specified. + * + * Args: + * Arg1: event to redirect the push. + * Arg2: new inheritor for event. + * + * Returns: KERN_NOT_WAITING if no threads were waiting, KERN_SUCCESS otherwise. + * + * Conditions: In case of success, the new inheritor cannot run in user space until another inheritor is specified for the event or a + * wakeup for the event is called. + * NOTE: this cannot be called from interrupt context. 
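+ *
+ * Illustrative use (hypothetical names): when ownership of the protected
+ * resource migrates while waiters are still blocked, redirect their push to
+ * the new owner:
+ *
+ *   lck_mtx_lock(&obj->lock);
+ *   obj->owner = new_owner;
+ *   change_sleep_inheritor((event_t) obj, new_owner);
+ *   lck_mtx_unlock(&obj->lock);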
+ */ +kern_return_t +change_sleep_inheritor(event_t event, thread_t inheritor) +{ + return change_sleep_inheritor_and_turnstile_type(event, + inheritor, + TURNSTILE_SLEEP_INHERITOR); +} + +void +kdp_sleep_with_inheritor_find_owner(struct waitq * waitq, __unused event64_t event, thread_waitinfo_t * waitinfo) +{ + assert(waitinfo->wait_type == kThreadWaitSleepWithInheritor); + assert(waitq_is_turnstile_queue(waitq)); + waitinfo->owner = 0; + waitinfo->context = 0; + + if (waitq_held(waitq)) { + return; + } + + struct turnstile *turnstile = waitq_to_turnstile(waitq); + assert(turnstile->ts_inheritor_flags & TURNSTILE_INHERITOR_THREAD); + waitinfo->owner = thread_tid(turnstile->ts_inheritor); +} + +typedef void (*void_func_void)(void); + +static kern_return_t +gate_try_close(gate_t *gate) +{ + uintptr_t state; + thread_t holder; + kern_return_t ret; + __assert_only bool waiters; + thread_t thread = current_thread(); + + if (os_atomic_cmpxchg(&gate->gate_data, 0, GATE_THREAD_TO_STATE(thread), acquire)) { + return KERN_SUCCESS; + } + + gate_ilock(gate); + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + + if (holder == NULL) { + waiters = gate_has_waiters(state); + assert(waiters == FALSE); + + state = GATE_THREAD_TO_STATE(current_thread()); + state |= GATE_ILOCK; + ordered_store_gate(gate, state); + ret = KERN_SUCCESS; + } else { + if (holder == current_thread()) { + panic("Trying to close a gate already owned by current thread %p", current_thread()); + } + ret = KERN_FAILURE; + } + + gate_iunlock(gate); + return ret; +} + +static void +gate_close(gate_t* gate) +{ + uintptr_t state; + thread_t holder; + __assert_only bool waiters; + thread_t thread = current_thread(); + + if (os_atomic_cmpxchg(&gate->gate_data, 0, GATE_THREAD_TO_STATE(thread), acquire)) { + return; + } + + gate_ilock(gate); + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + + if (holder != NULL) { + panic("Closing a gate already owned by %p from current thread %p", holder, current_thread()); + } + + waiters = gate_has_waiters(state); + assert(waiters == FALSE); + + state = GATE_THREAD_TO_STATE(thread); + state |= GATE_ILOCK; + ordered_store_gate(gate, state); + + gate_iunlock(gate); +} + +static void +gate_open_turnstile(gate_t *gate) +{ + struct turnstile *ts = NULL; + + ts = turnstile_prepare((uintptr_t)gate, &gate->turnstile, TURNSTILE_NULL, TURNSTILE_KERNEL_MUTEX); + waitq_wakeup64_all(&ts->ts_waitq, CAST_EVENT64_T(GATE_EVENT(gate)), THREAD_AWAKENED, WAITQ_ALL_PRIORITIES); + turnstile_update_inheritor(ts, TURNSTILE_INHERITOR_NULL, TURNSTILE_IMMEDIATE_UPDATE); + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_HELD); + turnstile_complete((uintptr_t)gate, &gate->turnstile, NULL, TURNSTILE_KERNEL_MUTEX); + /* + * We can do the cleanup while holding the interlock. + * It is ok because: + * 1. current_thread is the previous inheritor and it is running + * 2. new inheritor is NULL. + * => No chain of turnstiles needs to be updated. 
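+ * (Contrast with gate_steal_turnstile() and gate_wait_turnstile() below,
+ * which may have to update the old holder's chain and therefore hand
+ * turnstile_cleanup back to the caller to run after the interlock is
+ * dropped.)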
+ */
+ turnstile_cleanup();
+}
+
+static void
+gate_open(gate_t *gate)
+{
+ uintptr_t state;
+ thread_t holder;
+ bool waiters;
+ thread_t thread = current_thread();
+
+ if (os_atomic_cmpxchg(&gate->gate_data, GATE_THREAD_TO_STATE(thread), 0, release)) {
+ return;
+ }
+
+ gate_ilock(gate);
+ state = ordered_load_gate(gate);
+ holder = GATE_STATE_TO_THREAD(state);
+ waiters = gate_has_waiters(state);
+
+ if (holder != thread) {
+ panic("Opening gate owned by %p from current thread %p", holder, thread);
+ }
+
+ if (waiters) {
+ gate_open_turnstile(gate);
+ }
+
+ state = GATE_ILOCK;
+ ordered_store_gate(gate, state);
+
+ gate_iunlock(gate);
+}
+
+static kern_return_t
+gate_handoff_turnstile(gate_t *gate,
+ int flags,
+ thread_t *thread_woken_up,
+ bool *waiters)
+{
+ struct turnstile *ts = NULL;
+ kern_return_t ret = KERN_FAILURE;
+ thread_t hp_thread;
+
+ ts = turnstile_prepare((uintptr_t)gate, &gate->turnstile, TURNSTILE_NULL, TURNSTILE_KERNEL_MUTEX);
+ /*
+ * Wake up the highest priority thread waiting on the gate
+ */
+ hp_thread = waitq_wakeup64_identify(&ts->ts_waitq, CAST_EVENT64_T(GATE_EVENT(gate)), THREAD_AWAKENED, WAITQ_PROMOTE_ON_WAKE);
+
+ if (hp_thread != NULL) {
+ /*
+ * In this case waitq_wakeup64_identify has called turnstile_update_inheritor for us
+ */
+ turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_HELD);
+ *thread_woken_up = hp_thread;
+ *waiters = turnstile_has_waiters(ts);
+ /*
+ * Note: hp_thread is the new holder and the new inheritor.
+ * In case there are no more waiters, it doesn't need to be the inheritor
+ * and it shouldn't be it by the time it finishes the wait, so that its next open or
+ * handoff can go through the fast path.
+ * We could set the inheritor to NULL here, or the new holder itself can set it
+ * on its way back from the sleep. In the latter case there are more chances that
+ * new waiters will come by, avoiding the operation altogether.
+ */
+ ret = KERN_SUCCESS;
+ } else {
+ /*
+ * Waiters may have been woken up by an interrupt and still not
+ * have updated gate->waiters, so we couldn't find them on the waitq.
+ * Update the inheritor to NULL here, so that the current thread can return to userspace
+ * independently of when the interrupted waiters will finish the wait.
+ */
+ if (flags == GATE_HANDOFF_OPEN_IF_NO_WAITERS) {
+ turnstile_update_inheritor(ts, TURNSTILE_INHERITOR_NULL, TURNSTILE_IMMEDIATE_UPDATE);
+ turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_HELD);
+ }
+ // there are no waiters.
+ ret = KERN_NOT_WAITING;
+ }
+
+ turnstile_complete((uintptr_t)gate, &gate->turnstile, NULL, TURNSTILE_KERNEL_MUTEX);
+
+ /*
+ * We can do the cleanup while holding the interlock.
+ * It is ok because:
+ * 1. current_thread is the previous inheritor and it is running
+ * 2. new inheritor is NULL or it is a just-woken-up thread that will race acquiring the lock
+ * of the gate before trying to sleep.
+ * => No chain of turnstiles needs to be updated.
+ */
+ turnstile_cleanup();
+
+ return ret;
+}
+
+static kern_return_t
+gate_handoff(gate_t *gate,
+ int flags)
+{
+ kern_return_t ret;
+ thread_t new_holder = NULL;
+ uintptr_t state;
+ thread_t holder;
+ bool waiters;
+ thread_t thread = current_thread();
+
+ assert(flags == GATE_HANDOFF_OPEN_IF_NO_WAITERS || flags == GATE_HANDOFF_DEFAULT);
+
+ if (flags == GATE_HANDOFF_OPEN_IF_NO_WAITERS) {
+ if (os_atomic_cmpxchg(&gate->gate_data, GATE_THREAD_TO_STATE(thread), 0, release)) {
+ //gate opened but there were no waiters, so return KERN_NOT_WAITING.
+ return KERN_NOT_WAITING; + } + } + + gate_ilock(gate); + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + waiters = gate_has_waiters(state); + + if (holder != current_thread()) { + panic("Handing off gate owned by %p from current thread %p", holder, current_thread()); + } + + if (waiters) { + ret = gate_handoff_turnstile(gate, flags, &new_holder, &waiters); + if (ret == KERN_SUCCESS) { + state = GATE_THREAD_TO_STATE(new_holder); + if (waiters) { + state |= GATE_WAITERS; + } + } else { + if (flags == GATE_HANDOFF_OPEN_IF_NO_WAITERS) { + state = 0; + } + } + } else { + if (flags == GATE_HANDOFF_OPEN_IF_NO_WAITERS) { + state = 0; + } + ret = KERN_NOT_WAITING; + } + state |= GATE_ILOCK; + ordered_store_gate(gate, state); + + gate_iunlock(gate); + + if (new_holder) { + thread_deallocate(new_holder); + } + return ret; +} + +static void_func_void +gate_steal_turnstile(gate_t *gate, + thread_t new_inheritor) +{ + struct turnstile *ts = NULL; + + ts = turnstile_prepare((uintptr_t)gate, &gate->turnstile, TURNSTILE_NULL, TURNSTILE_KERNEL_MUTEX); + + turnstile_update_inheritor(ts, new_inheritor, (TURNSTILE_IMMEDIATE_UPDATE | TURNSTILE_INHERITOR_THREAD)); + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_HELD); + turnstile_complete((uintptr_t)gate, &gate->turnstile, NULL, TURNSTILE_KERNEL_MUTEX); + + /* + * turnstile_cleanup might need to update the chain of the old holder. + * This operation should happen without the turnstile interlock held. + */ + return turnstile_cleanup; +} + +static void +gate_steal(gate_t *gate) +{ + uintptr_t state; + thread_t holder; + thread_t thread = current_thread(); + bool waiters; + + void_func_void func_after_interlock_unlock; + + gate_ilock(gate); + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + waiters = gate_has_waiters(state); + + assert(holder != NULL); + state = GATE_THREAD_TO_STATE(thread) | GATE_ILOCK; + if (waiters) { + state |= GATE_WAITERS; + ordered_store_gate(gate, state); + func_after_interlock_unlock = gate_steal_turnstile(gate, thread); + gate_iunlock(gate); + + func_after_interlock_unlock(); + } else { + ordered_store_gate(gate, state); + gate_iunlock(gate); + } +} + +static void_func_void +gate_wait_turnstile(gate_t *gate, + wait_interrupt_t interruptible, + uint64_t deadline, + thread_t holder, + wait_result_t* wait, + bool* waiters) +{ + struct turnstile *ts; + uintptr_t state; + + ts = turnstile_prepare((uintptr_t)gate, &gate->turnstile, TURNSTILE_NULL, TURNSTILE_KERNEL_MUTEX); + + turnstile_update_inheritor(ts, holder, (TURNSTILE_DELAYED_UPDATE | TURNSTILE_INHERITOR_THREAD)); + waitq_assert_wait64(&ts->ts_waitq, CAST_EVENT64_T(GATE_EVENT(gate)), interruptible, deadline); + + gate_iunlock(gate); + + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_NOT_HELD); + + *wait = thread_block(THREAD_CONTINUE_NULL); + + gate_ilock(gate); + + *waiters = turnstile_has_waiters(ts); + + if (!*waiters) { + /* + * We want to enable the fast path as soon as we see that there are no more waiters. + * On the fast path the holder will not do any turnstile operations. + * Set the inheritor as NULL here. + * + * NOTE: if it was an open operation that woke this thread up, the inheritor has + * already been set to NULL. 
+ */ + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + if (holder && + ((*wait != THREAD_AWAKENED) || // thread interrupted or timedout + holder == current_thread())) { // thread was woken up and it is the new holder + turnstile_update_inheritor(ts, TURNSTILE_INHERITOR_NULL, TURNSTILE_IMMEDIATE_UPDATE); + turnstile_update_inheritor_complete(ts, TURNSTILE_INTERLOCK_NOT_HELD); + } + } + + turnstile_complete((uintptr_t)gate, &gate->turnstile, NULL, TURNSTILE_KERNEL_MUTEX); + + /* + * turnstile_cleanup might need to update the chain of the old holder. + * This operation should happen without the turnstile primitive interlock held. + */ + return turnstile_cleanup; +} + +static gate_wait_result_t +gate_wait(gate_t* gate, + wait_interrupt_t interruptible, + uint64_t deadline, + void (^primitive_unlock)(void), + void (^primitive_lock)(void)) +{ + gate_wait_result_t ret; + void_func_void func_after_interlock_unlock; + wait_result_t wait_result; + uintptr_t state; + thread_t holder; + bool waiters; + + + gate_ilock(gate); + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + + if (holder == NULL) { + panic("Trying to wait on open gate thread %p gate %p", current_thread(), gate); + } + + state |= GATE_WAITERS; + ordered_store_gate(gate, state); + + /* + * Release the primitive lock before any + * turnstile operation. Turnstile + * does not support a blocking primitive as + * interlock. + * + * In this way, concurrent threads will be + * able to acquire the primitive lock + * but still will wait for me through the + * gate interlock. + */ + primitive_unlock(); + + func_after_interlock_unlock = gate_wait_turnstile( gate, + interruptible, + deadline, + holder, + &wait_result, + &waiters); + + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + + switch (wait_result) { + case THREAD_INTERRUPTED: + case THREAD_TIMED_OUT: + assert(holder != current_thread()); + + if (waiters) { + state |= GATE_WAITERS; + } else { + state &= ~GATE_WAITERS; + } + ordered_store_gate(gate, state); + + if (wait_result == THREAD_INTERRUPTED) { + ret = GATE_INTERRUPTED; + } else { + ret = GATE_TIMED_OUT; + } + break; + default: + /* + * Note it is possible that even if the gate was handed off to + * me, someone called gate_steal() before I woke up. + * + * As well as it is possible that the gate was opened, but someone + * closed it while I was waking up. + * + * In both cases we return GATE_OPENED, as the gate was opened to me + * at one point, it is the caller responsibility to check again if + * the gate is open. 
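+ *
+ * Sketch of the expected caller pattern (hypothetical names, shown with the
+ * lck_mtx_t front-end; the lck_rw_t one is analogous):
+ *
+ *   lck_mtx_lock(&obj->lock);
+ *   while (lck_mtx_gate_try_close(&obj->lock, &obj->gate) != KERN_SUCCESS) {
+ *       if (lck_mtx_gate_wait(&obj->lock, &obj->gate, LCK_SLEEP_DEFAULT,
+ *               THREAD_UNINT, TIMEOUT_WAIT_FOREVER) == GATE_HANDOFF) {
+ *           break; // ownership was handed directly to us
+ *       }
+ *       // GATE_OPENED: the gate may have been closed again already, retry.
+ *   }
+ *   // gate held: do the work it protects
+ *   lck_mtx_gate_open(&obj->lock, &obj->gate);
+ *   lck_mtx_unlock(&obj->lock);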
+ */ + if (holder == current_thread()) { + ret = GATE_HANDOFF; } else { - KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED, MACH_RW_DEMOTE) | DBG_FUNC_NONE, - thread->sched_pri, thread->base_pri, 0, 0, 0); - - thread_recompute_sched_pri(thread, FALSE); + ret = GATE_OPENED; } + break; } - thread_unlock(thread); - splx(s); + gate_iunlock(gate); + + /* + * turnstile func that needs to be executed without + * holding the primitive interlock + */ + func_after_interlock_unlock(); + + primitive_lock(); + + return ret; +} +static void +gate_assert(gate_t *gate, int flags) +{ + uintptr_t state; + thread_t holder; + + gate_ilock(gate); + state = ordered_load_gate(gate); + holder = GATE_STATE_TO_THREAD(state); + + switch (flags) { + case GATE_ASSERT_CLOSED: + assert(holder != NULL); + break; + case GATE_ASSERT_OPEN: + assert(holder == NULL); + break; + case GATE_ASSERT_HELD: + assert(holder == current_thread()); + break; + default: + panic("invalid %s flag %d", __func__, flags); + } + + gate_iunlock(gate); +} + +static void +gate_init(gate_t *gate) +{ + gate->gate_data = 0; + gate->turnstile = NULL; +} + +static void +gate_destroy(__assert_only gate_t *gate) +{ + assert(gate->gate_data == 0); + assert(gate->turnstile == NULL); +} + +/* + * Name: lck_rw_gate_init + * + * Description: initializes a variable declared with decl_lck_rw_gate_data. + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + */ +void +lck_rw_gate_init(lck_rw_t *lock, gate_t *gate) +{ + (void) lock; + gate_init(gate); +} + +/* + * Name: lck_rw_gate_destroy + * + * Description: destroys a variable previously initialized. + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + */ +void +lck_rw_gate_destroy(lck_rw_t *lock, gate_t *gate) +{ + (void) lock; + gate_destroy(gate); +} + +/* + * Name: lck_rw_gate_try_close + * + * Description: Tries to close the gate. + * In case of success the current thread will be set as + * the holder of the gate. + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. + * + * Returns: + * KERN_SUCCESS in case the gate was successfully closed. The current thread is the new holder + * of the gate. + * A matching lck_rw_gate_open() or lck_rw_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * If the intent is to conditionally probe the gate before waiting, the lock must not be dropped + * between the calls to lck_rw_gate_try_close() and lck_rw_gate_wait(). + * + * KERN_FAILURE in case the gate was already closed. Will panic if the current thread was already the holder of the gate. + * lck_rw_gate_wait() should be called instead if the intent is to unconditionally wait on this gate. + * The calls to lck_rw_gate_try_close() and lck_rw_gate_wait() should + * be done without dropping the lock that is protecting the gate in between. + */ +int +lck_rw_gate_try_close(__assert_only lck_rw_t *lock, gate_t *gate) +{ + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); + + return gate_try_close(gate); +} + +/* + * Name: lck_rw_gate_close + * + * Description: Closes the gate. The current thread will be set as + * the holder of the gate. Will panic if the gate is already closed. 
+ * A matching lck_rw_gate_open() or lck_rw_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. + * The gate must be open. + * + */ +void +lck_rw_gate_close(__assert_only lck_rw_t *lock, gate_t *gate) +{ + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); + + return gate_close(gate); +} + +/* + * Name: lck_rw_gate_open + * + * Description: Opens the gate and wakes up possible waiters. + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. + * The current thread must be the holder of the gate. + * + */ +void +lck_rw_gate_open(__assert_only lck_rw_t *lock, gate_t *gate) +{ + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); + + gate_open(gate); } +/* + * Name: lck_rw_gate_handoff + * + * Description: Tries to transfer the ownership of the gate. The waiter with highest sched + * priority will be selected as the new holder of the gate, and woken up, + * with the gate remaining in the closed state throughout. + * If no waiters are present, the gate will be kept closed and KERN_NOT_WAITING + * will be returned. + * GATE_HANDOFF_OPEN_IF_NO_WAITERS flag can be used to specify if the gate should be opened in + * case no waiters were found. + * + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + * Arg3: flags - GATE_HANDOFF_DEFAULT or GATE_HANDOFF_OPEN_IF_NO_WAITERS + * + * Conditions: Lock must be held. Returns with the lock held. + * The current thread must be the holder of the gate. + * + * Returns: + * KERN_SUCCESS in case one of the waiters became the new holder. + * KERN_NOT_WAITING in case there were no waiters. + * + */ kern_return_t -host_lockgroup_info( - host_t host, - lockgroup_info_array_t *lockgroup_infop, - mach_msg_type_number_t *lockgroup_infoCntp) -{ - lockgroup_info_t *lockgroup_info_base; - lockgroup_info_t *lockgroup_info; - vm_offset_t lockgroup_info_addr; - vm_size_t lockgroup_info_size; - lck_grp_t *lck_grp; - unsigned int i; - vm_size_t used; - vm_map_copy_t copy; - kern_return_t kr; - - if (host == HOST_NULL) - return KERN_INVALID_HOST; +lck_rw_gate_handoff(__assert_only lck_rw_t *lock, gate_t *gate, int flags) +{ + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); - lck_mtx_lock(&lck_grp_lock); + return gate_handoff(gate, flags); +} - lockgroup_info_size = round_page(lck_grp_cnt * sizeof *lockgroup_info); - kr = kmem_alloc_pageable(ipc_kernel_map, - &lockgroup_info_addr, lockgroup_info_size, VM_KERN_MEMORY_IPC); - if (kr != KERN_SUCCESS) { - lck_mtx_unlock(&lck_grp_lock); - return(kr); +/* + * Name: lck_rw_gate_steal + * + * Description: Set the current ownership of the gate. It sets the current thread as the + * new holder of the gate. + * A matching lck_rw_gate_open() or lck_rw_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * NOTE: the previous holder should not call lck_rw_gate_open() or lck_rw_gate_handoff() + * anymore. + * + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. 
+ * The gate must be closed and the current thread must not already be the holder. + * + */ +void +lck_rw_gate_steal(__assert_only lck_rw_t *lock, gate_t *gate) +{ + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); + + gate_steal(gate); +} + +/* + * Name: lck_rw_gate_wait + * + * Description: Waits for the current thread to become the holder of the gate or for the + * gate to become open. An interruptible mode and deadline can be specified + * to return earlier from the wait. + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + * Arg3: sleep action. LCK_SLEEP_DEFAULT, LCK_SLEEP_SHARED, LCK_SLEEP_EXCLUSIVE. + * Arg3: interruptible flag for wait. + * Arg4: deadline + * + * Conditions: Lock must be held. Returns with the lock held according to the sleep action specified. + * Lock will be dropped while waiting. + * The gate must be closed. + * + * Returns: Reason why the thread was woken up. + * GATE_HANDOFF - the current thread was handed off the ownership of the gate. + * A matching lck_rw_gate_open() or lck_rw_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * GATE_OPENED - the gate was opened by the holder. + * GATE_TIMED_OUT - the thread was woken up by a timeout. + * GATE_INTERRUPTED - the thread was interrupted while sleeping. + * + */ +gate_wait_result_t +lck_rw_gate_wait(lck_rw_t *lock, gate_t *gate, lck_sleep_action_t lck_sleep_action, wait_interrupt_t interruptible, uint64_t deadline) +{ + __block lck_rw_type_t lck_rw_type = LCK_RW_TYPE_EXCLUSIVE; + + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); + + if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_rw_type = lck_rw_done(lock);}, + ^{;}); + } else if (!(lck_sleep_action & (LCK_SLEEP_SHARED | LCK_SLEEP_EXCLUSIVE))) { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_rw_type = lck_rw_done(lock);}, + ^{lck_rw_lock(lock, lck_rw_type);}); + } else if (lck_sleep_action & LCK_SLEEP_EXCLUSIVE) { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_rw_type = lck_rw_done(lock);}, + ^{lck_rw_lock_exclusive(lock);}); + } else { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_rw_type = lck_rw_done(lock);}, + ^{lck_rw_lock_shared(lock);}); } +} - lockgroup_info_base = (lockgroup_info_t *) lockgroup_info_addr; - lck_grp = (lck_grp_t *)queue_first(&lck_grp_queue); - lockgroup_info = lockgroup_info_base; +/* + * Name: lck_rw_gate_assert + * + * Description: asserts that the gate is in the specified state. + * + * Args: + * Arg1: lck_rw_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_rw_gate_data. + * Arg3: flags to specified assert type. 
+ * GATE_ASSERT_CLOSED - the gate is currently closed + * GATE_ASSERT_OPEN - the gate is currently opened + * GATE_ASSERT_HELD - the gate is currently closed and the current thread is the holder + */ +void +lck_rw_gate_assert(__assert_only lck_rw_t *lock, gate_t *gate, int flags) +{ + LCK_RW_ASSERT(lock, LCK_RW_ASSERT_HELD); - for (i = 0; i < lck_grp_cnt; i++) { + gate_assert(gate, flags); + return; +} - lockgroup_info->lock_spin_cnt = lck_grp->lck_grp_spincnt; - lockgroup_info->lock_spin_util_cnt = lck_grp->lck_grp_stat.lck_grp_spin_stat.lck_grp_spin_util_cnt; - lockgroup_info->lock_spin_held_cnt = lck_grp->lck_grp_stat.lck_grp_spin_stat.lck_grp_spin_held_cnt; - lockgroup_info->lock_spin_miss_cnt = lck_grp->lck_grp_stat.lck_grp_spin_stat.lck_grp_spin_miss_cnt; - lockgroup_info->lock_spin_held_max = lck_grp->lck_grp_stat.lck_grp_spin_stat.lck_grp_spin_held_max; - lockgroup_info->lock_spin_held_cum = lck_grp->lck_grp_stat.lck_grp_spin_stat.lck_grp_spin_held_cum; +/* + * Name: lck_mtx_gate_init + * + * Description: initializes a variable declared with decl_lck_mtx_gate_data. + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + */ +void +lck_mtx_gate_init(lck_mtx_t *lock, gate_t *gate) +{ + (void) lock; + gate_init(gate); +} - lockgroup_info->lock_mtx_cnt = lck_grp->lck_grp_mtxcnt; - lockgroup_info->lock_mtx_util_cnt = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_util_cnt; - lockgroup_info->lock_mtx_held_cnt = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_held_cnt; - lockgroup_info->lock_mtx_miss_cnt = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_miss_cnt; - lockgroup_info->lock_mtx_wait_cnt = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_wait_cnt; - lockgroup_info->lock_mtx_held_max = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_held_max; - lockgroup_info->lock_mtx_held_cum = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_held_cum; - lockgroup_info->lock_mtx_wait_max = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_wait_max; - lockgroup_info->lock_mtx_wait_cum = lck_grp->lck_grp_stat.lck_grp_mtx_stat.lck_grp_mtx_wait_cum; +/* + * Name: lck_mtx_gate_destroy + * + * Description: destroys a variable previously initialized + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + */ +void +lck_mtx_gate_destroy(lck_mtx_t *lock, gate_t *gate) +{ + (void) lock; + gate_destroy(gate); +} - lockgroup_info->lock_rw_cnt = lck_grp->lck_grp_rwcnt; - lockgroup_info->lock_rw_util_cnt = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_util_cnt; - lockgroup_info->lock_rw_held_cnt = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_held_cnt; - lockgroup_info->lock_rw_miss_cnt = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_miss_cnt; - lockgroup_info->lock_rw_wait_cnt = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_wait_cnt; - lockgroup_info->lock_rw_held_max = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_held_max; - lockgroup_info->lock_rw_held_cum = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_held_cum; - lockgroup_info->lock_rw_wait_max = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_wait_max; - lockgroup_info->lock_rw_wait_cum = lck_grp->lck_grp_stat.lck_grp_rw_stat.lck_grp_rw_wait_cum; +/* + * Name: lck_mtx_gate_try_close + * + * Description: Tries to close the gate. + * In case of success the current thread will be set as + * the holder of the gate. 
+ * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. + * + * Returns: + * KERN_SUCCESS in case the gate was successfully closed. The current thread is the new holder + * of the gate. + * A matching lck_mtx_gate_open() or lck_mtx_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * If the intent is to conditionally probe the gate before waiting, the lock must not be dropped + * between the calls to lck_mtx_gate_try_close() and lck_mtx_gate_wait(). + * + * KERN_FAILURE in case the gate was already closed. Will panic if the current thread was already the holder of the gate. + * lck_mtx_gate_wait() should be called instead if the intent is to unconditionally wait on this gate. + * The calls to lck_mtx_gate_try_close() and lck_mtx_gate_wait() should + * be done without dropping the lock that is protecting the gate in between. + */ +int +lck_mtx_gate_try_close(__assert_only lck_mtx_t *lock, gate_t *gate) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); - (void) strncpy(lockgroup_info->lockgroup_name,lck_grp->lck_grp_name, LOCKGROUP_MAX_NAME); + return gate_try_close(gate); +} - lck_grp = (lck_grp_t *)(queue_next((queue_entry_t)(lck_grp))); - lockgroup_info++; - } +/* + * Name: lck_mtx_gate_close + * + * Description: Closes the gate. The current thread will be set as + * the holder of the gate. Will panic if the gate is already closed. + * A matching lck_mtx_gate_open() or lck_mtx_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. + * The gate must be open. + * + */ +void +lck_mtx_gate_close(__assert_only lck_mtx_t *lock, gate_t *gate) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); - *lockgroup_infoCntp = lck_grp_cnt; - lck_mtx_unlock(&lck_grp_lock); + return gate_close(gate); +} - used = (*lockgroup_infoCntp) * sizeof *lockgroup_info; +/* + * Name: lck_mtx_gate_open + * + * Description: Opens of the gate and wakes up possible waiters. + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. + * The current thread must be the holder of the gate. + * + */ +void +lck_mtx_gate_open(__assert_only lck_mtx_t *lock, gate_t *gate) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); - if (used != lockgroup_info_size) - bzero((char *) lockgroup_info, lockgroup_info_size - used); + gate_open(gate); +} - kr = vm_map_copyin(ipc_kernel_map, (vm_map_address_t)lockgroup_info_addr, - (vm_map_size_t)lockgroup_info_size, TRUE, ©); - assert(kr == KERN_SUCCESS); +/* + * Name: lck_mtx_gate_handoff + * + * Description: Set the current ownership of the gate. The waiter with highest sched + * priority will be selected as the new holder of the gate, and woken up, + * with the gate remaining in the closed state throughout. + * If no waiters are present, the gate will be kept closed and KERN_NOT_WAITING + * will be returned. + * OPEN_ON_FAILURE flag can be used to specify if the gate should be opened in + * case no waiters were found. 
+ * + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + * Arg3: flags - GATE_NO_FALGS or OPEN_ON_FAILURE + * + * Conditions: Lock must be held. Returns with the lock held. + * The current thread must be the holder of the gate. + * + * Returns: + * KERN_SUCCESS in case one of the waiters became the new holder. + * KERN_NOT_WAITING in case there were no waiters. + * + */ +kern_return_t +lck_mtx_gate_handoff(__assert_only lck_mtx_t *lock, gate_t *gate, int flags) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); - *lockgroup_infop = (lockgroup_info_t *) copy; + return gate_handoff(gate, flags); +} + +/* + * Name: lck_mtx_gate_steal + * + * Description: Steals the ownership of the gate. It sets the current thread as the + * new holder of the gate. + * A matching lck_mtx_gate_open() or lck_mtx_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * NOTE: the previous holder should not call lck_mtx_gate_open() or lck_mtx_gate_handoff() + * anymore. + * + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + * + * Conditions: Lock must be held. Returns with the lock held. + * The gate must be closed and the current thread must not already be the holder. + * + */ +void +lck_mtx_gate_steal(__assert_only lck_mtx_t *lock, gate_t *gate) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); - return(KERN_SUCCESS); + gate_steal(gate); +} + +/* + * Name: lck_mtx_gate_wait + * + * Description: Waits for the current thread to become the holder of the gate or for the + * gate to become open. An interruptible mode and deadline can be specified + * to return earlier from the wait. + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + * Arg3: sleep action. LCK_SLEEP_DEFAULT, LCK_SLEEP_UNLOCK, LCK_SLEEP_SPIN, LCK_SLEEP_SPIN_ALWAYS. + * Arg3: interruptible flag for wait. + * Arg4: deadline + * + * Conditions: Lock must be held. Returns with the lock held according to the sleep action specified. + * Lock will be dropped while waiting. + * The gate must be closed. + * + * Returns: Reason why the thread was woken up. + * GATE_HANDOFF - the current thread was handed off the ownership of the gate. + * A matching lck_mtx_gate_open() or lck_mtx_gate_handoff() needs to be called later on + * to wake up possible waiters on the gate before returning to userspace. + * GATE_OPENED - the gate was opened by the holder. + * GATE_TIMED_OUT - the thread was woken up by a timeout. + * GATE_INTERRUPTED - the thread was interrupted while sleeping. 
+ * + */ +gate_wait_result_t +lck_mtx_gate_wait(lck_mtx_t *lock, gate_t *gate, lck_sleep_action_t lck_sleep_action, wait_interrupt_t interruptible, uint64_t deadline) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); + + if (lck_sleep_action & LCK_SLEEP_UNLOCK) { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_mtx_unlock(lock);}, + ^{;}); + } else if (lck_sleep_action & LCK_SLEEP_SPIN) { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_mtx_unlock(lock);}, + ^{lck_mtx_lock_spin(lock);}); + } else if (lck_sleep_action & LCK_SLEEP_SPIN_ALWAYS) { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_mtx_unlock(lock);}, + ^{lck_mtx_lock_spin_always(lock);}); + } else { + return gate_wait(gate, + interruptible, + deadline, + ^{lck_mtx_unlock(lock);}, + ^{lck_mtx_lock(lock);}); + } } +/* + * Name: lck_mtx_gate_assert + * + * Description: asserts that the gate is in the specified state. + * + * Args: + * Arg1: lck_mtx_t lock used to protect the gate. + * Arg2: pointer to the gate data declared with decl_lck_mtx_gate_data. + * Arg3: flags to specified assert type. + * GATE_ASSERT_CLOSED - the gate is currently closed + * GATE_ASSERT_OPEN - the gate is currently opened + * GATE_ASSERT_HELD - the gate is currently closed and the current thread is the holder + */ +void +lck_mtx_gate_assert(__assert_only lck_mtx_t *lock, gate_t *gate, int flags) +{ + LCK_MTX_ASSERT(lock, LCK_MTX_ASSERT_OWNED); + + gate_assert(gate, flags); +}
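A minimal sketch of the handoff path documented above, with hypothetical object and field names (illustrative only, not part of the diff):

    /* Current holder finishes its work and tries to pass the gate to the
     * highest-priority waiter; with GATE_HANDOFF_OPEN_IF_NO_WAITERS the gate
     * is simply opened when nobody is waiting. */
    lck_mtx_lock(&obj->lock);
    kern_return_t kr = lck_mtx_gate_handoff(&obj->lock, &obj->gate,
        GATE_HANDOFF_OPEN_IF_NO_WAITERS);
    if (kr == KERN_NOT_WAITING) {
        /* No waiters: the gate has been opened instead of handed off. */
    }
    lck_mtx_unlock(&obj->lock);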