X-Git-Url: https://git.saurik.com/apple/xnu.git/blobdiff_plain/316670eb35587141e969394ae8537d66b9211e80..3903760236c30e3b5ace7a4eefac3a269d68957c:/bsd/kern/kern_lockf.c diff --git a/bsd/kern/kern_lockf.c b/bsd/kern/kern_lockf.c index 13e4c97db..0a3165cf2 100644 --- a/bsd/kern/kern_lockf.c +++ b/bsd/kern/kern_lockf.c @@ -1,5 +1,5 @@ /* - * Copyright (c) 2006 Apple Computer, Inc. All rights reserved. + * Copyright (c) 2015 Apple Computer, Inc. All rights reserved. * * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ * @@ -75,6 +75,10 @@ #include #include #include +#include +#include + +#include /* * This variable controls the maximum number of processes that will @@ -82,17 +86,25 @@ */ static int maxlockdepth = MAXDEPTH; +#if (DEVELOPMENT || DEBUG) +#define LOCKF_DEBUGGING 1 +#endif + #ifdef LOCKF_DEBUGGING #include -#include -#include void lf_print(const char *tag, struct lockf *lock); void lf_printlist(const char *tag, struct lockf *lock); -static int lockf_debug = 2; + +#define LF_DBG_LOCKOP (1 << 0) /* setlk, getlk, clearlk */ +#define LF_DBG_LIST (1 << 1) /* split, coalesce */ +#define LF_DBG_IMPINH (1 << 2) /* importance inheritance */ +#define LF_DBG_TRACE (1 << 3) /* errors, exit */ + +static int lockf_debug = 0; /* was 2, could be 3 ;-) */ SYSCTL_INT(_debug, OID_AUTO, lockf_debug, CTLFLAG_RW | CTLFLAG_LOCKED, &lockf_debug, 0, ""); /* - * If there is no mask bit selector, or there is on, and the selector is + * If there is no mask bit selector, or there is one, and the selector is * set, then output the debugging diagnostic. */ #define LOCKF_DEBUG(mask, ...) \ @@ -129,9 +141,15 @@ static overlap_t lf_findoverlap(struct lockf *, struct lockf *, int, struct lockf ***, struct lockf **); static struct lockf *lf_getblock(struct lockf *, pid_t); static int lf_getlock(struct lockf *, struct flock *, pid_t); -static int lf_setlock(struct lockf *); +static int lf_setlock(struct lockf *, struct timespec *); static int lf_split(struct lockf *, struct lockf *); static void lf_wakelock(struct lockf *, boolean_t); +#if IMPORTANCE_INHERITANCE +static void lf_hold_assertion(task_t, struct lockf *); +static void lf_jump_to_queue_head(struct lockf *, struct lockf *); +static void lf_drop_assertion(struct lockf *); +static void lf_boost_blocking_proc(struct lockf *, struct lockf *); +#endif /* IMPORTANCE_INHERITANCE */ /* * lf_advlock @@ -150,6 +168,7 @@ static void lf_wakelock(struct lockf *, boolean_t); * lf_setlock:EDEADLK * lf_setlock:EINTR * lf_setlock:ENOLCK + * lf_setlock:ETIMEDOUT * lf_clearlock:ENOLCK * vnode_size:??? * @@ -177,7 +196,9 @@ lf_advlock(struct vnop_advlock_args *ap) if (*head == (struct lockf *)0) { if (ap->a_op != F_SETLK) { fl->l_type = F_UNLCK; - LOCKF_DEBUG(0, "lf_advlock: '%s' unlock without lock\n", vfs_context_proc(context)->p_comm); + LOCKF_DEBUG(LF_DBG_TRACE, + "lf_advlock: '%s' unlock without lock\n", + vfs_context_proc(context)->p_comm); return (0); } } @@ -205,7 +226,8 @@ lf_advlock(struct vnop_advlock_args *ap) * do this because we will use size to force range checks. 
*/ if ((error = vnode_size(vp, (off_t *)&size, context))) { - LOCKF_DEBUG(0, "lf_advlock: vnode_getattr failed: %d\n", error); + LOCKF_DEBUG(LF_DBG_TRACE, + "lf_advlock: vnode_getattr failed: %d\n", error); return (error); } @@ -217,22 +239,26 @@ lf_advlock(struct vnop_advlock_args *ap) break; default: - LOCKF_DEBUG(0, "lf_advlock: unknown whence %d\n", fl->l_whence); + LOCKF_DEBUG(LF_DBG_TRACE, "lf_advlock: unknown whence %d\n", + fl->l_whence); return (EINVAL); } if (start < 0) { - LOCKF_DEBUG(0, "lf_advlock: start < 0 (%qd)\n", start); + LOCKF_DEBUG(LF_DBG_TRACE, "lf_advlock: start < 0 (%qd)\n", + start); return (EINVAL); } if (fl->l_len < 0) { if (start == 0) { - LOCKF_DEBUG(0, "lf_advlock: len < 0 & start == 0\n"); + LOCKF_DEBUG(LF_DBG_TRACE, + "lf_advlock: len < 0 & start == 0\n"); return (EINVAL); } end = start - 1; start += fl->l_len; if (start < 0) { - LOCKF_DEBUG(0, "lf_advlock: start < 0 (%qd)\n", start); + LOCKF_DEBUG(LF_DBG_TRACE, + "lf_advlock: start < 0 (%qd)\n", start); return (EINVAL); } } else if (fl->l_len == 0) @@ -240,7 +266,7 @@ lf_advlock(struct vnop_advlock_args *ap) else { oadd = fl->l_len - 1; if (oadd > (off_t)(OFF_MAX - start)) { - LOCKF_DEBUG(0, "lf_advlock: overflow\n"); + LOCKF_DEBUG(LF_DBG_TRACE, "lf_advlock: overflow\n"); return (EOVERFLOW); } end = start + oadd; @@ -260,6 +286,13 @@ lf_advlock(struct vnop_advlock_args *ap) lock->lf_next = (struct lockf *)0; TAILQ_INIT(&lock->lf_blkhd); lock->lf_flags = ap->a_flags; +#if IMPORTANCE_INHERITANCE + lock->lf_boosted = LF_NOT_BOOSTED; +#endif + if (ap->a_flags & F_POSIX) + lock->lf_owner = (struct proc *)lock->lf_id; + else + lock->lf_owner = NULL; if (ap->a_flags & F_FLOCK) lock->lf_flags |= F_WAKE1_SAFE; @@ -270,7 +303,20 @@ lf_advlock(struct vnop_advlock_args *ap) */ switch(ap->a_op) { case F_SETLK: - error = lf_setlock(lock); + /* + * For F_OFD_* locks, lf_id is the fileglob. + * Record an "lf_owner" iff this is a confined fd + * i.e. it cannot escape this process and will be + * F_UNLCKed before the owner exits. (This is + * the implicit guarantee needed to ensure lf_owner + * remains a valid reference here.) 
+ */ + if (ap->a_flags & F_OFD_LOCK) { + struct fileglob *fg = (void *)lock->lf_id; + if (fg->fg_lflags & FG_CONFINED) + lock->lf_owner = current_proc(); + } + error = lf_setlock(lock, ap->a_timeout); break; case F_UNLCK: @@ -283,12 +329,6 @@ lf_advlock(struct vnop_advlock_args *ap) FREE(lock, M_LOCKF); break; -#if CONFIG_EMBEDDED - case F_GETLKPID: - error = lf_getlock(lock, fl, fl->l_pid); - FREE(lock, M_LOCKF); - break; -#endif default: FREE(lock, M_LOCKF); @@ -297,7 +337,7 @@ lf_advlock(struct vnop_advlock_args *ap) } lck_mtx_unlock(&vp->v_lock); /* done manipulating the list */ - LOCKF_DEBUG(0, "lf_advlock: normal exit: %d\n\n", error); + LOCKF_DEBUG(LF_DBG_TRACE, "lf_advlock: normal exit: %d\n", error); return (error); } @@ -384,7 +424,7 @@ lf_coalesce_adjacent(struct lockf *lock) ((*lf)->lf_end + 1) == lock->lf_start) { struct lockf *adjacent = *lf; - LOCKF_DEBUG(0, "lf_coalesce_adjacent: coalesce adjacent previous\n"); + LOCKF_DEBUG(LF_DBG_LIST, "lf_coalesce_adjacent: coalesce adjacent previous\n"); lock->lf_start = (*lf)->lf_start; *lf = lock; lf = &(*lf)->lf_next; @@ -399,7 +439,7 @@ lf_coalesce_adjacent(struct lockf *lock) (lock->lf_end + 1) == (*lf)->lf_start) { struct lockf *adjacent = *lf; - LOCKF_DEBUG(0, "lf_coalesce_adjacent: coalesce adjacent following\n"); + LOCKF_DEBUG(LF_DBG_LIST, "lf_coalesce_adjacent: coalesce adjacent following\n"); lock->lf_end = (*lf)->lf_end; lock->lf_next = (*lf)->lf_next; lf = &lock->lf_next; @@ -415,7 +455,6 @@ lf_coalesce_adjacent(struct lockf *lock) } } - /* * lf_setlock * @@ -427,19 +466,23 @@ lf_coalesce_adjacent(struct lockf *lock) * the set is successful, and freed if the * set is unsuccessful. * + * timeout Timeout specified in the case of + * SETLKWTIMEOUT. + * * Returns: 0 Success * EAGAIN * EDEADLK * lf_split:ENOLCK * lf_clearlock:ENOLCK * msleep:EINTR + * msleep:ETIMEDOUT * * Notes: We add the lock to the provisional lock list. We do not * coalesce at this time; this has implications for other lock * requestors in the blocker search mechanism. */ static int -lf_setlock(struct lockf *lock) +lf_setlock(struct lockf *lock, struct timespec *timeout) { struct lockf *block; struct lockf **head = lock->lf_head; @@ -450,7 +493,7 @@ lf_setlock(struct lockf *lock) overlap_t ovcase; #ifdef LOCKF_DEBUGGING - if (lockf_debug & 1) { + if (lockf_debug & LF_DBG_LOCKOP) { lf_print("lf_setlock", lock); lf_printlist("lf_setlock(in)", lock); } @@ -471,6 +514,7 @@ lf_setlock(struct lockf *lock) * Free the structure and return if nonblocking. */ if ((lock->lf_flags & F_WAIT) == 0) { + DTRACE_FSINFO(advlock__nowait, vnode_t, vp); FREE(lock, M_LOCKF); return (EAGAIN); } @@ -478,7 +522,11 @@ lf_setlock(struct lockf *lock) /* * We are blocked. Since flock style locks cover * the whole file, there is no chance for deadlock. - * For byte-range locks we must check for deadlock. + * + * OFD byte-range locks currently do NOT support + * deadlock detection. + * + * For POSIX byte-range locks we must check for deadlock. 
* * Deadlock detection is done by looking through the * wait channels to see if there are any cycles that @@ -493,7 +541,7 @@ lf_setlock(struct lockf *lock) int i = 0; /* The block is waiting on something */ - wproc = (struct proc *)block->lf_id; + wproc = block->lf_owner; proc_lock(wproc); TAILQ_FOREACH(ut, &wproc->p_uthlist, uu_list) { /* @@ -523,7 +571,7 @@ lf_setlock(struct lockf *lock) /* * Make sure it's an advisory range - * lock and not an overall file lock; + * lock and not any other kind of lock; * if we mix lock types, it's our own * fault. */ @@ -536,8 +584,8 @@ lf_setlock(struct lockf *lock) * getting the requested lock, then we * would deadlock, so error out. */ - bproc = (struct proc *)waitblock->lf_id; - if (bproc == (struct proc *)lock->lf_id) { + bproc = waitblock->lf_owner; + if (bproc == lock->lf_owner) { proc_unlock(wproc); FREE(lock, M_LOCKF); return (EDEADLK); @@ -571,43 +619,81 @@ lf_setlock(struct lockf *lock) if ( !(lock->lf_flags & F_FLOCK)) block->lf_flags &= ~F_WAKE1_SAFE; +#if IMPORTANCE_INHERITANCE + /* + * Importance donation is done only for cases where the + * owning task can be unambiguously determined. + * + * POSIX type locks are not inherited by child processes; + * we maintain a 1:1 mapping between a lock and its owning + * process. + * + * Flock type locks are inherited across fork() and there is + * no 1:1 mapping in the general case. However, the fileglobs + * used by OFD locks *may* be confined to the process that + * created them, and thus have an "owner", in which case + * we also attempt importance donation. + */ + if ((lock->lf_flags & block->lf_flags & F_POSIX) != 0) + lf_boost_blocking_proc(lock, block); + else if ((lock->lf_flags & block->lf_flags & F_OFD_LOCK) && + lock->lf_owner != block->lf_owner && + NULL != lock->lf_owner && NULL != block->lf_owner) + lf_boost_blocking_proc(lock, block); +#endif /* IMPORTANCE_INHERITANCE */ + #ifdef LOCKF_DEBUGGING - if (lockf_debug & 1) { + if (lockf_debug & LF_DBG_LOCKOP) { lf_print("lf_setlock: blocking on", block); lf_printlist("lf_setlock(block)", block); } #endif /* LOCKF_DEBUGGING */ - error = msleep(lock, &vp->v_lock, priority, lockstr, 0); + DTRACE_FSINFO(advlock__wait, vnode_t, vp); - if (!TAILQ_EMPTY(&lock->lf_blkhd)) { - if ((block = lf_getblock(lock, -1))) { - lf_move_blocked(block, lock); - } - } + error = msleep(lock, &vp->v_lock, priority, lockstr, timeout); if (error == 0 && (lock->lf_flags & F_ABORT) != 0) error = EBADF; - if (error) { /* XXX */ + if (lock->lf_next) { /* - * We may have been awakened by a signal and/or by a - * debugger continuing us (in which cases we must remove - * ourselves from the blocked list) and/or by another - * process releasing a lock (in which case we have - * already been removed from the blocked list and our - * lf_next field set to NOLOCKF). + * lf_wakelock() always sets wakelock->lf_next to + * NULL before a wakeup; so we've been woken early + * - perhaps by a debugger, signal or other event. 
+ * + * Remove 'lock' from the block list (avoids double-add + * in the spurious case, which would create a cycle) */ - if (lock->lf_next) { - TAILQ_REMOVE(&lock->lf_next->lf_blkhd, lock, lf_block); - lock->lf_next = NOLOCKF; + TAILQ_REMOVE(&lock->lf_next->lf_blkhd, lock, lf_block); + lock->lf_next = NULL; + + if (error == 0) { + /* + * If this was a spurious wakeup, retry + */ + printf("%s: spurious wakeup, retrying lock\n", + __func__); + continue; } + } + + if (!TAILQ_EMPTY(&lock->lf_blkhd)) { + if ((block = lf_getblock(lock, -1)) != NULL) + lf_move_blocked(block, lock); + } + + if (error) { if (!TAILQ_EMPTY(&lock->lf_blkhd)) lf_wakelock(lock, TRUE); - FREE(lock, M_LOCKF); + /* Return ETIMEDOUT if timeout occoured. */ + if (error == EWOULDBLOCK) { + error = ETIMEDOUT; + } return (error); - } /* XXX */ + } } + /* * No blocks!! Add the lock. Note that we will * downgrade or upgrade any overlapping locks this @@ -740,7 +826,7 @@ lf_setlock(struct lockf *lock) /* Coalesce adjacent locks with identical attributes */ lf_coalesce_adjacent(lock); #ifdef LOCKF_DEBUGGING - if (lockf_debug & 1) { + if (lockf_debug & LF_DBG_LOCKOP) { lf_print("lf_setlock: got the lock", lock); lf_printlist("lf_setlock(out)", lock); } @@ -778,7 +864,7 @@ lf_clearlock(struct lockf *unlock) #ifdef LOCKF_DEBUGGING if (unlock->lf_type != F_UNLCK) panic("lf_clearlock: bad type"); - if (lockf_debug & 1) + if (lockf_debug & LF_DBG_LOCKOP) lf_print("lf_clearlock", unlock); #endif /* LOCKF_DEBUGGING */ prev = head; @@ -787,6 +873,11 @@ lf_clearlock(struct lockf *unlock) * Wakeup the list of locks to be retried. */ lf_wakelock(overlap, FALSE); +#if IMPORTANCE_INHERITANCE + if (overlap->lf_boosted == LF_BOOSTED) { + lf_drop_assertion(overlap); + } +#endif /* IMPORTANCE_INHERITANCE */ switch (ovcase) { case OVERLAP_NONE: /* satisfy compiler enum/switch */ @@ -830,7 +921,7 @@ lf_clearlock(struct lockf *unlock) break; } #ifdef LOCKF_DEBUGGING - if (lockf_debug & 1) + if (lockf_debug & LF_DBG_LOCKOP) lf_printlist("lf_clearlock", unlock); #endif /* LOCKF_DEBUGGING */ return (0); @@ -865,7 +956,7 @@ lf_getlock(struct lockf *lock, struct flock *fl, pid_t matchpid) struct lockf *block; #ifdef LOCKF_DEBUGGING - if (lockf_debug & 1) + if (lockf_debug & LF_DBG_LOCKOP) lf_print("lf_getlock", lock); #endif /* LOCKF_DEBUGGING */ @@ -877,9 +968,13 @@ lf_getlock(struct lockf *lock, struct flock *fl, pid_t matchpid) fl->l_len = 0; else fl->l_len = block->lf_end - block->lf_start + 1; - if (block->lf_flags & F_POSIX) - fl->l_pid = proc_pid((struct proc *)(block->lf_id)); - else + if (NULL != block->lf_owner) { + /* + * lf_owner is only non-NULL when the lock + * "owner" can be unambiguously determined + */ + fl->l_pid = proc_pid(block->lf_owner); + } else fl->l_pid = -1; } else { fl->l_type = F_UNLCK; @@ -915,12 +1010,14 @@ lf_getblock(struct lockf *lock, pid_t matchpid) * Found an overlap. * * If we're matching pids, and it's a record lock, + * or it's an OFD lock on a process-confined fd, * but the pid doesn't match, then keep on looking .. */ if (matchpid != -1 && - (overlap->lf_flags & F_POSIX) != 0 && - proc_pid((struct proc *)(overlap->lf_id)) != matchpid) + (overlap->lf_flags & (F_POSIX|F_OFD_LOCK)) != 0 && + proc_pid(overlap->lf_owner) != matchpid) continue; + /* * does it block us? 
*/ @@ -986,7 +1083,7 @@ lf_findoverlap(struct lockf *lf, struct lockf *lock, int type, if (lf == NOLOCKF) return (0); #ifdef LOCKF_DEBUGGING - if (lockf_debug & 2) + if (lockf_debug & LF_DBG_LIST) lf_print("lf_findoverlap: looking for overlap in", lock); #endif /* LOCKF_DEBUGGING */ start = lock->lf_start; @@ -1017,7 +1114,7 @@ lf_findoverlap(struct lockf *lf, struct lockf *lock, int type, } #ifdef LOCKF_DEBUGGING - if (lockf_debug & 2) + if (lockf_debug & LF_DBG_LIST) lf_print("\tchecking", lf); #endif /* LOCKF_DEBUGGING */ /* @@ -1026,7 +1123,7 @@ lf_findoverlap(struct lockf *lf, struct lockf *lock, int type, if ((lf->lf_end != -1 && start > lf->lf_end) || (end != -1 && lf->lf_start > end)) { /* Case 0 */ - LOCKF_DEBUG(2, "no overlap\n"); + LOCKF_DEBUG(LF_DBG_LIST, "no overlap\n"); /* * NOTE: assumes that locks for the same process are @@ -1039,30 +1136,30 @@ lf_findoverlap(struct lockf *lf, struct lockf *lock, int type, continue; } if ((lf->lf_start == start) && (lf->lf_end == end)) { - LOCKF_DEBUG(2, "overlap == lock\n"); + LOCKF_DEBUG(LF_DBG_LIST, "overlap == lock\n"); return (OVERLAP_EQUALS_LOCK); } if ((lf->lf_start <= start) && (end != -1) && ((lf->lf_end >= end) || (lf->lf_end == -1))) { - LOCKF_DEBUG(2, "overlap contains lock\n"); + LOCKF_DEBUG(LF_DBG_LIST, "overlap contains lock\n"); return (OVERLAP_CONTAINS_LOCK); } if (start <= lf->lf_start && (end == -1 || (lf->lf_end != -1 && end >= lf->lf_end))) { - LOCKF_DEBUG(2, "lock contains overlap\n"); + LOCKF_DEBUG(LF_DBG_LIST, "lock contains overlap\n"); return (OVERLAP_CONTAINED_BY_LOCK); } if ((lf->lf_start < start) && ((lf->lf_end >= start) || (lf->lf_end == -1))) { - LOCKF_DEBUG(2, "overlap starts before lock\n"); + LOCKF_DEBUG(LF_DBG_LIST, "overlap starts before lock\n"); return (OVERLAP_STARTS_BEFORE_LOCK); } if ((lf->lf_start > start) && (end != -1) && ((lf->lf_end > end) || (lf->lf_end == -1))) { - LOCKF_DEBUG(2, "overlap ends after lock\n"); + LOCKF_DEBUG(LF_DBG_LIST, "overlap ends after lock\n"); return (OVERLAP_ENDS_AFTER_LOCK); } panic("lf_findoverlap: default"); @@ -1100,13 +1197,13 @@ lf_split(struct lockf *lock1, struct lockf *lock2) struct lockf *splitlock; #ifdef LOCKF_DEBUGGING - if (lockf_debug & 2) { + if (lockf_debug & LF_DBG_LIST) { lf_print("lf_split", lock1); lf_print("splitting from", lock2); } #endif /* LOCKF_DEBUGGING */ /* - * Check to see if spliting into only two pieces. + * Check to see if splitting into only two pieces. 
*/ if (lock1->lf_start == lock2->lf_start) { lock1->lf_start = lock2->lf_end + 1; @@ -1174,7 +1271,7 @@ lf_wakelock(struct lockf *listhead, boolean_t force_all) wakelock->lf_next = NOLOCKF; #ifdef LOCKF_DEBUGGING - if (lockf_debug & 2) + if (lockf_debug & LF_DBG_LOCKOP) lf_print("lf_wakelock: awakening", wakelock); #endif /* LOCKF_DEBUGGING */ if (wake_all == FALSE) { @@ -1189,6 +1286,10 @@ lf_wakelock(struct lockf *listhead, boolean_t force_all) struct lockf *tlock; TAILQ_FOREACH(tlock, &wakelock->lf_blkhd, lf_block) { + if (TAILQ_NEXT(tlock, lf_block) == tlock) { + /* See rdar://10887303 */ + panic("cycle in wakelock list"); + } tlock->lf_next = wakelock; } } @@ -1202,6 +1303,8 @@ lf_wakelock(struct lockf *listhead, boolean_t force_all) #ifdef LOCKF_DEBUGGING +#define GET_LF_OWNER_PID(lf) (proc_pid((lf)->lf_owner)) + /* * lf_print DEBUG * @@ -1218,7 +1321,11 @@ lf_print(const char *tag, struct lockf *lock) { printf("%s: lock %p for ", tag, (void *)lock); if (lock->lf_flags & F_POSIX) - printf("proc %ld", (long)((struct proc *)lock->lf_id)->p_pid); + printf("proc %p (owner %d)", + lock->lf_id, GET_LF_OWNER_PID(lock)); + else if (lock->lf_flags & F_OFD_LOCK) + printf("fg %p (owner %d)", + lock->lf_id, GET_LF_OWNER_PID(lock)); else printf("id %p", (void *)lock->lf_id); if (lock->lf_vnode != 0) @@ -1266,8 +1373,11 @@ lf_printlist(const char *tag, struct lockf *lock) for (lf = lock->lf_vnode->v_lockf; lf; lf = lf->lf_next) { printf("\tlock %p for ",(void *)lf); if (lf->lf_flags & F_POSIX) - printf("proc %ld", - (long)((struct proc *)lf->lf_id)->p_pid); + printf("proc %p (owner %d)", + lf->lf_id, GET_LF_OWNER_PID(lf)); + else if (lf->lf_flags & F_OFD_LOCK) + printf("fg %p (owner %d)", + lf->lf_id, GET_LF_OWNER_PID(lf)); else printf("id %p", (void *)lf->lf_id); printf(", %s, start 0x%016llx, end 0x%016llx", @@ -1278,8 +1388,11 @@ lf_printlist(const char *tag, struct lockf *lock) TAILQ_FOREACH(blk, &lf->lf_blkhd, lf_block) { printf("\n\t\tlock request %p for ", (void *)blk); if (blk->lf_flags & F_POSIX) - printf("proc %ld", - (long)((struct proc *)blk->lf_id)->p_pid); + printf("proc %p (owner %d)", + blk->lf_id, GET_LF_OWNER_PID(blk)); + else if (blk->lf_flags & F_OFD_LOCK) + printf("fg %p (owner %d)", + blk->lf_id, GET_LF_OWNER_PID(blk)); else printf("id %p", (void *)blk->lf_id); printf(", %s, start 0x%016llx, end 0x%016llx", @@ -1295,3 +1408,106 @@ lf_printlist(const char *tag, struct lockf *lock) } } #endif /* LOCKF_DEBUGGING */ + +#if IMPORTANCE_INHERITANCE + +/* + * lf_hold_assertion + * + * Call task importance hold assertion on the owner of the lock. + * + * Parameters: block_task Owner of the lock blocking + * current thread. + * + * block lock on which the current thread + * is blocking on. + * + * Returns: + * + * Notes: The task reference on block_task is not needed to be hold since + * the current thread has vnode lock and block_task has a file + * lock, thus removing file lock in exit requires block_task to + * grab the vnode lock. + */ +static void +lf_hold_assertion(task_t block_task, struct lockf *block) +{ + if (task_importance_hold_file_lock_assertion(block_task, 1) == 0) { + block->lf_boosted = LF_BOOSTED; + LOCKF_DEBUG(LF_DBG_IMPINH, + "lf: importance hold file lock assert on pid %d lock %p\n", + proc_pid(block->lf_owner), block); + } +} + + +/* + * lf_jump_to_queue_head + * + * Jump the lock from the tail of the block queue to the head of + * the queue. + * + * Parameters: block lockf struct containing the + * block queue. + * lock lockf struct to be jumped to the + * front. 
+ *
+ * Returns:
+ */
+static void
+lf_jump_to_queue_head(struct lockf *block, struct lockf *lock)
+{
+	/* Move the lock to the head of the block queue. */
+	TAILQ_REMOVE(&block->lf_blkhd, lock, lf_block);
+	TAILQ_INSERT_HEAD(&block->lf_blkhd, lock, lf_block);
+}
+
+
+/*
+ * lf_drop_assertion
+ *
+ * Drops the task hold assertion.
+ *
+ * Parameters:	block		lockf struct holding the assertion.
+ *
+ * Returns:
+ */
+static void
+lf_drop_assertion(struct lockf *block)
+{
+	LOCKF_DEBUG(LF_DBG_IMPINH, "lf: %d: dropping assertion for lock %p\n",
+	    proc_pid(block->lf_owner), block);
+
+	task_t current_task = proc_task(block->lf_owner);
+	task_importance_drop_file_lock_assertion(current_task, 1);
+	block->lf_boosted = LF_NOT_BOOSTED;
+}
+
+static void
+lf_boost_blocking_proc(struct lockf *lock, struct lockf *block)
+{
+	task_t ltask = proc_task(lock->lf_owner);
+	task_t btask = proc_task(block->lf_owner);
+
+	/*
+	 * Check if ltask can donate importance. The
+	 * check of imp_donor bit is done without holding
+	 * any lock. The value may change after you read it,
+	 * but it is ok to boost a task while someone else is
+	 * unboosting you.
+	 *
+	 * TODO: Support live inheritance on file locks.
+	 */
+	if (task_is_importance_donor(ltask)) {
+		LOCKF_DEBUG(LF_DBG_IMPINH,
+		    "lf: %d: attempt to boost pid %d that holds lock %p\n",
+		    proc_pid(lock->lf_owner), proc_pid(block->lf_owner), block);
+
+		if (block->lf_boosted != LF_BOOSTED &&
+		    task_is_importance_receiver_type(btask)) {
+			lf_hold_assertion(btask, block);
+		}
+		lf_jump_to_queue_head(block, lock);
+	}
+}
+#endif /* IMPORTANCE_INHERITANCE */
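
The timeout argument threaded into lf_setlock() above backs a timed variant of the blocking
byte-range lock: when the timed msleep() returns EWOULDBLOCK, the new code reports ETIMEDOUT
to the caller. A minimal user-space sketch of how that could be exercised follows; it assumes
the F_SETLKWTIMEOUT fcntl command and struct flocktimeout (members fl and timeout) from
Darwin's <sys/fcntl.h> — those names are assumptions here, not shown by this diff — and it
treats the timespec as a relative timeout.

/*
 * Sketch only: F_SETLKWTIMEOUT and struct flocktimeout are assumed to exist
 * in <sys/fcntl.h>; the #ifdef guard keeps this compiling where they do not.
 */
#include <errno.h>
#include <fcntl.h>
#include <stdio.h>
#include <string.h>

int
lock_first_byte_with_timeout(int fd)
{
#ifdef F_SETLKWTIMEOUT
	struct flocktimeout lt;

	memset(&lt, 0, sizeof (lt));
	lt.fl.l_type = F_WRLCK;		/* exclusive byte-range lock */
	lt.fl.l_whence = SEEK_SET;
	lt.fl.l_start = 0;
	lt.fl.l_len = 1;		/* just the first byte */
	lt.timeout.tv_sec = 2;		/* give up after ~2 seconds */
	lt.timeout.tv_nsec = 0;

	if (fcntl(fd, F_SETLKWTIMEOUT, &lt) == -1) {
		if (errno == ETIMEDOUT)	/* the timed wait in lf_setlock() expired */
			fprintf(stderr, "lock wait timed out\n");
		return (-1);
	}
	return (0);
#else
	(void)fd;
	errno = ENOTSUP;
	return (-1);
#endif
}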
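
The deadlock walk in lf_setlock() (following the blocked uthreads of the owning process,
POSIX locks only) is what turns a lock cycle between two processes into EDEADLK instead of a
permanent hang. The sketch below provokes that with nothing but standard F_SETLK/F_SETLKW
calls; the file path and the sleep()-based ordering are illustrative only, and whichever
process asks second is the one expected to see EDEADLK.

#include <err.h>
#include <errno.h>
#include <fcntl.h>
#include <stdio.h>
#include <string.h>
#include <sys/types.h>
#include <sys/wait.h>
#include <unistd.h>

/* Take (F_SETLK) or wait for (F_SETLKW) a one-byte write lock at 'start'. */
static int
range_lock(int fd, off_t start, int cmd)
{
	struct flock fl;

	memset(&fl, 0, sizeof (fl));
	fl.l_type = F_WRLCK;
	fl.l_whence = SEEK_SET;
	fl.l_start = start;
	fl.l_len = 1;
	return (fcntl(fd, cmd, &fl));
}

int
main(void)
{
	pid_t pid;
	int fd = open("/tmp/lockf-demo", O_RDWR | O_CREAT, 0644);

	if (fd < 0 || ftruncate(fd, 2) < 0)
		err(1, "setup");

	pid = fork();
	if (pid == 0) {
		/* Child: hold byte 1, then ask for byte 0 once the parent is blocked. */
		range_lock(fd, 1, F_SETLK);
		sleep(2);
		if (range_lock(fd, 0, F_SETLKW) == -1 && errno == EDEADLK)
			printf("child: EDEADLK from the cycle check\n");
		_exit(0);
	}

	/* Parent: hold byte 0, then wait for the child's byte 1. */
	range_lock(fd, 0, F_SETLK);
	sleep(1);
	if (range_lock(fd, 1, F_SETLKW) == -1 && errno == EDEADLK)
		printf("parent: EDEADLK from the cycle check\n");
	close(fd);		/* drops this process's POSIX locks, unblocking the child */
	waitpid(pid, NULL, 0);
	unlink("/tmp/lockf-demo");
	return (0);
}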
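
lf_getlock() above now fills l_pid from lf_owner only when the blocking owner can be
determined unambiguously, and reports -1 otherwise (for example flock()-style locks, whose
fileglob may be shared across processes). Reading that back from user space is the standard
F_GETLK query, sketched here:

#include <fcntl.h>
#include <stdio.h>
#include <string.h>

/* Ask who (if anyone) would block a whole-file write lock on fd. */
void
report_blocker(int fd)
{
	struct flock fl;

	memset(&fl, 0, sizeof (fl));
	fl.l_type = F_WRLCK;
	fl.l_whence = SEEK_SET;
	fl.l_start = 0;
	fl.l_len = 0;			/* zero length: to end of file */

	if (fcntl(fd, F_GETLK, &fl) == -1)
		return;

	if (fl.l_type == F_UNLCK)
		printf("no conflicting lock\n");
	else if (fl.l_pid == -1)
		printf("blocked, but no single owning process is known\n");
	else
		printf("blocked by pid %d\n", (int)fl.l_pid);
}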