2 * Copyright (c) 2002-2016 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 * Copyright (c) 1997 Berkeley Software Design, Inc. All rights reserved.
31 * Redistribution and use in source and binary forms, with or without
32 * modification, are permitted provided that the following conditions
34 * 1. Redistributions of source code must retain the above copyright
35 * notice, this list of conditions and the following disclaimer.
36 * 2. Redistributions in binary form must reproduce the above copyright
37 * notice, this list of conditions and the following disclaimer in the
38 * documentation and/or other materials provided with the distribution.
39 * 3. Berkeley Software Design Inc's name may not be used to endorse or
40 * promote products derived from this software without specific prior
43 * THIS SOFTWARE IS PROVIDED BY BERKELEY SOFTWARE DESIGN INC ``AS IS'' AND
44 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
45 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
46 * ARE DISCLAIMED. IN NO EVENT SHALL BERKELEY SOFTWARE DESIGN INC BE LIABLE
47 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
48 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
49 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
50 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
51 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
52 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
55 * from BSDI nfs_lock.c,v 2.4 1998/12/14 23:49:56 jch Exp
58 #include <nfs/nfs_conf.h>
61 #include <sys/cdefs.h>
62 #include <sys/param.h>
63 #include <sys/systm.h>
64 #include <sys/fcntl.h>
65 #include <sys/kernel.h> /* for hz */
66 #include <sys/file_internal.h>
67 #include <sys/malloc.h>
68 #include <sys/lockf.h> /* for hz */ /* Must come after sys/malloc.h */
69 #include <sys/kpi_mbuf.h>
70 #include <sys/mount_internal.h>
71 #include <sys/proc_internal.h> /* for p_start */
72 #include <sys/kauth.h>
73 #include <sys/resourcevar.h>
74 #include <sys/socket.h>
75 #include <sys/unistd.h>
77 #include <sys/vnode_internal.h>
79 #include <kern/thread.h>
80 #include <kern/host.h>
82 #include <machine/limits.h>
86 #include <nfs/rpcv2.h>
87 #include <nfs/nfsproto.h>
89 #include <nfs/nfs_gss.h>
90 #include <nfs/nfsmount.h>
91 #include <nfs/nfsnode.h>
92 #include <nfs/nfs_lock.h>
94 #include <mach/host_priv.h>
95 #include <mach/mig_errors.h>
96 #include <mach/host_special_ports.h>
97 #include <lockd/lockd_mach.h>
99 extern void ipc_port_release_send(ipc_port_t
);
102 * pending lock request messages are kept in this queue which is
103 * kept sorted by transaction ID (xid).
105 static uint64_t nfs_lockxid
= 0;
106 static LOCKD_MSG_QUEUE nfs_pendlockq
= TAILQ_HEAD_INITIALIZER(nfs_pendlockq
);
108 /* list of mounts that are (potentially) making lockd requests */
109 TAILQ_HEAD(nfs_lockd_mount_list
, nfsmount
) nfs_lockd_mount_list
=
110 TAILQ_HEAD_INITIALIZER(nfs_lockd_mount_list
);
112 static LCK_GRP_DECLARE(nfs_lock_lck_grp
, "nfs_lock");
113 static LCK_MTX_DECLARE(nfs_lock_mutex
, &nfs_lock_lck_grp
);
115 void nfs_lockdmsg_enqueue(LOCKD_MSG_REQUEST
*);
116 void nfs_lockdmsg_dequeue(LOCKD_MSG_REQUEST
*);
117 int nfs_lockdmsg_compare_to_answer(LOCKD_MSG_REQUEST
*, struct lockd_ans
*);
118 LOCKD_MSG_REQUEST
*nfs_lockdmsg_find_by_answer(struct lockd_ans
*);
119 LOCKD_MSG_REQUEST
*nfs_lockdmsg_find_by_xid(uint64_t);
120 uint64_t nfs_lockxid_get(void);
121 int nfs_lockd_send_request(LOCKD_MSG
*, int);
124 * Register a mount as (potentially) making lockd requests.
/*
 * nfs_lockd_mount_register: with nfs_lock_mutex held, link nmp onto the
 * head of nfs_lockd_mount_list through its nm_ldlink entry, then drop
 * the mutex.
 *
 * NOTE(review): original source lines 126, 128, 131 and 133 are not
 * present in this excerpt (return type, braces and one statement between
 * the insert and the unlock) -- confirm against the complete file.
 */
127 nfs_lockd_mount_register(struct nfsmount
*nmp
)
129 lck_mtx_lock(&nfs_lock_mutex
);
130 TAILQ_INSERT_HEAD(&nfs_lockd_mount_list
, nmp
, nm_ldlink
);
132 lck_mtx_unlock(&nfs_lock_mutex
);
136 * Unregister a mount as (potentially) making lockd requests.
138 * When the lockd mount count drops to zero, then send a shutdown request to
139 * lockd if we've sent any requests to it.
/*
 * nfs_lockd_mount_unregister: remove nmp from nfs_lockd_mount_list and,
 * when appropriate, tell lockd it is no longer needed.
 *
 * Visible flow:
 *  - Under nfs_lock_mutex, a mount whose nm_ldlink.tqe_next is NFSNOLIST
 *    is treated as not being on the list (the mutex is released in that
 *    branch).
 *  - Otherwise the mount is unlinked with TAILQ_REMOVE and its
 *    nm_ldlink.tqe_next is reset to NFSNOLIST.
 *  - send_shutdown is computed as (nfs_lockd_mounts == 0) &&
 *    nfs_lockd_request_sent, and nfs_lockd_request_sent is cleared.
 *  - After the mutex is dropped, the lockd port is fetched with
 *    host_get_lockd_port(); failure to get a valid port is logged with
 *    the port classified as NULL/DEAD/VALID.
 *  - lockd_shutdown() is called on the port, a non-KERN_SUCCESS result is
 *    logged, and the send right is released with ipc_port_release_send().
 *
 * NOTE(review): both printf messages are prefixed "nfs_lockd_mount_change",
 * which is not the name of this function -- presumably a stale name.
 * NOTE(review): several original source lines (declarations of kr and
 * send_shutdown, the return statements, the statement that adjusts
 * nfs_lockd_mounts, and all closing braces) are not present in this
 * excerpt -- confirm against the complete file before editing.
 */
142 nfs_lockd_mount_unregister(struct nfsmount
*nmp
)
145 mach_port_t lockd_port
= IPC_PORT_NULL
;
148 lck_mtx_lock(&nfs_lock_mutex
);
149 if (nmp
->nm_ldlink
.tqe_next
== NFSNOLIST
) {
150 lck_mtx_unlock(&nfs_lock_mutex
);
154 TAILQ_REMOVE(&nfs_lockd_mount_list
, nmp
, nm_ldlink
);
155 nmp
->nm_ldlink
.tqe_next
= NFSNOLIST
;
159 /* send a shutdown request if there are no more lockd mounts */
160 send_shutdown
= ((nfs_lockd_mounts
== 0) && nfs_lockd_request_sent
);
162 nfs_lockd_request_sent
= 0;
165 lck_mtx_unlock(&nfs_lock_mutex
);
167 if (!send_shutdown
) {
172 * Let lockd know that it is no longer needed for any NFS mounts
174 kr
= host_get_lockd_port(host_priv_self(), &lockd_port
);
175 if ((kr
!= KERN_SUCCESS
) || !IPC_PORT_VALID(lockd_port
)) {
176 printf("nfs_lockd_mount_change: shutdown couldn't get port, kr %d, port %s\n",
177 kr
, (lockd_port
== IPC_PORT_NULL
) ? "NULL" :
178 (lockd_port
== IPC_PORT_DEAD
) ? "DEAD" : "VALID");
182 kr
= lockd_shutdown(lockd_port
);
183 if (kr
!= KERN_SUCCESS
) {
184 printf("nfs_lockd_mount_change: shutdown %d\n", kr
);
187 ipc_port_release_send(lockd_port
);
191 * insert a lock request message into the pending queue
192 * (nfs_lock_mutex must be held)
195 nfs_lockdmsg_enqueue(LOCKD_MSG_REQUEST
*msgreq
)
197 LOCKD_MSG_REQUEST
*mr
;
199 mr
= TAILQ_LAST(&nfs_pendlockq
, nfs_lock_msg_queue
);
200 if (!mr
|| (msgreq
->lmr_msg
.lm_xid
> mr
->lmr_msg
.lm_xid
)) {
201 /* fast path: empty queue or new largest xid */
202 TAILQ_INSERT_TAIL(&nfs_pendlockq
, msgreq
, lmr_next
);
205 /* slow path: need to walk list to find insertion point */
206 while (mr
&& (msgreq
->lmr_msg
.lm_xid
> mr
->lmr_msg
.lm_xid
)) {
207 mr
= TAILQ_PREV(mr
, nfs_lock_msg_queue
, lmr_next
);
210 TAILQ_INSERT_AFTER(&nfs_pendlockq
, mr
, msgreq
, lmr_next
);
212 TAILQ_INSERT_HEAD(&nfs_pendlockq
, msgreq
, lmr_next
);
217 * remove a lock request message from the pending queue
218 * (nfs_lock_mutex must be held)
221 nfs_lockdmsg_dequeue(LOCKD_MSG_REQUEST
*msgreq
)
223 TAILQ_REMOVE(&nfs_pendlockq
, msgreq
, lmr_next
);
227 * find a pending lock request message by xid
229 * We search from the head of the list assuming that the message we're
230 * looking for is for an older request (because we have an answer to it).
231 * This assumes that lock request will be answered primarily in FIFO order.
232 * However, this may not be the case if there are blocked requests. We may
233 * want to move blocked requests to a separate queue (but that'll complicate
234 * duplicate xid checking).
236 * (nfs_lock_mutex must be held)
239 nfs_lockdmsg_find_by_xid(uint64_t lockxid
)
241 LOCKD_MSG_REQUEST
*mr
;
243 TAILQ_FOREACH(mr
, &nfs_pendlockq
, lmr_next
) {
244 if (mr
->lmr_msg
.lm_xid
== lockxid
) {
247 if (mr
->lmr_msg
.lm_xid
> lockxid
) {
255 * Because we can't depend on nlm_granted messages containing the same
256 * cookie we sent with the original lock request, we need code to test
257 * if an nlm_granted answer matches the lock request. We also need code
258 * that can find a lockd message based solely on the nlm_granted answer.
262 * compare lockd message to answer
264 * returns 0 on equality and 1 if different
267 nfs_lockdmsg_compare_to_answer(LOCKD_MSG_REQUEST
*msgreq
, struct lockd_ans
*ansp
)
269 if (!(ansp
->la_flags
& LOCKD_ANS_LOCK_INFO
)) {
272 if (msgreq
->lmr_msg
.lm_fl
.l_pid
!= ansp
->la_pid
) {
275 if (msgreq
->lmr_msg
.lm_fl
.l_start
!= ansp
->la_start
) {
278 if (msgreq
->lmr_msg
.lm_fl
.l_len
!= ansp
->la_len
) {
281 if (msgreq
->lmr_msg
.lm_fh_len
!= ansp
->la_fh_len
) {
284 if (bcmp(msgreq
->lmr_msg
.lm_fh
, ansp
->la_fh
, ansp
->la_fh_len
)) {
291 * find a pending lock request message based on the lock info provided
292 * in the lockd_ans/nlm_granted data. We need this because we can't
293 * depend on nlm_granted messages containing the same cookie we sent
294 * with the original lock request.
296 * We search from the head of the list assuming that the message we're
297 * looking for is for an older request (because we have an answer to it).
298 * This assumes that lock request will be answered primarily in FIFO order.
299 * However, this may not be the case if there are blocked requests. We may
300 * want to move blocked requests to a separate queue (but that'll complicate
301 * duplicate xid checking).
303 * (nfs_lock_mutex must be held)
306 nfs_lockdmsg_find_by_answer(struct lockd_ans
*ansp
)
308 LOCKD_MSG_REQUEST
*mr
;
310 if (!(ansp
->la_flags
& LOCKD_ANS_LOCK_INFO
)) {
313 TAILQ_FOREACH(mr
, &nfs_pendlockq
, lmr_next
) {
314 if (!nfs_lockdmsg_compare_to_answer(mr
, ansp
)) {
322 * return the next unique lock request transaction ID
323 * (nfs_lock_mutex must be held)
/*
 * nfs_lockxid_get: hand out the next lock request transaction ID from the
 * file-scope counter nfs_lockxid.
 *
 * Visible flow:
 *  - nfs_lockxid is seeded from tv.tv_sec shifted left by 12 bits.
 *  - The counter is pre-incremented and compared against zero.
 *  - If the pending queue is empty, or the xid of its last entry is below
 *    the candidate, that is the fast path.
 *  - Otherwise the enclosing loop repeats for as long as
 *    nfs_lockdmsg_find_by_xid() finds the candidate in the queue.
 *
 * NOTE(review): the lines that declare and fill in tv, guard the seeding,
 * open the loop, handle the zero case and return the result are not
 * present in this excerpt -- confirm against the complete file.
 */
326 nfs_lockxid_get(void)
328 LOCKD_MSG_REQUEST
*mr
;
330 /* derive initial lock xid from system time */
333 * Note: it's OK if this code inits nfs_lockxid to 0 (for example,
334 * due to a broken clock) because we immediately increment it
335 * and we guarantee to never use xid 0. So, nfs_lockxid should only
336 * ever be 0 the first time this function is called.
340 nfs_lockxid
= (uint64_t)tv
.tv_sec
<< 12;
343 /* make sure we get a unique xid */
345 /* Skip zero xid if it should ever happen. */
346 if (++nfs_lockxid
== 0) {
349 if (!(mr
= TAILQ_LAST(&nfs_pendlockq
, nfs_lock_msg_queue
)) ||
350 (mr
->lmr_msg
.lm_xid
< nfs_lockxid
)) {
351 /* fast path: empty queue or new largest xid */
354 /* check if xid is already in use */
355 } while (nfs_lockdmsg_find_by_xid(nfs_lockxid
));
360 #define MACH_MAX_TRIES 3
/*
 * nfs_lockd_send_request: deliver one LOCKD_MSG to the lock daemon over
 * its Mach port.
 *
 * Visible flow:
 *  - The lockd port is obtained with host_get_lockd_port(); a failure or
 *    an invalid port is handled before any send is attempted.
 *  - The send passes &msg->lm_addr and &msg->lm_cred cast to uint32_t
 *    pointers, and a non-KERN_SUCCESS result is logged.
 *  - Inner loop: repeats while the caller is not interruptable and the
 *    result is MACH_SEND_INTERRUPTED.
 *  - Outer loop: repeats while the result is MIG_SERVER_DIED and retries
 *    is still below MACH_MAX_TRIES (retries is post-incremented).
 *  - The port send right is released with ipc_port_release_send(), after
 *    which the result is dispatched on (MACH_SEND_INTERRUPTED is one case).
 *
 * NOTE(review): the declarations of kr and retries, the RPC call itself,
 * the loop openers and most of the result-to-errno switch are not present
 * in this excerpt, so the returned error values cannot be documented from
 * here -- confirm against the complete file.
 */
363 nfs_lockd_send_request(LOCKD_MSG
*msg
, int interruptable
)
367 mach_port_t lockd_port
= IPC_PORT_NULL
;
369 kr
= host_get_lockd_port(host_priv_self(), &lockd_port
);
370 if (kr
!= KERN_SUCCESS
|| !IPC_PORT_VALID(lockd_port
)) {
375 /* In the kernel all mach messaging is interruptable */
387 (uint32_t *)&msg
->lm_addr
,
388 (uint32_t *)&msg
->lm_cred
,
391 if (kr
!= KERN_SUCCESS
) {
392 printf("lockd_request received %d!\n", kr
);
394 } while (!interruptable
&& kr
== MACH_SEND_INTERRUPTED
);
395 } while (kr
== MIG_SERVER_DIED
&& retries
++ < MACH_MAX_TRIES
);
397 ipc_port_release_send(lockd_port
);
399 case MACH_SEND_INTERRUPTED
:
403 * Other MACH or MIG errors we will retry. Eventually
404 * we will call nfs_down and allow the user to disable
412 * NFS advisory byte-level locks (client)
418 LOCKD_MSG_REQUEST
*msgreq
,
422 LOCKD_MSG
*msg
= &msgreq
->lmr_msg
;
424 int interruptable
, slpflag
;
425 struct nfsmount
*nmp
;
427 int timeo
, wentdown
= 0;
428 long starttime
, endtime
, lastmsg
;
430 struct sockaddr
*saddr
;
433 if (!nmp
|| !nmp
->nm_saddr
) {
437 lck_mtx_lock(&nmp
->nm_lock
);
438 saddr
= nmp
->nm_saddr
;
439 bcopy(saddr
, &msg
->lm_addr
, min(sizeof msg
->lm_addr
, saddr
->sa_len
));
440 if (nmp
->nm_vers
== NFS_VER3
) {
441 msg
->lm_flags
|= LOCKD_MSG_NFSV3
;
444 if (nmp
->nm_sotype
!= SOCK_DGRAM
) {
445 msg
->lm_flags
|= LOCKD_MSG_TCP
;
449 starttime
= now
.tv_sec
;
450 lastmsg
= now
.tv_sec
- ((nmp
->nm_tprintf_delay
) - (nmp
->nm_tprintf_initial_delay
));
451 interruptable
= NMFLAG(nmp
, INTR
);
452 lck_mtx_unlock(&nmp
->nm_lock
);
454 lck_mtx_lock(&nfs_lock_mutex
);
456 /* allocate unique xid */
457 msg
->lm_xid
= nfs_lockxid_get();
458 nfs_lockdmsg_enqueue(msgreq
);
463 nfs_lockd_request_sent
= 1;
465 /* need to drop nfs_lock_mutex while calling nfs_lockd_send_request() */
466 lck_mtx_unlock(&nfs_lock_mutex
);
467 error
= nfs_lockd_send_request(msg
, interruptable
);
468 lck_mtx_lock(&nfs_lock_mutex
);
469 if (error
&& error
!= EAGAIN
) {
474 * Always wait for an answer. Not waiting for unlocks could
475 * cause a lock to be left if the unlock request gets dropped.
479 * Retry if it takes too long to get a response.
481 * The timeout numbers were picked out of thin air... they start
482 * at 4 and double each timeout with a max of 30 seconds.
484 * In order to maintain responsiveness, we pass a small timeout
485 * to msleep and calculate the timeouts ourselves. This allows
486 * us to pick up on mount changes quicker.
490 slpflag
= (interruptable
&& (type
!= F_UNLCK
)) ? PCATCH
: 0;
494 endtime
= now
.tv_sec
+ timeo
;
495 while (now
.tv_sec
< endtime
) {
497 if (!msgreq
->lmr_answered
) {
498 error
= msleep(msgreq
, &nfs_lock_mutex
, slpflag
| PUSER
, "lockd", &ts
);
501 if (msgreq
->lmr_answered
) {
503 * Note: it's possible to have a lock granted at
504 * essentially the same time that we get interrupted.
505 * Since the lock may be granted, we can't return an
506 * error from this request or we might not unlock the
507 * lock that's been granted.
510 if ((msgreq
->lmr_errno
== ENOTSUP
) && nmp
&&
511 (nmp
->nm_state
& NFSSTA_LOCKSWORK
)) {
513 * We have evidence that locks work, yet lockd
514 * returned ENOTSUP. This is probably because
515 * it was unable to contact the server's lockd
516 * to send it the request.
518 * Because we know locks work, we'll consider
519 * this failure to be a timeout.
527 if (error
!= EWOULDBLOCK
) {
530 /* check that we still have our mount... */
531 /* ...and that we still support locks */
532 /* ...and that there isn't a recovery pending */
534 if ((error2
= nfs_sigintr(nmp
, NULL
, NULL
, 0))) {
536 if (type
== F_UNLCK
) {
537 printf("nfs3_lockd_request: aborting unlock request, error %d\n", error
);
541 lck_mtx_lock(&nmp
->nm_lock
);
542 if (nmp
->nm_lockmode
== NFS_LOCK_MODE_DISABLED
) {
543 lck_mtx_unlock(&nmp
->nm_lock
);
546 if ((nmp
->nm_state
& NFSSTA_RECOVER
) && !(flags
& R_RECOVER
)) {
547 /* recovery pending... return an error that'll get this operation restarted */
548 error
= NFSERR_GRACE
;
549 lck_mtx_unlock(&nmp
->nm_lock
);
552 interruptable
= NMFLAG(nmp
, INTR
);
553 lck_mtx_unlock(&nmp
->nm_lock
);
557 /* check that we still have our mount... */
559 if ((error2
= nfs_sigintr(nmp
, NULL
, NULL
, 0))) {
561 if (error2
!= EINTR
) {
562 if (type
== F_UNLCK
) {
563 printf("nfs3_lockd_request: aborting unlock request, error %d\n", error
);
568 /* ...and that we still support locks */
569 lck_mtx_lock(&nmp
->nm_lock
);
570 if (nmp
->nm_lockmode
== NFS_LOCK_MODE_DISABLED
) {
571 if (error
== EWOULDBLOCK
) {
574 lck_mtx_unlock(&nmp
->nm_lock
);
577 /* ...and that there isn't a recovery pending */
578 if ((error
== EWOULDBLOCK
) && (nmp
->nm_state
& NFSSTA_RECOVER
) && !(flags
& R_RECOVER
)) {
579 /* recovery pending... return to allow recovery to occur */
580 error
= NFSERR_DENIED
;
581 lck_mtx_unlock(&nmp
->nm_lock
);
584 interruptable
= NMFLAG(nmp
, INTR
);
585 if ((error
!= EWOULDBLOCK
) ||
586 ((nmp
->nm_state
& NFSSTA_RECOVER
) && !(flags
& R_RECOVER
)) ||
587 ((flags
& R_RECOVER
) && ((now
.tv_sec
- starttime
) > 30))) {
588 if ((error
== EWOULDBLOCK
) && (flags
& R_RECOVER
)) {
589 /* give up if this is for recovery and taking too long */
591 } else if ((nmp
->nm_state
& NFSSTA_RECOVER
) && !(flags
& R_RECOVER
)) {
592 /* recovery pending... return an error that'll get this operation restarted */
593 error
= NFSERR_GRACE
;
595 lck_mtx_unlock(&nmp
->nm_lock
);
597 * We're going to bail on this request.
598 * If we were a blocked lock request, send a cancel.
600 if ((msgreq
->lmr_errno
== EINPROGRESS
) &&
601 !(msg
->lm_flags
& LOCKD_MSG_CANCEL
)) {
602 /* set this request up as a cancel */
603 msg
->lm_flags
|= LOCKD_MSG_CANCEL
;
604 nfs_lockdmsg_dequeue(msgreq
);
605 msg
->lm_xid
= nfs_lockxid_get();
606 nfs_lockdmsg_enqueue(msgreq
);
607 msgreq
->lmr_saved_errno
= error
;
608 msgreq
->lmr_errno
= 0;
609 msgreq
->lmr_answered
= 0;
612 /* send cancel request */
618 /* warn if we're not getting any response */
620 if ((msgreq
->lmr_errno
!= EINPROGRESS
) &&
621 !(msg
->lm_flags
& LOCKD_MSG_DENIED_GRACE
) &&
622 (nmp
->nm_tprintf_initial_delay
!= 0) &&
623 ((lastmsg
+ nmp
->nm_tprintf_delay
) < now
.tv_sec
)) {
624 lck_mtx_unlock(&nmp
->nm_lock
);
625 lastmsg
= now
.tv_sec
;
626 nfs_down(nmp
, thd
, 0, NFSSTA_LOCKTIMEO
, "lockd not responding", 1);
629 lck_mtx_unlock(&nmp
->nm_lock
);
632 if (msgreq
->lmr_errno
== EINPROGRESS
) {
634 * We've got a blocked lock request that we are
635 * going to retry. First, we'll want to try to
636 * send a cancel for the previous request.
638 * Clear errno so if we don't get a response
639 * to the resend we'll call nfs_down().
640 * Also reset timeout because we'll expect a
641 * quick response to the cancel/resend (even if
642 * it is NLM_BLOCKED).
644 msg
->lm_flags
|= LOCKD_MSG_CANCEL
;
645 nfs_lockdmsg_dequeue(msgreq
);
646 msg
->lm_xid
= nfs_lockxid_get();
647 nfs_lockdmsg_enqueue(msgreq
);
648 msgreq
->lmr_saved_errno
= msgreq
->lmr_errno
;
649 msgreq
->lmr_errno
= 0;
650 msgreq
->lmr_answered
= 0;
652 /* send cancel then resend request */
657 * We timed out, so we will resend the request.
659 if (!(flags
& R_RECOVER
)) {
669 /* we got a response, so the server's lockd is OK */
670 nfs_up(NFSTONMP(np
), thd
, NFSSTA_LOCKTIMEO
,
671 wentdown
? "lockd alive again" : NULL
);
674 if (msgreq
->lmr_answered
&& (msg
->lm_flags
& LOCKD_MSG_DENIED_GRACE
)) {
676 * The lock request was denied because the server lockd is
677 * still in its grace period. So, we need to try the
678 * request again in a little bit. Return the GRACE error so
679 * the higher levels can perform the retry.
681 msgreq
->lmr_saved_errno
= msgreq
->lmr_errno
= error
= NFSERR_GRACE
;
684 if (msgreq
->lmr_errno
== EINPROGRESS
) {
685 /* got NLM_BLOCKED response */
686 /* need to wait for NLM_GRANTED */
688 msgreq
->lmr_answered
= 0;
689 goto wait_for_granted
;
692 if ((msg
->lm_flags
& LOCKD_MSG_CANCEL
) &&
693 (msgreq
->lmr_saved_errno
== EINPROGRESS
)) {
695 * We just got a successful reply to the
696 * cancel of the previous blocked lock request.
697 * Now, go ahead and return a DENIED error so the
698 * higher levels can resend the request.
700 msg
->lm_flags
&= ~LOCKD_MSG_CANCEL
;
701 error
= NFSERR_DENIED
;
702 /* Will dequeue msgreq after the following break at the end of this routine */
707 * If the blocked lock request was cancelled.
708 * Restore the error condition from when we
709 * originally bailed on the request.
711 if (msg
->lm_flags
& LOCKD_MSG_CANCEL
) {
712 msg
->lm_flags
&= ~LOCKD_MSG_CANCEL
;
713 error
= msgreq
->lmr_saved_errno
;
715 error
= msgreq
->lmr_errno
;
719 if ((error
== ENOTSUP
) && nmp
&& !(nmp
->nm_state
& NFSSTA_LOCKSWORK
)) {
721 * We have NO evidence that locks work and lockd
722 * returned ENOTSUP. Let's take this as a hint
723 * that locks aren't supported and disable them
726 nfs_lockdmsg_dequeue(msgreq
);
727 lck_mtx_unlock(&nfs_lock_mutex
);
728 lck_mtx_lock(&nmp
->nm_lock
);
729 if (nmp
->nm_lockmode
== NFS_LOCK_MODE_ENABLED
) {
730 nmp
->nm_lockmode
= NFS_LOCK_MODE_DISABLED
;
731 nfs_lockd_mount_unregister(nmp
);
733 nmp
->nm_state
&= ~NFSSTA_LOCKTIMEO
;
734 lck_mtx_unlock(&nmp
->nm_lock
);
735 printf("lockd returned ENOTSUP, disabling locks for nfs server: %s\n",
736 vfs_statfs(nmp
->nm_mountp
)->f_mntfromname
);
740 /* record that NFS file locking has worked on this mount */
742 lck_mtx_lock(&nmp
->nm_lock
);
743 if (!(nmp
->nm_state
& NFSSTA_LOCKSWORK
)) {
744 nmp
->nm_state
|= NFSSTA_LOCKSWORK
;
746 lck_mtx_unlock(&nmp
->nm_lock
);
752 nfs_lockdmsg_dequeue(msgreq
);
754 lck_mtx_unlock(&nfs_lock_mutex
);
760 * Send an NLM LOCK message to the server
765 struct nfs_open_file
*nofp
,
766 struct nfs_file_lock
*nflp
,
772 struct nfs_lock_owner
*nlop
= nflp
->nfl_owner
;
773 struct nfsmount
*nmp
;
775 LOCKD_MSG_REQUEST msgreq
;
779 if (nfs_mount_gone(nmp
)) {
783 if (!nlop
->nlo_open_owner
) {
784 nfs_open_owner_ref(nofp
->nof_owner
);
785 nlop
->nlo_open_owner
= nofp
->nof_owner
;
787 if ((error
= nfs_lock_owner_set_busy(nlop
, thd
))) {
791 /* set up lock message request structure */
792 bzero(&msgreq
, sizeof(msgreq
));
793 msg
= &msgreq
.lmr_msg
;
794 msg
->lm_version
= LOCKD_MSG_VERSION
;
795 if ((nflp
->nfl_flags
& NFS_FILE_LOCK_WAIT
) && !reclaim
) {
796 msg
->lm_flags
|= LOCKD_MSG_BLOCK
;
799 msg
->lm_flags
|= LOCKD_MSG_RECLAIM
;
801 msg
->lm_fh_len
= (nmp
->nm_vers
== NFS_VER2
) ? NFSX_V2FH
: np
->n_fhsize
;
802 bcopy(np
->n_fhp
, msg
->lm_fh
, msg
->lm_fh_len
);
803 cru2x(cred
, &msg
->lm_cred
);
805 msg
->lm_fl
.l_whence
= SEEK_SET
;
806 msg
->lm_fl
.l_start
= nflp
->nfl_start
;
807 msg
->lm_fl
.l_len
= NFS_FLOCK_LENGTH(nflp
->nfl_start
, nflp
->nfl_end
);
808 msg
->lm_fl
.l_type
= nflp
->nfl_type
;
809 msg
->lm_fl
.l_pid
= nlop
->nlo_pid
;
811 error
= nfs3_lockd_request(np
, 0, &msgreq
, flags
, thd
);
813 nfs_lock_owner_clear_busy(nlop
);
818 * Send an NLM UNLOCK message to the server
823 struct nfs_lock_owner
*nlop
,
831 struct nfsmount
*nmp
;
832 LOCKD_MSG_REQUEST msgreq
;
840 /* set up lock message request structure */
841 bzero(&msgreq
, sizeof(msgreq
));
842 msg
= &msgreq
.lmr_msg
;
843 msg
->lm_version
= LOCKD_MSG_VERSION
;
844 msg
->lm_fh_len
= (nmp
->nm_vers
== NFS_VER2
) ? NFSX_V2FH
: np
->n_fhsize
;
845 bcopy(np
->n_fhp
, msg
->lm_fh
, msg
->lm_fh_len
);
846 cru2x(cred
, &msg
->lm_cred
);
848 msg
->lm_fl
.l_whence
= SEEK_SET
;
849 msg
->lm_fl
.l_start
= start
;
850 msg
->lm_fl
.l_len
= NFS_FLOCK_LENGTH(start
, end
);
851 msg
->lm_fl
.l_type
= F_UNLCK
;
852 msg
->lm_fl
.l_pid
= nlop
->nlo_pid
;
854 return nfs3_lockd_request(np
, F_UNLCK
, &msgreq
, flags
, thd
);
858 * Send an NLM LOCK TEST message to the server
863 struct nfs_lock_owner
*nlop
,
869 struct nfsmount
*nmp
;
871 LOCKD_MSG_REQUEST msgreq
;
875 if (nfs_mount_gone(nmp
)) {
879 /* set up lock message request structure */
880 bzero(&msgreq
, sizeof(msgreq
));
881 msg
= &msgreq
.lmr_msg
;
882 msg
->lm_version
= LOCKD_MSG_VERSION
;
883 msg
->lm_flags
|= LOCKD_MSG_TEST
;
884 msg
->lm_fh_len
= (nmp
->nm_vers
== NFS_VER2
) ? NFSX_V2FH
: np
->n_fhsize
;
885 bcopy(np
->n_fhp
, msg
->lm_fh
, msg
->lm_fh_len
);
886 cru2x(vfs_context_ucred(ctx
), &msg
->lm_cred
);
888 msg
->lm_fl
.l_whence
= SEEK_SET
;
889 msg
->lm_fl
.l_start
= start
;
890 msg
->lm_fl
.l_len
= NFS_FLOCK_LENGTH(start
, end
);
891 msg
->lm_fl
.l_type
= fl
->l_type
;
892 msg
->lm_fl
.l_pid
= nlop
->nlo_pid
;
894 error
= nfs3_lockd_request(np
, 0, &msgreq
, 0, vfs_context_thread(ctx
));
896 if (!error
&& (msg
->lm_flags
& LOCKD_MSG_TEST
) && !msgreq
.lmr_errno
) {
897 if (msg
->lm_fl
.l_type
!= F_UNLCK
) {
898 fl
->l_type
= msg
->lm_fl
.l_type
;
899 fl
->l_pid
= msg
->lm_fl
.l_pid
;
900 fl
->l_start
= msg
->lm_fl
.l_start
;
901 fl
->l_len
= msg
->lm_fl
.l_len
;
902 fl
->l_whence
= SEEK_SET
;
904 fl
->l_type
= F_UNLCK
;
913 * NFS advisory byte-level locks answer from the lock daemon.
/*
 * nfslockdans: accept an answer (struct lockd_ans) from the lock daemon
 * and record it on the matching pending request.
 *
 * Visible flow:
 *  - proc_suser(p) is consulted first, then ansp->la_version is compared
 *    against LOCKD_ANS_VERSION.
 *  - Under nfs_lock_mutex the request is looked up by ansp->la_xid.
 *  - For LOCKD_ANS_GRANTED answers, if nothing was found or the found
 *    request does not compare equal to the answer, the lookup is retried
 *    with nfs_lockdmsg_find_by_answer(); a request that has
 *    LOCKD_MSG_CANCEL set is then given special handling.
 *  - ansp->la_errno is copied into lmr_errno.
 *  - For LOCKD_MSG_TEST requests with errno 0, the request's lm_fl is
 *    updated from the answer: with LOCKD_ANS_LOCK_INFO the type becomes
 *    F_WRLCK or F_RDLCK depending on LOCKD_ANS_LOCK_EXCL and pid/start/len
 *    are copied; F_UNLCK is also assigned on one path.
 *  - LOCKD_ANS_DENIED_GRACE is mirrored into the request's lm_flags as
 *    LOCKD_MSG_DENIED_GRACE.
 *  - lmr_answered is set to 1 before the mutex is released.
 *
 * NOTE(review): the declaration of error, every return statement, the
 * else keywords, the handling inside the CANCEL branch and the not-found
 * branch, and whatever follows lmr_answered = 1 are not present in this
 * excerpt -- confirm against the complete file.
 */
916 nfslockdans(proc_t p
, struct lockd_ans
*ansp
)
918 LOCKD_MSG_REQUEST
*msgreq
;
921 /* Let root make this call. */
922 error
= proc_suser(p
);
927 /* the version should match, or we're out of sync */
928 if (ansp
->la_version
!= LOCKD_ANS_VERSION
) {
932 lck_mtx_lock(&nfs_lock_mutex
);
934 /* try to find the lockd message by transaction id (cookie) */
935 msgreq
= nfs_lockdmsg_find_by_xid(ansp
->la_xid
);
936 if (ansp
->la_flags
& LOCKD_ANS_GRANTED
) {
938 * We can't depend on the granted message having our cookie,
939 * so we check the answer against the lockd message found.
940 * If no message was found or it doesn't match the answer,
941 * we look for the lockd message by the answer's lock info.
943 if (!msgreq
|| nfs_lockdmsg_compare_to_answer(msgreq
, ansp
)) {
944 msgreq
= nfs_lockdmsg_find_by_answer(ansp
);
947 * We need to make sure this request isn't being cancelled
948 * If it is, we don't want to accept the granted message.
950 if (msgreq
&& (msgreq
->lmr_msg
.lm_flags
& LOCKD_MSG_CANCEL
)) {
955 lck_mtx_unlock(&nfs_lock_mutex
);
959 msgreq
->lmr_errno
= ansp
->la_errno
;
960 if ((msgreq
->lmr_msg
.lm_flags
& LOCKD_MSG_TEST
) && msgreq
->lmr_errno
== 0) {
961 if (ansp
->la_flags
& LOCKD_ANS_LOCK_INFO
) {
962 if (ansp
->la_flags
& LOCKD_ANS_LOCK_EXCL
) {
963 msgreq
->lmr_msg
.lm_fl
.l_type
= F_WRLCK
;
965 msgreq
->lmr_msg
.lm_fl
.l_type
= F_RDLCK
;
967 msgreq
->lmr_msg
.lm_fl
.l_pid
= ansp
->la_pid
;
968 msgreq
->lmr_msg
.lm_fl
.l_start
= ansp
->la_start
;
969 msgreq
->lmr_msg
.lm_fl
.l_len
= ansp
->la_len
;
971 msgreq
->lmr_msg
.lm_fl
.l_type
= F_UNLCK
;
974 if (ansp
->la_flags
& LOCKD_ANS_DENIED_GRACE
) {
975 msgreq
->lmr_msg
.lm_flags
|= LOCKD_MSG_DENIED_GRACE
;
978 msgreq
->lmr_answered
= 1;
979 lck_mtx_unlock(&nfs_lock_mutex
);
987 * NFS host restart notification from the lock daemon.
989 * Used to initiate reclaiming of held locks when a server we
990 * have mounted reboots.
/*
 * nfslockdnotify: take a host-restart notification from the lock daemon
 * and flag every registered mount whose server address matches.
 *
 * Visible flow:
 *  - proc_suser(p) is consulted first.
 *  - headsize is the byte distance from ln.ln_version to ln.ln_addr[0];
 *    that many bytes are copied in from argp to fill the fixed header.
 *  - ln.ln_version is compared against LOCKD_NOTIFY_VERSION and
 *    ln.ln_addrcount is range-checked against 1..128.
 *  - Under nfs_lock_mutex, each address is copied in one at a time into
 *    ln.ln_addr[0] (saddr aliases that slot) and argp is advanced by the
 *    size of one entry.
 *  - For each address, nfs_lockd_mount_list is scanned; mounts with no
 *    nm_saddr or for which nfs_sockaddr_cmp() is non-zero are treated
 *    differently from the rest, and nfs_need_recover(nmp, 0) is called
 *    with the mount's nm_lock held.
 *
 * NOTE(review): the return statements, the error checks after each
 * copyin, any adjustment of argp past the header, and the statements
 * inside the version/count/address-mismatch branches are not present in
 * this excerpt -- confirm against the complete file.
 */
993 nfslockdnotify(proc_t p
, user_addr_t argp
)
995 int error
, i
, headsize
;
996 struct lockd_notify ln
;
997 struct nfsmount
*nmp
;
998 struct sockaddr
*saddr
;
1000 /* Let root make this call. */
1001 error
= proc_suser(p
);
1006 headsize
= (char*)&ln
.ln_addr
[0] - (char*)&ln
.ln_version
;
1007 error
= copyin(argp
, &ln
, headsize
);
1011 if (ln
.ln_version
!= LOCKD_NOTIFY_VERSION
) {
1014 if ((ln
.ln_addrcount
< 1) || (ln
.ln_addrcount
> 128)) {
1018 saddr
= (struct sockaddr
*)&ln
.ln_addr
[0];
1020 lck_mtx_lock(&nfs_lock_mutex
);
1022 for (i
= 0; i
< ln
.ln_addrcount
; i
++) {
1023 error
= copyin(argp
, &ln
.ln_addr
[0], sizeof(ln
.ln_addr
[0]));
1027 argp
+= sizeof(ln
.ln_addr
[0]);
1028 /* scan lockd mount list for match to this address */
1029 TAILQ_FOREACH(nmp
, &nfs_lockd_mount_list
, nm_ldlink
) {
1030 /* check if address matches this mount's server address */
1031 if (!nmp
->nm_saddr
|| nfs_sockaddr_cmp(saddr
, nmp
->nm_saddr
)) {
1034 /* We have a match! Mark it as needing recovery. */
1035 lck_mtx_lock(&nmp
->nm_lock
);
1036 nfs_need_recover(nmp
, 0);
1037 lck_mtx_unlock(&nmp
->nm_lock
);
1041 lck_mtx_unlock(&nfs_lock_mutex
);
1046 #endif /* CONFIG_NFS_CLIENT */