]> git.saurik.com Git - apple/xnu.git/blame - bsd/nfs/nfs_node.c
xnu-2782.30.5.tar.gz
[apple/xnu.git] / bsd / nfs / nfs_node.c
CommitLineData
1c79356b 1/*
4b17d6b6 2 * Copyright (c) 2000-2013 Apple Inc. All rights reserved.
5d5c5d0d 3 *
2d21ac55 4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
1c79356b 5 *
2d21ac55
A
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
8f6c56a5 14 *
2d21ac55
A
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
8f6c56a5
A
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
2d21ac55
A
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
8f6c56a5 25 *
2d21ac55 26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
1c79356b
A
27 */
28/* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29/*
30 * Copyright (c) 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 *
33 * This code is derived from software contributed to Berkeley by
34 * Rick Macklem at The University of Guelph.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
51 *
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
63 *
64 * @(#)nfs_node.c 8.6 (Berkeley) 5/22/95
65 * FreeBSD-Id: nfs_node.c,v 1.22 1997/10/28 14:06:20 bde Exp $
66 */
67
68
69#include <sys/param.h>
b0d623f7 70#include <sys/kernel.h>
1c79356b
A
71#include <sys/systm.h>
72#include <sys/proc.h>
91447636
A
73#include <sys/kauth.h>
74#include <sys/mount_internal.h>
4b17d6b6 75#include <sys/vnode_internal.h>
1c79356b 76#include <sys/vnode.h>
91447636 77#include <sys/ubc.h>
1c79356b 78#include <sys/malloc.h>
6d2010ae 79#include <sys/fcntl.h>
316670eb 80#include <sys/time.h>
1c79356b
A
81
82#include <nfs/rpcv2.h>
83#include <nfs/nfsproto.h>
84#include <nfs/nfs.h>
85#include <nfs/nfsnode.h>
2d21ac55 86#include <nfs/nfs_gss.h>
1c79356b
A
87#include <nfs/nfsmount.h>
88
2d21ac55
A
89#define NFSNOHASH(fhsum) \
90 (&nfsnodehashtbl[(fhsum) & nfsnodehash])
91static LIST_HEAD(nfsnodehashhead, nfsnode) *nfsnodehashtbl;
92static u_long nfsnodehash;
1c79356b 93
2d21ac55
A
94static lck_grp_t *nfs_node_hash_lck_grp;
95static lck_grp_t *nfs_node_lck_grp;
b0d623f7 96static lck_grp_t *nfs_data_lck_grp;
91447636 97lck_mtx_t *nfs_node_hash_mutex;
1c79356b 98
39236c6e
A
99#define NFS_NODE_DBG(...) NFS_DBG(NFS_FAC_NODE, 7, ## __VA_ARGS__)
100
1c79356b
A
101/*
102 * Initialize hash links for nfsnodes
103 * and build nfsnode free list.
104 */
105void
e5568f75 106nfs_nhinit(void)
1c79356b 107{
2d21ac55
A
108 nfs_node_hash_lck_grp = lck_grp_alloc_init("nfs_node_hash", LCK_GRP_ATTR_NULL);
109 nfs_node_hash_mutex = lck_mtx_alloc_init(nfs_node_hash_lck_grp, LCK_ATTR_NULL);
110 nfs_node_lck_grp = lck_grp_alloc_init("nfs_node", LCK_GRP_ATTR_NULL);
b0d623f7 111 nfs_data_lck_grp = lck_grp_alloc_init("nfs_data", LCK_GRP_ATTR_NULL);
2d21ac55 112}
91447636 113
2d21ac55
A
114void
115nfs_nhinit_finish(void)
116{
117 lck_mtx_lock(nfs_node_hash_mutex);
118 if (!nfsnodehashtbl)
119 nfsnodehashtbl = hashinit(desiredvnodes, M_NFSNODE, &nfsnodehash);
120 lck_mtx_unlock(nfs_node_hash_mutex);
1c79356b
A
121}
122
123/*
124 * Compute an entry in the NFS hash table structure
125 */
126u_long
91447636 127nfs_hash(u_char *fhp, int fhsize)
1c79356b 128{
91447636
A
129 u_long fhsum;
130 int i;
1c79356b 131
1c79356b
A
132 fhsum = 0;
133 for (i = 0; i < fhsize; i++)
91447636 134 fhsum += *fhp++;
1c79356b
A
135 return (fhsum);
136}
137
4b17d6b6
A
138
139int nfs_case_insensitive(mount_t);
140
141int
142nfs_case_insensitive(mount_t mp)
143{
144 struct nfsmount *nmp = VFSTONFS(mp);
145 int answer = 0;
146 int skip = 0;
147
fe8ab488 148 if (nfs_mount_gone(nmp)) {
4b17d6b6
A
149 return (0);
150 }
151
152 if (nmp->nm_vers == NFS_VER2) {
153 /* V2 has no way to know */
154 return (0);
155 }
156
157 lck_mtx_lock(&nmp->nm_lock);
158 if (nmp->nm_vers == NFS_VER3) {
159 if (!(nmp->nm_state & NFSSTA_GOTPATHCONF)) {
160 /* We're holding the node lock so we just return
161 * with answer as case sensitive. Is very rare
162 * for file systems not to be homogenous w.r.t. pathconf
163 */
164 skip = 1;
165 }
166 } else if (!(nmp->nm_fsattr.nfsa_flags & NFS_FSFLAG_HOMOGENEOUS)) {
167 /* no pathconf info cached */
168 skip = 1;
169 }
170
171 if (!skip && NFS_BITMAP_ISSET(nmp->nm_fsattr.nfsa_bitmap, NFS_FATTR_CASE_INSENSITIVE))
172 answer = 1;
173
174 lck_mtx_unlock(&nmp->nm_lock);
175
176 return (answer);
177}
178
179
1c79356b
A
180/*
181 * Look up a vnode/nfsnode by file handle.
182 * Callers must check for mount points!!
183 * In all cases, a pointer to a
184 * nfsnode structure is returned.
185 */
1c79356b 186int
91447636 187nfs_nget(
2d21ac55
A
188 mount_t mp,
189 nfsnode_t dnp,
91447636
A
190 struct componentname *cnp,
191 u_char *fhp,
192 int fhsize,
193 struct nfs_vattr *nvap,
194 u_int64_t *xidp,
6d2010ae 195 uint32_t auth,
91447636 196 int flags,
2d21ac55 197 nfsnode_t *npp)
1c79356b 198{
2d21ac55 199 nfsnode_t np;
1c79356b 200 struct nfsnodehashhead *nhpp;
2d21ac55
A
201 vnode_t vp;
202 int error, nfsvers;
203 mount_t mp2;
91447636
A
204 struct vnode_fsparam vfsp;
205 uint32_t vid;
1c79356b 206
2d21ac55
A
207 FSDBG_TOP(263, mp, dnp, flags, npp);
208
1c79356b 209 /* Check for unmount in progress */
fe8ab488 210 if (!mp || vfs_isforce(mp)) {
2d21ac55
A
211 *npp = NULL;
212 error = ENXIO;
213 FSDBG_BOT(263, mp, dnp, 0xd1e, error);
214 return (error);
1c79356b 215 }
2d21ac55 216 nfsvers = VFSTONFS(mp)->nm_vers;
1c79356b
A
217
218 nhpp = NFSNOHASH(nfs_hash(fhp, fhsize));
219loop:
91447636 220 lck_mtx_lock(nfs_node_hash_mutex);
1c79356b 221 for (np = nhpp->lh_first; np != 0; np = np->n_hash.le_next) {
2d21ac55
A
222 mp2 = (np->n_hflag & NHINIT) ? np->n_mount : NFSTOMP(np);
223 if (mp != mp2 || np->n_fhsize != fhsize ||
91447636 224 bcmp(fhp, np->n_fhp, fhsize))
1c79356b 225 continue;
6d2010ae
A
226 if (nvap && (nvap->nva_flags & NFS_FFLAG_TRIGGER_REFERRAL) &&
227 cnp && (cnp->cn_namelen > (fhsize - (int)sizeof(dnp)))) {
228 /* The name was too long to fit in the file handle. Check it against the node's name. */
229 int namecmp = 0;
230 const char *vname = vnode_getname(NFSTOV(np));
231 if (vname) {
232 if (cnp->cn_namelen != (int)strlen(vname))
233 namecmp = 1;
234 else
235 namecmp = strncmp(vname, cnp->cn_nameptr, cnp->cn_namelen);
236 vnode_putname(vname);
237 }
238 if (namecmp) /* full name didn't match */
239 continue;
240 }
2d21ac55
A
241 FSDBG(263, dnp, np, np->n_flag, 0xcace0000);
242 /* if the node is locked, sleep on it */
b0d623f7 243 if ((np->n_hflag & NHLOCKED) && !(flags & NG_NOCREATE)) {
2d21ac55
A
244 np->n_hflag |= NHLOCKWANT;
245 FSDBG(263, dnp, np, np->n_flag, 0xcace2222);
246 msleep(np, nfs_node_hash_mutex, PDROP | PINOD, "nfs_nget", NULL);
247 FSDBG(263, dnp, np, np->n_flag, 0xcace3333);
55e303ae
A
248 goto loop;
249 }
1c79356b 250 vp = NFSTOV(np);
91447636
A
251 vid = vnode_vid(vp);
252 lck_mtx_unlock(nfs_node_hash_mutex);
253 if ((error = vnode_getwithvid(vp, vid))) {
254 /*
255 * If vnode is being reclaimed or has already
256 * changed identity, no need to wait.
257 */
2d21ac55 258 FSDBG_BOT(263, dnp, *npp, 0xcace0d1e, error);
91447636 259 return (error);
2d21ac55 260 }
b0d623f7 261 if ((error = nfs_node_lock(np))) {
2d21ac55
A
262 /* this only fails if the node is now unhashed */
263 /* so let's see if we can find/create it again */
264 FSDBG(263, dnp, *npp, 0xcaced1e2, error);
265 vnode_put(vp);
b0d623f7
A
266 if (flags & NG_NOCREATE) {
267 *npp = 0;
268 FSDBG_BOT(263, dnp, *npp, 0xcaced1e0, ENOENT);
269 return (ENOENT);
270 }
2d21ac55
A
271 goto loop;
272 }
91447636 273 /* update attributes */
b0d623f7
A
274 if (nvap)
275 error = nfs_loadattrcache(np, nvap, xidp, 0);
91447636 276 if (error) {
b0d623f7 277 nfs_node_unlock(np);
91447636
A
278 vnode_put(vp);
279 } else {
2d21ac55
A
280 if (dnp && cnp && (flags & NG_MAKEENTRY))
281 cache_enter(NFSTOV(dnp), vp, cnp);
4b17d6b6
A
282 /*
283 * Update the vnode if the name/and or the parent has
284 * changed. We need to do this so that if getattrlist is
285 * called asking for ATTR_CMN_NAME, that the "most"
39236c6e
A
286 * correct name is being returned. In addition for
287 * monitored vnodes we need to kick the vnode out of the
288 * name cache. We do this so that if there are hard
289 * links in the same directory the link will not be
290 * found and a lookup will get us here to return the
291 * name of the current link. In addition by removing the
292 * name from the name cache the old name will not be
293 * found after a rename done on another client or the
294 * server. The principle reason to do this is because
295 * Finder is asking for notifications on a directory.
296 * The directory changes, Finder gets notified, reads
297 * the directory (which we have purged) and for each
298 * entry returned calls getattrlist with the name
299 * returned from readdir. gettattrlist has to call
300 * namei/lookup to resolve the name, because its not in
301 * the cache we end up here. We need to update the name
302 * so Finder will get the name it called us with.
4b17d6b6
A
303 *
304 * We had an imperfect solution with respect to case
305 * sensitivity. There is a test that is run in
306 * FileBuster that does renames from some name to
307 * another name differing only in case. It then reads
308 * the directory looking for the new name, after it
309 * finds that new name, it ask gettattrlist to verify
310 * that the name is the new name. Usually that works,
311 * but renames generate fsevents and fseventsd will do a
312 * lookup on the name via lstat. Since that test renames
313 * old name to new name back and forth there is a race
314 * that an fsevent will be behind and will access the
315 * file by the old name, on a case insensitive file
316 * system that will work. Problem is if we do a case
317 * sensitive compare, we're going to change the name,
318 * which the test's getattrlist verification step is
319 * going to fail. So we will check the case sensitivity
320 * of the file system and do the appropriate compare. In
321 * a rare instance for non homogeneous file systems
322 * w.r.t. pathconf we will use case sensitive compares.
323 * That could break if the file system is actually case
324 * insensitive.
325 *
326 * Note that V2 does not know the case, so we just
327 * assume case sensitivity.
328 *
329 * This is clearly not perfect due to races, but this is
330 * as good as its going to get. You can defeat the
331 * handling of hard links simply by doing:
332 *
333 * while :; do ls -l > /dev/null; done
334 *
335 * in a terminal window. Even a single ls -l can cause a
336 * race.
337 *
338 * <rant>What we really need is for the caller, that
339 * knows the name being used is valid since it got it
340 * from a readdir to use that name and not ask for the
341 * ATTR_CMN_NAME</rant>
342 */
343 if (dnp && cnp && (vp != NFSTOV(dnp))) {
39236c6e 344 int update_flags = (vnode_ismonitored((NFSTOV(dnp)))) ? VNODE_UPDATE_CACHE : 0;
4b17d6b6
A
345 int (*cmp)(const char *s1, const char *s2, size_t n);
346
347 cmp = nfs_case_insensitive(mp) ? strncasecmp : strncmp;
348
349 if (vp->v_name && cnp->cn_namelen && (*cmp)(cnp->cn_nameptr, vp->v_name, cnp->cn_namelen))
350 update_flags |= VNODE_UPDATE_NAME;
351 if ((vp->v_name == NULL && cnp->cn_namelen != 0) || (vp->v_name != NULL && cnp->cn_namelen == 0))
352 update_flags |= VNODE_UPDATE_NAME;
353 if (vnode_parent(vp) != NFSTOV(dnp))
354 update_flags |= VNODE_UPDATE_PARENT;
39236c6e
A
355 if (update_flags) {
356 NFS_NODE_DBG("vnode_update_identity old name %s new name %*s\n",
357 vp->v_name, cnp->cn_namelen, cnp->cn_nameptr ? cnp->cn_nameptr : "");
4b17d6b6 358 vnode_update_identity(vp, NFSTOV(dnp), cnp->cn_nameptr, cnp->cn_namelen, 0, update_flags);
39236c6e 359 }
4b17d6b6
A
360 }
361
91447636 362 *npp = np;
1c79356b 363 }
2d21ac55 364 FSDBG_BOT(263, dnp, *npp, 0xcace0000, error);
91447636 365 return(error);
1c79356b 366 }
1c79356b 367
2d21ac55
A
368 FSDBG(263, mp, dnp, npp, 0xaaaaaaaa);
369
b0d623f7
A
370 if (flags & NG_NOCREATE) {
371 lck_mtx_unlock(nfs_node_hash_mutex);
372 *npp = 0;
373 FSDBG_BOT(263, dnp, *npp, 0x80000001, ENOENT);
374 return (ENOENT);
375 }
376
1c79356b 377 /*
55e303ae
A
378 * allocate and initialize nfsnode and stick it in the hash
379 * before calling getnewvnode(). Anyone finding it in the
380 * hash before initialization is complete will wait for it.
1c79356b 381 */
2d21ac55 382 MALLOC_ZONE(np, nfsnode_t, sizeof *np, M_NFSNODE, M_WAITOK);
91447636
A
383 if (!np) {
384 lck_mtx_unlock(nfs_node_hash_mutex);
385 *npp = 0;
2d21ac55 386 FSDBG_BOT(263, dnp, *npp, 0x80000001, ENOMEM);
91447636
A
387 return (ENOMEM);
388 }
2d21ac55
A
389 bzero(np, sizeof *np);
390 np->n_hflag |= (NHINIT | NHLOCKED);
391 np->n_mount = mp;
6d2010ae 392 np->n_auth = auth;
b0d623f7
A
393 TAILQ_INIT(&np->n_opens);
394 TAILQ_INIT(&np->n_lock_owners);
395 TAILQ_INIT(&np->n_locks);
396 np->n_dlink.tqe_next = NFSNOLIST;
6d2010ae
A
397 np->n_dreturn.tqe_next = NFSNOLIST;
398 np->n_monlink.le_next = NFSNOLIST;
399
400 /* ugh... need to keep track of ".zfs" directories to workaround server bugs */
401 if ((nvap->nva_type == VDIR) && cnp && (cnp->cn_namelen == 4) &&
402 (cnp->cn_nameptr[0] == '.') && (cnp->cn_nameptr[1] == 'z') &&
403 (cnp->cn_nameptr[2] == 'f') && (cnp->cn_nameptr[3] == 's'))
404 np->n_flag |= NISDOTZFS;
405 if (dnp && (dnp->n_flag & NISDOTZFS))
406 np->n_flag |= NISDOTZFSCHILD;
2d21ac55
A
407
408 if (dnp && cnp && ((cnp->cn_namelen != 2) ||
409 (cnp->cn_nameptr[0] != '.') || (cnp->cn_nameptr[1] != '.'))) {
410 vnode_t dvp = NFSTOV(dnp);
411 if (!vnode_get(dvp)) {
412 if (!vnode_ref(dvp))
413 np->n_parent = dvp;
414 vnode_put(dvp);
415 }
416 }
55e303ae 417
91447636 418 /* setup node's file handle */
1c79356b 419 if (fhsize > NFS_SMALLFH) {
91447636 420 MALLOC_ZONE(np->n_fhp, u_char *,
1c79356b 421 fhsize, M_NFSBIGFH, M_WAITOK);
91447636
A
422 if (!np->n_fhp) {
423 lck_mtx_unlock(nfs_node_hash_mutex);
424 FREE_ZONE(np, sizeof *np, M_NFSNODE);
425 *npp = 0;
2d21ac55 426 FSDBG_BOT(263, dnp, *npp, 0x80000002, ENOMEM);
91447636
A
427 return (ENOMEM);
428 }
429 } else {
430 np->n_fhp = &np->n_fh[0];
431 }
432 bcopy(fhp, np->n_fhp, fhsize);
1c79356b 433 np->n_fhsize = fhsize;
91447636
A
434
435 /* Insert the nfsnode in the hash queue for its new file handle */
91447636 436 LIST_INSERT_HEAD(nhpp, np, n_hash);
2d21ac55
A
437 np->n_hflag |= NHHASHED;
438 FSDBG(266, 0, np, np->n_flag, np->n_hflag);
439
440 /* lock the new nfsnode */
b0d623f7
A
441 lck_mtx_init(&np->n_lock, nfs_node_lck_grp, LCK_ATTR_NULL);
442 lck_rw_init(&np->n_datalock, nfs_data_lck_grp, LCK_ATTR_NULL);
443 lck_mtx_init(&np->n_openlock, nfs_open_grp, LCK_ATTR_NULL);
444 lck_mtx_lock(&np->n_lock);
1c79356b 445
55e303ae 446 /* release lock on hash table */
91447636
A
447 lck_mtx_unlock(nfs_node_hash_mutex);
448
449 /* do initial loading of attributes */
6d2010ae
A
450 NACLINVALIDATE(np);
451 NACCESSINVALIDATE(np);
91447636
A
452 error = nfs_loadattrcache(np, nvap, xidp, 1);
453 if (error) {
2d21ac55 454 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
b0d623f7 455 nfs_node_unlock(np);
91447636
A
456 lck_mtx_lock(nfs_node_hash_mutex);
457 LIST_REMOVE(np, n_hash);
2d21ac55
A
458 np->n_hflag &= ~(NHHASHED|NHINIT|NHLOCKED);
459 if (np->n_hflag & NHLOCKWANT) {
460 np->n_hflag &= ~NHLOCKWANT;
461 wakeup(np);
91447636
A
462 }
463 lck_mtx_unlock(nfs_node_hash_mutex);
2d21ac55
A
464 if (np->n_parent) {
465 if (!vnode_get(np->n_parent)) {
466 vnode_rele(np->n_parent);
467 vnode_put(np->n_parent);
468 }
469 np->n_parent = NULL;
470 }
b0d623f7
A
471 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
472 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
473 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
91447636
A
474 if (np->n_fhsize > NFS_SMALLFH)
475 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
476 FREE_ZONE(np, sizeof *np, M_NFSNODE);
477 *npp = 0;
2d21ac55 478 FSDBG_BOT(263, dnp, *npp, 0x80000003, error);
91447636
A
479 return (error);
480 }
2d21ac55 481 NFS_CHANGED_UPDATE(nfsvers, np, nvap);
91447636 482 if (nvap->nva_type == VDIR)
2d21ac55 483 NFS_CHANGED_UPDATE_NC(nfsvers, np, nvap);
1c79356b 484
55e303ae 485 /* now, attempt to get a new vnode */
2d21ac55 486 vfsp.vnfs_mp = mp;
91447636
A
487 vfsp.vnfs_vtype = nvap->nva_type;
488 vfsp.vnfs_str = "nfs";
2d21ac55 489 vfsp.vnfs_dvp = dnp ? NFSTOV(dnp) : NULL;
91447636 490 vfsp.vnfs_fsnode = np;
2d21ac55
A
491 if (nfsvers == NFS_VER4) {
492#if FIFO
493 if (nvap->nva_type == VFIFO)
494 vfsp.vnfs_vops = fifo_nfsv4nodeop_p;
495 else
496#endif /* FIFO */
497 if (nvap->nva_type == VBLK || nvap->nva_type == VCHR)
498 vfsp.vnfs_vops = spec_nfsv4nodeop_p;
499 else
500 vfsp.vnfs_vops = nfsv4_vnodeop_p;
501 } else {
502#if FIFO
503 if (nvap->nva_type == VFIFO)
504 vfsp.vnfs_vops = fifo_nfsv2nodeop_p;
505 else
506#endif /* FIFO */
507 if (nvap->nva_type == VBLK || nvap->nva_type == VCHR)
508 vfsp.vnfs_vops = spec_nfsv2nodeop_p;
509 else
510 vfsp.vnfs_vops = nfsv2_vnodeop_p;
511 }
91447636
A
512 vfsp.vnfs_markroot = (flags & NG_MARKROOT) ? 1 : 0;
513 vfsp.vnfs_marksystem = 0;
514 vfsp.vnfs_rdev = 0;
515 vfsp.vnfs_filesize = nvap->nva_size;
516 vfsp.vnfs_cnp = cnp;
2d21ac55
A
517 vfsp.vnfs_flags = VNFS_ADDFSREF;
518 if (!dnp || !cnp || !(flags & NG_MAKEENTRY))
519 vfsp.vnfs_flags |= VNFS_NOCACHE;
520
6d2010ae
A
521#if CONFIG_TRIGGERS
522 if ((nfsvers >= NFS_VER4) && (nvap->nva_type == VDIR) && (np->n_vattr.nva_flags & NFS_FFLAG_TRIGGER)) {
523 struct vnode_trigger_param vtp;
524 bzero(&vtp, sizeof(vtp));
525 bcopy(&vfsp, &vtp.vnt_params, sizeof(vfsp));
526 vtp.vnt_resolve_func = nfs_mirror_mount_trigger_resolve;
527 vtp.vnt_unresolve_func = nfs_mirror_mount_trigger_unresolve;
528 vtp.vnt_rearm_func = nfs_mirror_mount_trigger_rearm;
529 vtp.vnt_flags = VNT_AUTO_REARM;
530 error = vnode_create(VNCREATE_TRIGGER, VNCREATE_TRIGGER_SIZE, &vtp, &np->n_vnode);
531 } else
532#endif
533 {
534 error = vnode_create(VNCREATE_FLAVOR, VCREATESIZE, &vfsp, &np->n_vnode);
535 }
55e303ae 536 if (error) {
2d21ac55 537 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
b0d623f7 538 nfs_node_unlock(np);
91447636 539 lck_mtx_lock(nfs_node_hash_mutex);
55e303ae 540 LIST_REMOVE(np, n_hash);
2d21ac55
A
541 np->n_hflag &= ~(NHHASHED|NHINIT|NHLOCKED);
542 if (np->n_hflag & NHLOCKWANT) {
543 np->n_hflag &= ~NHLOCKWANT;
544 wakeup(np);
91447636
A
545 }
546 lck_mtx_unlock(nfs_node_hash_mutex);
2d21ac55
A
547 if (np->n_parent) {
548 if (!vnode_get(np->n_parent)) {
549 vnode_rele(np->n_parent);
550 vnode_put(np->n_parent);
551 }
552 np->n_parent = NULL;
553 }
b0d623f7
A
554 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
555 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
556 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
55e303ae 557 if (np->n_fhsize > NFS_SMALLFH)
91447636 558 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
55e303ae
A
559 FREE_ZONE(np, sizeof *np, M_NFSNODE);
560 *npp = 0;
2d21ac55 561 FSDBG_BOT(263, dnp, *npp, 0x80000004, error);
55e303ae
A
562 return (error);
563 }
2d21ac55
A
564 vp = np->n_vnode;
565 vnode_settag(vp, VT_NFS);
91447636 566 /* node is now initialized */
55e303ae 567
91447636
A
568 /* check if anyone's waiting on this node */
569 lck_mtx_lock(nfs_node_hash_mutex);
2d21ac55
A
570 np->n_hflag &= ~(NHINIT|NHLOCKED);
571 if (np->n_hflag & NHLOCKWANT) {
572 np->n_hflag &= ~NHLOCKWANT;
573 wakeup(np);
55e303ae 574 }
91447636 575 lck_mtx_unlock(nfs_node_hash_mutex);
1c79356b 576
2d21ac55
A
577 *npp = np;
578
579 FSDBG_BOT(263, dnp, vp, *npp, error);
fa4905b1 580 return (error);
1c79356b
A
581}
582
91447636 583
1c79356b 584int
2d21ac55 585nfs_vnop_inactive(ap)
91447636
A
586 struct vnop_inactive_args /* {
587 struct vnodeop_desc *a_desc;
588 vnode_t a_vp;
589 vfs_context_t a_context;
1c79356b
A
590 } */ *ap;
591{
b0d623f7
A
592 vnode_t vp = ap->a_vp;
593 vfs_context_t ctx = ap->a_context;
39236c6e 594 nfsnode_t np;
2d21ac55
A
595 struct nfs_sillyrename *nsp;
596 struct nfs_vattr nvattr;
6d2010ae 597 int unhash, attrerr, busyerror, error, inuse, busied, force;
b0d623f7 598 struct nfs_open_file *nofp;
b0d623f7 599 struct componentname cn;
39236c6e
A
600 struct nfsmount *nmp;
601 mount_t mp;
602
603 if (vp == NULL)
604 panic("nfs_vnop_inactive: vp == NULL");
605 np = VTONFS(vp);
606 if (np == NULL)
607 panic("nfs_vnop_inactive: np == NULL");
608
609 nmp = NFSTONMP(np);
610 mp = vnode_mount(vp);
b0d623f7
A
611
612restart:
fe8ab488 613 force = (!mp || vfs_isforce(mp));
b0d623f7 614 error = 0;
6d2010ae 615 inuse = (nfs_mount_state_in_use_start(nmp, NULL) == 0);
b0d623f7
A
616
617 /* There shouldn't be any open or lock state at this point */
618 lck_mtx_lock(&np->n_openlock);
39236c6e
A
619 if (np->n_openrefcnt && !force) {
620 /*
621 * vnode_rele and vnode_put drop the vnode lock before
622 * calling VNOP_INACTIVE, so there is a race were the
623 * vnode could become active again. Perhaps there are
624 * other places where this can happen, so if we've got
625 * here we need to get out.
626 */
627#ifdef NFS_NODE_DEBUG
6d2010ae 628 NP(np, "nfs_vnop_inactive: still open: %d", np->n_openrefcnt);
39236c6e
A
629#endif
630 lck_mtx_unlock(&np->n_openlock);
631 return 0;
632 }
633
b0d623f7
A
634 TAILQ_FOREACH(nofp, &np->n_opens, nof_link) {
635 lck_mtx_lock(&nofp->nof_lock);
636 if (nofp->nof_flags & NFS_OPEN_FILE_BUSY) {
6d2010ae
A
637 if (!force)
638 NP(np, "nfs_vnop_inactive: open file busy");
b0d623f7
A
639 busied = 0;
640 } else {
641 nofp->nof_flags |= NFS_OPEN_FILE_BUSY;
642 busied = 1;
643 }
644 lck_mtx_unlock(&nofp->nof_lock);
6d2010ae
A
645 if ((np->n_flag & NREVOKE) || (nofp->nof_flags & NFS_OPEN_FILE_LOST)) {
646 if (busied)
647 nfs_open_file_clear_busy(nofp);
648 continue;
649 }
b0d623f7
A
650 /*
651 * If we just created the file, we already had it open in
652 * anticipation of getting a subsequent open call. If the
653 * node has gone inactive without being open, we need to
654 * clean up (close) the open done in the create.
655 */
6d2010ae 656 if ((nofp->nof_flags & NFS_OPEN_FILE_CREATE) && nofp->nof_creator && !force) {
b0d623f7
A
657 if (nofp->nof_flags & NFS_OPEN_FILE_REOPEN) {
658 lck_mtx_unlock(&np->n_openlock);
659 if (busied)
660 nfs_open_file_clear_busy(nofp);
661 if (inuse)
662 nfs_mount_state_in_use_end(nmp, 0);
6d2010ae
A
663 if (!nfs4_reopen(nofp, NULL))
664 goto restart;
b0d623f7
A
665 }
666 nofp->nof_flags &= ~NFS_OPEN_FILE_CREATE;
667 lck_mtx_unlock(&np->n_openlock);
6d2010ae 668 error = nfs_close(np, nofp, NFS_OPEN_SHARE_ACCESS_BOTH, NFS_OPEN_SHARE_DENY_NONE, ctx);
b0d623f7 669 if (error) {
6d2010ae 670 NP(np, "nfs_vnop_inactive: create close error: %d", error);
b0d623f7
A
671 nofp->nof_flags |= NFS_OPEN_FILE_CREATE;
672 }
673 if (busied)
674 nfs_open_file_clear_busy(nofp);
675 if (inuse)
676 nfs_mount_state_in_use_end(nmp, error);
677 goto restart;
678 }
679 if (nofp->nof_flags & NFS_OPEN_FILE_NEEDCLOSE) {
680 /*
681 * If the file is marked as needing reopen, but this was the only
682 * open on the file, just drop the open.
683 */
684 nofp->nof_flags &= ~NFS_OPEN_FILE_NEEDCLOSE;
685 if ((nofp->nof_flags & NFS_OPEN_FILE_REOPEN) && (nofp->nof_opencnt == 1)) {
686 nofp->nof_flags &= ~NFS_OPEN_FILE_REOPEN;
687 nofp->nof_r--;
688 nofp->nof_opencnt--;
689 nofp->nof_access = 0;
6d2010ae 690 } else if (!force) {
b0d623f7
A
691 lck_mtx_unlock(&np->n_openlock);
692 if (nofp->nof_flags & NFS_OPEN_FILE_REOPEN) {
693 if (busied)
694 nfs_open_file_clear_busy(nofp);
695 if (inuse)
696 nfs_mount_state_in_use_end(nmp, 0);
6d2010ae
A
697 if (!nfs4_reopen(nofp, NULL))
698 goto restart;
b0d623f7 699 }
6d2010ae 700 error = nfs_close(np, nofp, NFS_OPEN_SHARE_ACCESS_READ, NFS_OPEN_SHARE_DENY_NONE, ctx);
b0d623f7 701 if (error) {
6d2010ae 702 NP(np, "nfs_vnop_inactive: need close error: %d", error);
b0d623f7
A
703 nofp->nof_flags |= NFS_OPEN_FILE_NEEDCLOSE;
704 }
705 if (busied)
706 nfs_open_file_clear_busy(nofp);
707 if (inuse)
708 nfs_mount_state_in_use_end(nmp, error);
709 goto restart;
710 }
711 }
6d2010ae
A
712 if (nofp->nof_opencnt && !force)
713 NP(np, "nfs_vnop_inactive: file still open: %d", nofp->nof_opencnt);
714 if (!force && (nofp->nof_access || nofp->nof_deny ||
b0d623f7
A
715 nofp->nof_mmap_access || nofp->nof_mmap_deny ||
716 nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
717 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
6d2010ae
A
718 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw ||
719 nofp->nof_d_r || nofp->nof_d_w || nofp->nof_d_rw ||
720 nofp->nof_d_r_dw || nofp->nof_d_w_dw || nofp->nof_d_rw_dw ||
721 nofp->nof_d_r_drw || nofp->nof_d_w_drw || nofp->nof_d_rw_drw)) {
722 NP(np, "nfs_vnop_inactive: non-zero access: %d %d %d %d # %u.%u %u.%u %u.%u dw %u.%u %u.%u %u.%u drw %u.%u %u.%u %u.%u",
b0d623f7
A
723 nofp->nof_access, nofp->nof_deny,
724 nofp->nof_mmap_access, nofp->nof_mmap_deny,
6d2010ae
A
725 nofp->nof_r, nofp->nof_d_r,
726 nofp->nof_w, nofp->nof_d_w,
727 nofp->nof_rw, nofp->nof_d_rw,
728 nofp->nof_r_dw, nofp->nof_d_r_dw,
729 nofp->nof_w_dw, nofp->nof_d_w_dw,
730 nofp->nof_rw_dw, nofp->nof_d_rw_dw,
731 nofp->nof_r_drw, nofp->nof_d_r_drw,
732 nofp->nof_w_drw, nofp->nof_d_w_drw,
733 nofp->nof_rw_drw, nofp->nof_d_rw_drw);
b0d623f7
A
734 }
735 if (busied)
736 nfs_open_file_clear_busy(nofp);
737 }
738 lck_mtx_unlock(&np->n_openlock);
1c79356b 739
b0d623f7
A
740 if (inuse && nfs_mount_state_in_use_end(nmp, error))
741 goto restart;
2d21ac55 742
b0d623f7 743 nfs_node_lock_force(np);
2d21ac55
A
744
745 if (vnode_vtype(vp) != VDIR) {
b0d623f7 746 nsp = np->n_sillyrename;
2d21ac55 747 np->n_sillyrename = NULL;
b0d623f7 748 } else {
2d21ac55 749 nsp = NULL;
b0d623f7 750 }
1c79356b 751
2d21ac55
A
752 FSDBG_TOP(264, vp, np, np->n_flag, nsp);
753
754 if (!nsp) {
755 /* no silly file to clean up... */
756 /* clear all flags other than these */
757 np->n_flag &= (NMODIFIED);
b0d623f7 758 nfs_node_unlock(np);
2d21ac55
A
759 FSDBG_BOT(264, vp, np, np->n_flag, 0);
760 return (0);
761 }
b0d623f7 762 nfs_node_unlock(np);
2d21ac55
A
763
764 /* Remove the silly file that was rename'd earlier */
765
766 /* flush all the buffers */
b0d623f7 767 nfs_vinvalbuf2(vp, V_SAVE, vfs_context_thread(ctx), nsp->nsr_cred, 1);
2d21ac55
A
768
769 /* try to get the latest attributes */
b0d623f7 770 attrerr = nfs_getattr(np, &nvattr, ctx, NGA_UNCACHED);
2d21ac55
A
771
772 /* Check if we should remove it from the node hash. */
773 /* Leave it if inuse or it has multiple hard links. */
774 if (vnode_isinuse(vp, 0) || (!attrerr && (nvattr.nva_nlink > 1))) {
775 unhash = 0;
776 } else {
777 unhash = 1;
778 ubc_setsize(vp, 0);
779 }
780
b0d623f7
A
781 /* mark this node and the directory busy while we do the remove */
782 busyerror = nfs_node_set_busy2(nsp->nsr_dnp, np, vfs_context_thread(ctx));
2d21ac55
A
783
784 /* lock the node while we remove the silly file */
785 lck_mtx_lock(nfs_node_hash_mutex);
786 while (np->n_hflag & NHLOCKED) {
787 np->n_hflag |= NHLOCKWANT;
788 msleep(np, nfs_node_hash_mutex, PINOD, "nfs_inactive", NULL);
789 }
790 np->n_hflag |= NHLOCKED;
791 lck_mtx_unlock(nfs_node_hash_mutex);
792
b0d623f7
A
793 /* purge the name cache to deter others from finding it */
794 bzero(&cn, sizeof(cn));
795 cn.cn_nameptr = nsp->nsr_name;
796 cn.cn_namelen = nsp->nsr_namlen;
797 nfs_name_cache_purge(nsp->nsr_dnp, np, &cn, ctx);
2d21ac55
A
798
799 FSDBG(264, np, np->n_size, np->n_vattr.nva_size, 0xf00d00f1);
800
801 /* now remove the silly file */
802 nfs_removeit(nsp);
803
804 /* clear all flags other than these */
b0d623f7 805 nfs_node_lock_force(np);
2d21ac55 806 np->n_flag &= (NMODIFIED);
b0d623f7
A
807 nfs_node_unlock(np);
808
809 if (!busyerror)
810 nfs_node_clear_busy2(nsp->nsr_dnp, np);
2d21ac55
A
811
812 if (unhash && vnode_isinuse(vp, 0)) {
813 /* vnode now inuse after silly remove? */
814 unhash = 0;
815 ubc_setsize(vp, np->n_size);
816 }
817
818 lck_mtx_lock(nfs_node_hash_mutex);
819 if (unhash) {
55e303ae
A
820 /*
821 * remove nfsnode from hash now so we can't accidentally find it
822 * again if another object gets created with the same filehandle
823 * before this vnode gets reclaimed
824 */
2d21ac55
A
825 if (np->n_hflag & NHHASHED) {
826 LIST_REMOVE(np, n_hash);
827 np->n_hflag &= ~NHHASHED;
828 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
1c79356b 829 }
2d21ac55 830 vnode_recycle(vp);
1c79356b 831 }
2d21ac55
A
832 /* unlock the node */
833 np->n_hflag &= ~NHLOCKED;
834 if (np->n_hflag & NHLOCKWANT) {
835 np->n_hflag &= ~NHLOCKWANT;
836 wakeup(np);
837 }
838 lck_mtx_unlock(nfs_node_hash_mutex);
839
840 /* cleanup sillyrename info */
841 if (nsp->nsr_cred != NOCRED)
842 kauth_cred_unref(&nsp->nsr_cred);
843 vnode_rele(NFSTOV(nsp->nsr_dnp));
844 FREE_ZONE(nsp, sizeof(*nsp), M_NFSREQ);
845
846 FSDBG_BOT(264, vp, np, np->n_flag, 0);
1c79356b
A
847 return (0);
848}
849
850/*
851 * Reclaim an nfsnode so that it can be used for other purposes.
852 */
853int
2d21ac55 854nfs_vnop_reclaim(ap)
91447636
A
855 struct vnop_reclaim_args /* {
856 struct vnodeop_desc *a_desc;
857 vnode_t a_vp;
858 vfs_context_t a_context;
1c79356b
A
859 } */ *ap;
860{
91447636 861 vnode_t vp = ap->a_vp;
2d21ac55 862 nfsnode_t np = VTONFS(vp);
b0d623f7
A
863 vfs_context_t ctx = ap->a_context;
864 struct nfs_open_file *nofp, *nextnofp;
865 struct nfs_file_lock *nflp, *nextnflp;
866 struct nfs_lock_owner *nlop, *nextnlop;
b0d623f7 867 struct nfsmount *nmp = np->n_mount ? VFSTONFS(np->n_mount) : NFSTONMP(np);
6d2010ae
A
868 mount_t mp = vnode_mount(vp);
869 int force;
1c79356b 870
2d21ac55 871 FSDBG_TOP(265, vp, np, np->n_flag, 0);
fe8ab488 872 force = (!mp || vfs_isforce(mp) || nfs_mount_gone(nmp));
2d21ac55 873
b0d623f7
A
874 /* There shouldn't be any open or lock state at this point */
875 lck_mtx_lock(&np->n_openlock);
876
877 if (nmp && (nmp->nm_vers >= NFS_VER4)) {
878 /* need to drop a delegation */
6d2010ae
A
879 if (np->n_dreturn.tqe_next != NFSNOLIST) {
880 /* remove this node from the delegation return list */
881 lck_mtx_lock(&nmp->nm_lock);
882 if (np->n_dreturn.tqe_next != NFSNOLIST) {
883 TAILQ_REMOVE(&nmp->nm_dreturnq, np, n_dreturn);
884 np->n_dreturn.tqe_next = NFSNOLIST;
885 }
886 lck_mtx_unlock(&nmp->nm_lock);
887 }
b0d623f7 888 if (np->n_dlink.tqe_next != NFSNOLIST) {
6d2010ae 889 /* remove this node from the delegation list */
b0d623f7
A
890 lck_mtx_lock(&nmp->nm_lock);
891 if (np->n_dlink.tqe_next != NFSNOLIST) {
6d2010ae 892 TAILQ_REMOVE(&nmp->nm_delegations, np, n_dlink);
b0d623f7
A
893 np->n_dlink.tqe_next = NFSNOLIST;
894 }
895 lck_mtx_unlock(&nmp->nm_lock);
896 }
6d2010ae
A
897 if ((np->n_openflags & N_DELEG_MASK) && !force) {
898 /* try to return the delegation */
b0d623f7
A
899 np->n_openflags &= ~N_DELEG_MASK;
900 nfs4_delegreturn_rpc(nmp, np->n_fhp, np->n_fhsize, &np->n_dstateid,
6d2010ae
A
901 R_RECOVER, vfs_context_thread(ctx), vfs_context_ucred(ctx));
902 }
903 if (np->n_attrdirfh) {
904 FREE(np->n_attrdirfh, M_TEMP);
905 np->n_attrdirfh = NULL;
b0d623f7
A
906 }
907 }
908
909 /* clean up file locks */
910 TAILQ_FOREACH_SAFE(nflp, &np->n_locks, nfl_link, nextnflp) {
6d2010ae
A
911 if (!(nflp->nfl_flags & NFS_FILE_LOCK_DEAD) && !force) {
912 NP(np, "nfs_vnop_reclaim: lock 0x%llx 0x%llx 0x%x (bc %d)",
913 nflp->nfl_start, nflp->nfl_end, nflp->nfl_flags, nflp->nfl_blockcnt);
b0d623f7 914 }
6d2010ae
A
915 if (!(nflp->nfl_flags & (NFS_FILE_LOCK_BLOCKED|NFS_FILE_LOCK_DEAD))) {
916 /* try sending an unlock RPC if it wasn't delegated */
917 if (!(nflp->nfl_flags & NFS_FILE_LOCK_DELEGATED) && !force)
918 nmp->nm_funcs->nf_unlock_rpc(np, nflp->nfl_owner, F_WRLCK, nflp->nfl_start, nflp->nfl_end, R_RECOVER,
919 NULL, nflp->nfl_owner->nlo_open_owner->noo_cred);
b0d623f7
A
920 lck_mtx_lock(&nflp->nfl_owner->nlo_lock);
921 TAILQ_REMOVE(&nflp->nfl_owner->nlo_locks, nflp, nfl_lolink);
922 lck_mtx_unlock(&nflp->nfl_owner->nlo_lock);
923 }
924 TAILQ_REMOVE(&np->n_locks, nflp, nfl_link);
925 nfs_file_lock_destroy(nflp);
926 }
927 /* clean up lock owners */
928 TAILQ_FOREACH_SAFE(nlop, &np->n_lock_owners, nlo_link, nextnlop) {
6d2010ae
A
929 if (!TAILQ_EMPTY(&nlop->nlo_locks) && !force)
930 NP(np, "nfs_vnop_reclaim: lock owner with locks");
b0d623f7
A
931 TAILQ_REMOVE(&np->n_lock_owners, nlop, nlo_link);
932 nfs_lock_owner_destroy(nlop);
933 }
934 /* clean up open state */
6d2010ae
A
935 if (np->n_openrefcnt && !force)
936 NP(np, "nfs_vnop_reclaim: still open: %d", np->n_openrefcnt);
b0d623f7 937 TAILQ_FOREACH_SAFE(nofp, &np->n_opens, nof_link, nextnofp) {
6d2010ae
A
938 if (nofp->nof_flags & NFS_OPEN_FILE_BUSY)
939 NP(np, "nfs_vnop_reclaim: open file busy");
940 if (!(np->n_flag & NREVOKE) && !(nofp->nof_flags & NFS_OPEN_FILE_LOST)) {
941 if (nofp->nof_opencnt && !force)
942 NP(np, "nfs_vnop_reclaim: file still open: %d", nofp->nof_opencnt);
943 if (!force && (nofp->nof_access || nofp->nof_deny ||
944 nofp->nof_mmap_access || nofp->nof_mmap_deny ||
945 nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
946 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
947 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw ||
948 nofp->nof_d_r || nofp->nof_d_w || nofp->nof_d_rw ||
949 nofp->nof_d_r_dw || nofp->nof_d_w_dw || nofp->nof_d_rw_dw ||
950 nofp->nof_d_r_drw || nofp->nof_d_w_drw || nofp->nof_d_rw_drw)) {
951 NP(np, "nfs_vnop_reclaim: non-zero access: %d %d %d %d # %u.%u %u.%u %u.%u dw %u.%u %u.%u %u.%u drw %u.%u %u.%u %u.%u",
952 nofp->nof_access, nofp->nof_deny,
953 nofp->nof_mmap_access, nofp->nof_mmap_deny,
954 nofp->nof_r, nofp->nof_d_r,
955 nofp->nof_w, nofp->nof_d_w,
956 nofp->nof_rw, nofp->nof_d_rw,
957 nofp->nof_r_dw, nofp->nof_d_r_dw,
958 nofp->nof_w_dw, nofp->nof_d_w_dw,
959 nofp->nof_rw_dw, nofp->nof_d_rw_dw,
960 nofp->nof_r_drw, nofp->nof_d_r_drw,
961 nofp->nof_w_drw, nofp->nof_d_w_drw,
962 nofp->nof_rw_drw, nofp->nof_d_rw_drw);
963 /* try sending a close RPC if it wasn't delegated */
964 if (nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
965 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
966 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw)
967 nfs4_close_rpc(np, nofp, NULL, nofp->nof_owner->noo_cred, R_RECOVER);
968 }
b0d623f7
A
969 }
970 TAILQ_REMOVE(&np->n_opens, nofp, nof_link);
971 nfs_open_file_destroy(nofp);
972 }
973 lck_mtx_unlock(&np->n_openlock);
974
6d2010ae
A
975 if (np->n_monlink.le_next != NFSNOLIST) {
976 /* Wait for any in-progress getattr to complete, */
977 /* then remove this node from the monitored node list. */
978 lck_mtx_lock(&nmp->nm_lock);
979 while (np->n_mflag & NMMONSCANINPROG) {
980 struct timespec ts = { 1, 0 };
981 np->n_mflag |= NMMONSCANWANT;
982 msleep(&np->n_mflag, &nmp->nm_lock, PZERO-1, "nfswaitmonscan", &ts);
983 }
984 if (np->n_monlink.le_next != NFSNOLIST) {
985 LIST_REMOVE(np, n_monlink);
986 np->n_monlink.le_next = NFSNOLIST;
987 }
988 lck_mtx_unlock(&nmp->nm_lock);
b0d623f7 989 }
6d2010ae
A
990
991 lck_mtx_lock(nfs_buf_mutex);
992 if (!force && (!LIST_EMPTY(&np->n_dirtyblkhd) || !LIST_EMPTY(&np->n_cleanblkhd)))
993 NP(np, "nfs_reclaim: dropping %s buffers", (!LIST_EMPTY(&np->n_dirtyblkhd) ? "dirty" : "clean"));
b0d623f7 994 lck_mtx_unlock(nfs_buf_mutex);
b0d623f7
A
995 nfs_vinvalbuf(vp, V_IGNORE_WRITEERR, ap->a_context, 0);
996
2d21ac55
A
997 lck_mtx_lock(nfs_node_hash_mutex);
998
b0d623f7 999 if ((vnode_vtype(vp) != VDIR) && np->n_sillyrename) {
6d2010ae
A
1000 if (!force)
1001 NP(np, "nfs_reclaim: leaving unlinked file %s", np->n_sillyrename->nsr_name);
b0d623f7
A
1002 if (np->n_sillyrename->nsr_cred != NOCRED)
1003 kauth_cred_unref(&np->n_sillyrename->nsr_cred);
1004 vnode_rele(NFSTOV(np->n_sillyrename->nsr_dnp));
1005 FREE_ZONE(np->n_sillyrename, sizeof(*np->n_sillyrename), M_NFSREQ);
1006 }
2d21ac55 1007
91447636 1008 vnode_removefsref(vp);
1c79356b 1009
2d21ac55 1010 if (np->n_hflag & NHHASHED) {
55e303ae 1011 LIST_REMOVE(np, n_hash);
2d21ac55
A
1012 np->n_hflag &= ~NHHASHED;
1013 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
1c79356b 1014 }
2d21ac55 1015 lck_mtx_unlock(nfs_node_hash_mutex);
1c79356b
A
1016
1017 /*
b0d623f7
A
1018 * Free up any directory cookie structures and large file handle
1019 * structures that might be associated with this nfs node.
1c79356b 1020 */
b0d623f7
A
1021 nfs_node_lock_force(np);
1022 if ((vnode_vtype(vp) == VDIR) && np->n_cookiecache)
1023 FREE_ZONE(np->n_cookiecache, sizeof(struct nfsdmap), M_NFSDIROFF);
1024 if (np->n_fhsize > NFS_SMALLFH)
91447636 1025 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
6d2010ae
A
1026 if (np->n_vattr.nva_acl)
1027 kauth_acl_free(np->n_vattr.nva_acl);
b0d623f7 1028 nfs_node_unlock(np);
91447636 1029 vnode_clearfsnode(vp);
1c79356b 1030
2d21ac55
A
1031 if (np->n_parent) {
1032 if (!vnode_get(np->n_parent)) {
1033 vnode_rele(np->n_parent);
1034 vnode_put(np->n_parent);
1035 }
1036 np->n_parent = NULL;
1037 }
1038
b0d623f7
A
1039 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
1040 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
1041 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
2d21ac55
A
1042
1043 FSDBG_BOT(265, vp, np, np->n_flag, 0xd1ed1e);
91447636 1044 FREE_ZONE(np, sizeof(struct nfsnode), M_NFSNODE);
1c79356b
A
1045 return (0);
1046}
1047
2d21ac55
A
1048/*
1049 * Acquire an NFS node lock
1050 */
b0d623f7 1051
2d21ac55 1052int
b0d623f7 1053nfs_node_lock_internal(nfsnode_t np, int force)
2d21ac55 1054{
b0d623f7
A
1055 FSDBG_TOP(268, np, force, 0, 0);
1056 lck_mtx_lock(&np->n_lock);
1057 if (!force && !(np->n_hflag && NHHASHED)) {
1058 FSDBG_BOT(268, np, 0xdead, 0, 0);
1059 lck_mtx_unlock(&np->n_lock);
2d21ac55
A
1060 return (ENOENT);
1061 }
b0d623f7 1062 FSDBG_BOT(268, np, force, 0, 0);
2d21ac55
A
1063 return (0);
1064}
1065
b0d623f7
A
1066int
1067nfs_node_lock(nfsnode_t np)
1068{
1069 return nfs_node_lock_internal(np, 0);
1070}
1071
1072void
1073nfs_node_lock_force(nfsnode_t np)
1074{
1075 nfs_node_lock_internal(np, 1);
1076}
1077
2d21ac55
A
1078/*
1079 * Release an NFS node lock
1080 */
1081void
b0d623f7 1082nfs_node_unlock(nfsnode_t np)
2d21ac55 1083{
b0d623f7
A
1084 FSDBG(269, np, current_thread(), 0, 0);
1085 lck_mtx_unlock(&np->n_lock);
2d21ac55
A
1086}
1087
1088/*
1089 * Acquire 2 NFS node locks
b0d623f7 1090 * - locks taken in reverse address order
2d21ac55
A
1091 * - both or neither of the locks are taken
1092 * - only one lock taken per node (dup nodes are skipped)
1093 */
1094int
b0d623f7 1095nfs_node_lock2(nfsnode_t np1, nfsnode_t np2)
2d21ac55 1096{
b0d623f7 1097 nfsnode_t first, second;
2d21ac55
A
1098 int error;
1099
b0d623f7
A
1100 first = (np1 > np2) ? np1 : np2;
1101 second = (np1 > np2) ? np2 : np1;
1102 if ((error = nfs_node_lock(first)))
2d21ac55
A
1103 return (error);
1104 if (np1 == np2)
1105 return (error);
b0d623f7
A
1106 if ((error = nfs_node_lock(second)))
1107 nfs_node_unlock(first);
2d21ac55
A
1108 return (error);
1109}
1110
2d21ac55 1111void
b0d623f7 1112nfs_node_unlock2(nfsnode_t np1, nfsnode_t np2)
2d21ac55 1113{
b0d623f7 1114 nfs_node_unlock(np1);
2d21ac55 1115 if (np1 != np2)
b0d623f7 1116 nfs_node_unlock(np2);
2d21ac55
A
1117}
1118
1119/*
b0d623f7
A
1120 * Manage NFS node busy state.
1121 * (Similar to NFS node locks above)
2d21ac55
A
1122 */
1123int
b0d623f7 1124nfs_node_set_busy(nfsnode_t np, thread_t thd)
2d21ac55 1125{
b0d623f7
A
1126 struct timespec ts = { 2, 0 };
1127 int error;
1128
1129 if ((error = nfs_node_lock(np)))
1130 return (error);
1131 while (ISSET(np->n_flag, NBUSY)) {
1132 SET(np->n_flag, NBUSYWANT);
1133 msleep(np, &np->n_lock, PZERO-1, "nfsbusywant", &ts);
1134 if ((error = nfs_sigintr(NFSTONMP(np), NULL, thd, 0)))
1135 break;
2d21ac55 1136 }
b0d623f7
A
1137 if (!error)
1138 SET(np->n_flag, NBUSY);
1139 nfs_node_unlock(np);
1140 return (error);
1141}
2d21ac55 1142
b0d623f7
A
1143void
1144nfs_node_clear_busy(nfsnode_t np)
1145{
1146 int wanted;
1147
1148 nfs_node_lock_force(np);
1149 wanted = ISSET(np->n_flag, NBUSYWANT);
1150 CLR(np->n_flag, NBUSY|NBUSYWANT);
1151 nfs_node_unlock(np);
1152 if (wanted)
1153 wakeup(np);
1154}
1155
1156int
1157nfs_node_set_busy2(nfsnode_t np1, nfsnode_t np2, thread_t thd)
1158{
1159 nfsnode_t first, second;
1160 int error;
1161
1162 first = (np1 > np2) ? np1 : np2;
1163 second = (np1 > np2) ? np2 : np1;
1164 if ((error = nfs_node_set_busy(first, thd)))
1165 return (error);
1166 if (np1 == np2)
1167 return (error);
1168 if ((error = nfs_node_set_busy(second, thd)))
1169 nfs_node_clear_busy(first);
1170 return (error);
1171}
1172
1173void
1174nfs_node_clear_busy2(nfsnode_t np1, nfsnode_t np2)
1175{
1176 nfs_node_clear_busy(np1);
1177 if (np1 != np2)
1178 nfs_node_clear_busy(np2);
1179}
1180
1181/* helper function to sort four nodes in reverse address order (no dupes) */
1182static void
1183nfs_node_sort4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4, nfsnode_t *list, int *lcntp)
1184{
1185 nfsnode_t na[2], nb[2];
1186 int a, b, i, lcnt;
1187
1188 /* sort pairs then merge */
1189 na[0] = (np1 > np2) ? np1 : np2;
1190 na[1] = (np1 > np2) ? np2 : np1;
1191 nb[0] = (np3 > np4) ? np3 : np4;
1192 nb[1] = (np3 > np4) ? np4 : np3;
1193 for (a = b = i = lcnt = 0; i < 4; i++) {
1194 if (a >= 2)
1195 list[lcnt] = nb[b++];
1196 else if ((b >= 2) || (na[a] >= nb[b]))
1197 list[lcnt] = na[a++];
1198 else
1199 list[lcnt] = nb[b++];
1200 if ((lcnt <= 0) || (list[lcnt] != list[lcnt-1]))
1201 lcnt++; /* omit dups */
2d21ac55 1202 }
b0d623f7
A
1203 if (list[lcnt-1] == NULL)
1204 lcnt--;
1205 *lcntp = lcnt;
1206}
1207
1208int
1209nfs_node_set_busy4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4, thread_t thd)
1210{
1211 nfsnode_t list[4];
1212 int i, lcnt, error;
1213
1214 nfs_node_sort4(np1, np2, np3, np4, list, &lcnt);
2d21ac55
A
1215
1216 /* Now we can lock using list[0 - lcnt-1] */
b0d623f7
A
1217 for (i = 0; i < lcnt; ++i)
1218 if ((error = nfs_node_set_busy(list[i], thd))) {
1219 /* Drop any locks we acquired. */
1220 while (--i >= 0)
1221 nfs_node_clear_busy(list[i]);
1222 return (error);
1223 }
2d21ac55
A
1224 return (0);
1225}
1226
2d21ac55 1227void
b0d623f7 1228nfs_node_clear_busy4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4)
2d21ac55
A
1229{
1230 nfsnode_t list[4];
b0d623f7
A
1231 int lcnt;
1232
1233 nfs_node_sort4(np1, np2, np3, np4, list, &lcnt);
1234 while (--lcnt >= 0)
1235 nfs_node_clear_busy(list[lcnt]);
2d21ac55
A
1236}
1237
1238/*
1239 * Acquire an NFS node data lock
1240 */
1241void
1242nfs_data_lock(nfsnode_t np, int locktype)
1243{
b0d623f7
A
1244 nfs_data_lock_internal(np, locktype, 1);
1245}
1246void
1247nfs_data_lock_noupdate(nfsnode_t np, int locktype)
1248{
1249 nfs_data_lock_internal(np, locktype, 0);
2d21ac55
A
1250}
1251void
b0d623f7 1252nfs_data_lock_internal(nfsnode_t np, int locktype, int updatesize)
2d21ac55
A
1253{
1254 FSDBG_TOP(270, np, locktype, np->n_datalockowner, 0);
b0d623f7 1255 if (locktype == NFS_DATA_LOCK_SHARED) {
2d21ac55
A
1256 if (updatesize && ISSET(np->n_flag, NUPDATESIZE))
1257 nfs_data_update_size(np, 0);
1258 lck_rw_lock_shared(&np->n_datalock);
1259 } else {
1260 lck_rw_lock_exclusive(&np->n_datalock);
1261 np->n_datalockowner = current_thread();
1262 if (updatesize && ISSET(np->n_flag, NUPDATESIZE))
1263 nfs_data_update_size(np, 1);
1264 }
1265 FSDBG_BOT(270, np, locktype, np->n_datalockowner, 0);
1266}
1267
1268/*
1269 * Release an NFS node data lock
1270 */
1271void
1272nfs_data_unlock(nfsnode_t np)
1273{
b0d623f7
A
1274 nfs_data_unlock_internal(np, 1);
1275}
1276void
1277nfs_data_unlock_noupdate(nfsnode_t np)
1278{
1279 nfs_data_unlock_internal(np, 0);
2d21ac55
A
1280}
1281void
b0d623f7 1282nfs_data_unlock_internal(nfsnode_t np, int updatesize)
2d21ac55
A
1283{
1284 int mine = (np->n_datalockowner == current_thread());
1285 FSDBG_TOP(271, np, np->n_datalockowner, current_thread(), 0);
1286 if (updatesize && mine && ISSET(np->n_flag, NUPDATESIZE))
1287 nfs_data_update_size(np, 1);
1288 np->n_datalockowner = NULL;
1289 lck_rw_done(&np->n_datalock);
1290 if (updatesize && !mine && ISSET(np->n_flag, NUPDATESIZE))
1291 nfs_data_update_size(np, 0);
1292 FSDBG_BOT(271, np, np->n_datalockowner, current_thread(), 0);
1293}
1294
1295
1296/*
1297 * update an NFS node's size
1298 */
1299void
1300nfs_data_update_size(nfsnode_t np, int datalocked)
1301{
1302 int error;
1303
1304 FSDBG_TOP(272, np, np->n_flag, np->n_size, np->n_newsize);
1305 if (!datalocked) {
b0d623f7 1306 nfs_data_lock(np, NFS_DATA_LOCK_EXCLUSIVE);
2d21ac55
A
1307 /* grabbing data lock will automatically update size */
1308 nfs_data_unlock(np);
1309 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1310 return;
1311 }
b0d623f7 1312 error = nfs_node_lock(np);
2d21ac55
A
1313 if (error || !ISSET(np->n_flag, NUPDATESIZE)) {
1314 if (!error)
b0d623f7 1315 nfs_node_unlock(np);
2d21ac55
A
1316 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1317 return;
1318 }
1319 CLR(np->n_flag, NUPDATESIZE);
1320 np->n_size = np->n_newsize;
1321 /* make sure we invalidate buffers the next chance we get */
1322 SET(np->n_flag, NNEEDINVALIDATE);
b0d623f7 1323 nfs_node_unlock(np);
2d21ac55
A
1324 ubc_setsize(NFSTOV(np), (off_t)np->n_size); /* XXX error? */
1325 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1326}
1327
316670eb 1328#define DODEBUG 1
39236c6e 1329
316670eb
A
1330int
1331nfs_mount_is_dirty(mount_t mp)
1332{
1333 u_long i;
1334 nfsnode_t np;
1335#ifdef DODEBUG
1336 struct timeval now, then, diff;
1337 u_long ncnt = 0;
1338 microuptime(&now);
1339#endif
1340 lck_mtx_lock(nfs_node_hash_mutex);
1341 for (i = 0; i <= nfsnodehash; i++) {
1342 LIST_FOREACH(np, &nfsnodehashtbl[i], n_hash) {
1343#ifdef DODEBUG
1344 ncnt++;
1345#endif
1346 if (np->n_mount == mp && !LIST_EMPTY(&np->n_dirtyblkhd))
1347 goto out;
1348 }
1349 }
1350out:
1351 lck_mtx_unlock(nfs_node_hash_mutex);
1352#ifdef DODEBUG
1353 microuptime(&then);
1354 timersub(&then, &now, &diff);
1355
39236c6e
A
1356 NFS_DBG(NFS_FAC_SOCK, 7, "mount_is_dirty for %s took %lld mics for %ld slots and %ld nodes return %d\n",
1357 vfs_statfs(mp)->f_mntfromname, (uint64_t)diff.tv_sec * 1000000LL + diff.tv_usec, i, ncnt, (i <= nfsnodehash));
316670eb
A
1358#endif
1359
1360 return (i <= nfsnodehash);
1361}