]> git.saurik.com Git - apple/xnu.git/blob - bsd/nfs/nfs_node.c
90400cfa5a47f3ccbac7db46edfb33881fd9b4cf
[apple/xnu.git] / bsd / nfs / nfs_node.c
1 /*
2 * Copyright (c) 2000-2019 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29 /*
30 * Copyright (c) 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 *
33 * This code is derived from software contributed to Berkeley by
34 * Rick Macklem at The University of Guelph.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
51 *
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
63 *
64 * @(#)nfs_node.c 8.6 (Berkeley) 5/22/95
65 * FreeBSD-Id: nfs_node.c,v 1.22 1997/10/28 14:06:20 bde Exp $
66 */
67
68
69 #include <sys/param.h>
70 #include <sys/kernel.h>
71 #include <sys/systm.h>
72 #include <sys/proc.h>
73 #include <sys/kauth.h>
74 #include <sys/mount_internal.h>
75 #include <sys/vnode_internal.h>
76 #include <sys/vnode.h>
77 #include <sys/ubc.h>
78 #include <sys/malloc.h>
79 #include <sys/fcntl.h>
80 #include <sys/time.h>
81
82 #include <nfs/rpcv2.h>
83 #include <nfs/nfsproto.h>
84 #include <nfs/nfs.h>
85 #include <nfs/nfsnode.h>
86 #include <nfs/nfs_gss.h>
87 #include <nfs/nfsmount.h>
88
89 #define NFSNOHASH(fhsum) \
90 (&nfsnodehashtbl[(fhsum) & nfsnodehash])
91 static LIST_HEAD(nfsnodehashhead, nfsnode) * nfsnodehashtbl;
92 static u_long nfsnodehash;
93
94 static lck_grp_t *nfs_node_hash_lck_grp;
95 static lck_grp_t *nfs_node_lck_grp;
96 static lck_grp_t *nfs_data_lck_grp;
97 lck_mtx_t *nfs_node_hash_mutex;
98
99 #define NFS_NODE_DBG(...) NFS_DBG(NFS_FAC_NODE, 7, ## __VA_ARGS__)
100
101 /*
102 * Initialize hash links for nfsnodes
103 * and build nfsnode free list.
104 */
105 void
106 nfs_nhinit(void)
107 {
108 nfs_node_hash_lck_grp = lck_grp_alloc_init("nfs_node_hash", LCK_GRP_ATTR_NULL);
109 nfs_node_hash_mutex = lck_mtx_alloc_init(nfs_node_hash_lck_grp, LCK_ATTR_NULL);
110 nfs_node_lck_grp = lck_grp_alloc_init("nfs_node", LCK_GRP_ATTR_NULL);
111 nfs_data_lck_grp = lck_grp_alloc_init("nfs_data", LCK_GRP_ATTR_NULL);
112 }
113
114 void
115 nfs_nhinit_finish(void)
116 {
117 lck_mtx_lock(nfs_node_hash_mutex);
118 if (!nfsnodehashtbl) {
119 nfsnodehashtbl = hashinit(desiredvnodes, M_NFSNODE, &nfsnodehash);
120 }
121 lck_mtx_unlock(nfs_node_hash_mutex);
122 }
123
/*
 * Compute the hash value for a file handle: the plain sum of its
 * bytes.  The caller reduces the sum to a bucket (see NFSNOHASH).
 * A non-positive fhsize yields 0.
 */
u_long
nfs_hash(u_char *fhp, int fhsize)
{
	u_long total = 0;
	int idx = 0;

	while (idx < fhsize) {
		total += fhp[idx];
		idx++;
	}
	return total;
}
139
140
141 int nfs_case_insensitive(mount_t);
142
143 int
144 nfs_case_insensitive(mount_t mp)
145 {
146 struct nfsmount *nmp = VFSTONFS(mp);
147 int answer = 0;
148 int skip = 0;
149
150 if (nfs_mount_gone(nmp)) {
151 return 0;
152 }
153
154 if (nmp->nm_vers == NFS_VER2) {
155 /* V2 has no way to know */
156 return 0;
157 }
158
159 lck_mtx_lock(&nmp->nm_lock);
160 if (nmp->nm_vers == NFS_VER3) {
161 if (!(nmp->nm_state & NFSSTA_GOTPATHCONF)) {
162 /* We're holding the node lock so we just return
163 * with answer as case sensitive. Is very rare
164 * for file systems not to be homogenous w.r.t. pathconf
165 */
166 skip = 1;
167 }
168 } else if (!(nmp->nm_fsattr.nfsa_flags & NFS_FSFLAG_HOMOGENEOUS)) {
169 /* no pathconf info cached */
170 skip = 1;
171 }
172
173 if (!skip && (nmp->nm_fsattr.nfsa_flags & NFS_FSFLAG_CASE_INSENSITIVE)) {
174 answer = 1;
175 }
176
177 lck_mtx_unlock(&nmp->nm_lock);
178
179 return answer;
180 }
181
182
183 /*
184 * Look up a vnode/nfsnode by file handle.
185 * Callers must check for mount points!!
186 * In all cases, a pointer to a
187 * nfsnode structure is returned.
188 */
189 int
190 nfs_nget(
191 mount_t mp,
192 nfsnode_t dnp,
193 struct componentname *cnp,
194 u_char *fhp,
195 int fhsize,
196 struct nfs_vattr *nvap,
197 u_int64_t *xidp,
198 uint32_t auth,
199 int flags,
200 nfsnode_t *npp)
201 {
202 nfsnode_t np;
203 struct nfsnodehashhead *nhpp;
204 vnode_t vp;
205 int error, nfsvers;
206 mount_t mp2;
207 struct vnode_fsparam vfsp;
208 uint32_t vid;
209
210 FSDBG_TOP(263, mp, dnp, flags, npp);
211
212 /* Check for unmount in progress */
213 if (!mp || vfs_isforce(mp)) {
214 *npp = NULL;
215 error = ENXIO;
216 FSDBG_BOT(263, mp, dnp, 0xd1e, error);
217 return error;
218 }
219 nfsvers = VFSTONFS(mp)->nm_vers;
220
221 nhpp = NFSNOHASH(nfs_hash(fhp, fhsize));
222 loop:
223 lck_mtx_lock(nfs_node_hash_mutex);
224 for (np = nhpp->lh_first; np != 0; np = np->n_hash.le_next) {
225 mp2 = (np->n_hflag & NHINIT) ? np->n_mount : NFSTOMP(np);
226 if (mp != mp2 || np->n_fhsize != fhsize ||
227 bcmp(fhp, np->n_fhp, fhsize)) {
228 continue;
229 }
230 if (nvap && (nvap->nva_flags & NFS_FFLAG_TRIGGER_REFERRAL) &&
231 cnp && (cnp->cn_namelen > (fhsize - (int)sizeof(dnp)))) {
232 /* The name was too long to fit in the file handle. Check it against the node's name. */
233 int namecmp = 0;
234 const char *vname = vnode_getname(NFSTOV(np));
235 if (vname) {
236 if (cnp->cn_namelen != (int)strlen(vname)) {
237 namecmp = 1;
238 } else {
239 namecmp = strncmp(vname, cnp->cn_nameptr, cnp->cn_namelen);
240 }
241 vnode_putname(vname);
242 }
243 if (namecmp) { /* full name didn't match */
244 continue;
245 }
246 }
247 FSDBG(263, dnp, np, np->n_flag, 0xcace0000);
248 /* if the node is locked, sleep on it */
249 if ((np->n_hflag & NHLOCKED) && !(flags & NG_NOCREATE)) {
250 np->n_hflag |= NHLOCKWANT;
251 FSDBG(263, dnp, np, np->n_flag, 0xcace2222);
252 msleep(np, nfs_node_hash_mutex, PDROP | PINOD, "nfs_nget", NULL);
253 FSDBG(263, dnp, np, np->n_flag, 0xcace3333);
254 goto loop;
255 }
256 vp = NFSTOV(np);
257 vid = vnode_vid(vp);
258 lck_mtx_unlock(nfs_node_hash_mutex);
259 if ((error = vnode_getwithvid(vp, vid))) {
260 /*
261 * If vnode is being reclaimed or has already
262 * changed identity, no need to wait.
263 */
264 FSDBG_BOT(263, dnp, *npp, 0xcace0d1e, error);
265 return error;
266 }
267 if ((error = nfs_node_lock(np))) {
268 /* this only fails if the node is now unhashed */
269 /* so let's see if we can find/create it again */
270 FSDBG(263, dnp, *npp, 0xcaced1e2, error);
271 vnode_put(vp);
272 if (flags & NG_NOCREATE) {
273 *npp = 0;
274 FSDBG_BOT(263, dnp, *npp, 0xcaced1e0, ENOENT);
275 return ENOENT;
276 }
277 goto loop;
278 }
279 /* update attributes */
280 if (nvap) {
281 error = nfs_loadattrcache(np, nvap, xidp, 0);
282 }
283 if (error) {
284 nfs_node_unlock(np);
285 vnode_put(vp);
286 } else {
287 if (dnp && cnp && (flags & NG_MAKEENTRY)) {
288 cache_enter(NFSTOV(dnp), vp, cnp);
289 }
290 /*
291 * Update the vnode if the name/and or the parent has
292 * changed. We need to do this so that if getattrlist is
293 * called asking for ATTR_CMN_NAME, that the "most"
294 * correct name is being returned. In addition for
295 * monitored vnodes we need to kick the vnode out of the
296 * name cache. We do this so that if there are hard
297 * links in the same directory the link will not be
298 * found and a lookup will get us here to return the
299 * name of the current link. In addition by removing the
300 * name from the name cache the old name will not be
301 * found after a rename done on another client or the
302 * server. The principle reason to do this is because
303 * Finder is asking for notifications on a directory.
304 * The directory changes, Finder gets notified, reads
305 * the directory (which we have purged) and for each
306 * entry returned calls getattrlist with the name
307 * returned from readdir. gettattrlist has to call
308 * namei/lookup to resolve the name, because its not in
309 * the cache we end up here. We need to update the name
310 * so Finder will get the name it called us with.
311 *
312 * We had an imperfect solution with respect to case
313 * sensitivity. There is a test that is run in
314 * FileBuster that does renames from some name to
315 * another name differing only in case. It then reads
316 * the directory looking for the new name, after it
317 * finds that new name, it ask gettattrlist to verify
318 * that the name is the new name. Usually that works,
319 * but renames generate fsevents and fseventsd will do a
320 * lookup on the name via lstat. Since that test renames
321 * old name to new name back and forth there is a race
322 * that an fsevent will be behind and will access the
323 * file by the old name, on a case insensitive file
324 * system that will work. Problem is if we do a case
325 * sensitive compare, we're going to change the name,
326 * which the test's getattrlist verification step is
327 * going to fail. So we will check the case sensitivity
328 * of the file system and do the appropriate compare. In
329 * a rare instance for non homogeneous file systems
330 * w.r.t. pathconf we will use case sensitive compares.
331 * That could break if the file system is actually case
332 * insensitive.
333 *
334 * Note that V2 does not know the case, so we just
335 * assume case sensitivity.
336 *
337 * This is clearly not perfect due to races, but this is
338 * as good as its going to get. You can defeat the
339 * handling of hard links simply by doing:
340 *
341 * while :; do ls -l > /dev/null; done
342 *
343 * in a terminal window. Even a single ls -l can cause a
344 * race.
345 *
346 * <rant>What we really need is for the caller, that
347 * knows the name being used is valid since it got it
348 * from a readdir to use that name and not ask for the
349 * ATTR_CMN_NAME</rant>
350 */
351 if (dnp && cnp && (vp != NFSTOV(dnp))) {
352 int update_flags = (vnode_ismonitored((NFSTOV(dnp)))) ? VNODE_UPDATE_CACHE : 0;
353 int (*cmp)(const char *s1, const char *s2, size_t n);
354
355 cmp = nfs_case_insensitive(mp) ? strncasecmp : strncmp;
356
357 if (vp->v_name && (size_t)cnp->cn_namelen != strnlen(vp->v_name, MAXPATHLEN)) {
358 update_flags |= VNODE_UPDATE_NAME;
359 }
360 if (vp->v_name && cnp->cn_namelen && (*cmp)(cnp->cn_nameptr, vp->v_name, cnp->cn_namelen)) {
361 update_flags |= VNODE_UPDATE_NAME;
362 }
363 if ((vp->v_name == NULL && cnp->cn_namelen != 0) || (vp->v_name != NULL && cnp->cn_namelen == 0)) {
364 update_flags |= VNODE_UPDATE_NAME;
365 }
366 if (vnode_parent(vp) != NFSTOV(dnp)) {
367 update_flags |= VNODE_UPDATE_PARENT;
368 }
369 if (update_flags) {
370 NFS_NODE_DBG("vnode_update_identity old name %s new name %.*s update flags = %x\n",
371 vp->v_name, cnp->cn_namelen, cnp->cn_nameptr ? cnp->cn_nameptr : "", update_flags);
372 vnode_update_identity(vp, NFSTOV(dnp), cnp->cn_nameptr, cnp->cn_namelen, 0, update_flags);
373 }
374 }
375
376 *npp = np;
377 }
378 FSDBG_BOT(263, dnp, *npp, 0xcace0000, error);
379 return error;
380 }
381
382 FSDBG(263, mp, dnp, npp, 0xaaaaaaaa);
383
384 if (flags & NG_NOCREATE) {
385 lck_mtx_unlock(nfs_node_hash_mutex);
386 *npp = 0;
387 FSDBG_BOT(263, dnp, *npp, 0x80000001, ENOENT);
388 return ENOENT;
389 }
390
391 /*
392 * allocate and initialize nfsnode and stick it in the hash
393 * before calling getnewvnode(). Anyone finding it in the
394 * hash before initialization is complete will wait for it.
395 */
396 MALLOC_ZONE(np, nfsnode_t, sizeof *np, M_NFSNODE, M_WAITOK);
397 if (!np) {
398 lck_mtx_unlock(nfs_node_hash_mutex);
399 *npp = 0;
400 FSDBG_BOT(263, dnp, *npp, 0x80000001, ENOMEM);
401 return ENOMEM;
402 }
403 bzero(np, sizeof *np);
404 np->n_hflag |= (NHINIT | NHLOCKED);
405 np->n_mount = mp;
406 np->n_auth = auth;
407 TAILQ_INIT(&np->n_opens);
408 TAILQ_INIT(&np->n_lock_owners);
409 TAILQ_INIT(&np->n_locks);
410 np->n_dlink.tqe_next = NFSNOLIST;
411 np->n_dreturn.tqe_next = NFSNOLIST;
412 np->n_monlink.le_next = NFSNOLIST;
413
414 /* ugh... need to keep track of ".zfs" directories to workaround server bugs */
415 if ((nvap->nva_type == VDIR) && cnp && (cnp->cn_namelen == 4) &&
416 (cnp->cn_nameptr[0] == '.') && (cnp->cn_nameptr[1] == 'z') &&
417 (cnp->cn_nameptr[2] == 'f') && (cnp->cn_nameptr[3] == 's')) {
418 np->n_flag |= NISDOTZFS;
419 }
420 if (dnp && (dnp->n_flag & NISDOTZFS)) {
421 np->n_flag |= NISDOTZFSCHILD;
422 }
423
424 if (dnp && cnp && ((cnp->cn_namelen != 2) ||
425 (cnp->cn_nameptr[0] != '.') || (cnp->cn_nameptr[1] != '.'))) {
426 vnode_t dvp = NFSTOV(dnp);
427 if (!vnode_get(dvp)) {
428 if (!vnode_ref(dvp)) {
429 np->n_parent = dvp;
430 }
431 vnode_put(dvp);
432 }
433 }
434
435 /* setup node's file handle */
436 if (fhsize > NFS_SMALLFH) {
437 MALLOC_ZONE(np->n_fhp, u_char *,
438 fhsize, M_NFSBIGFH, M_WAITOK);
439 if (!np->n_fhp) {
440 lck_mtx_unlock(nfs_node_hash_mutex);
441 FREE_ZONE(np, sizeof *np, M_NFSNODE);
442 *npp = 0;
443 FSDBG_BOT(263, dnp, *npp, 0x80000002, ENOMEM);
444 return ENOMEM;
445 }
446 } else {
447 np->n_fhp = &np->n_fh[0];
448 }
449 bcopy(fhp, np->n_fhp, fhsize);
450 np->n_fhsize = fhsize;
451
452 /* Insert the nfsnode in the hash queue for its new file handle */
453 LIST_INSERT_HEAD(nhpp, np, n_hash);
454 np->n_hflag |= NHHASHED;
455 FSDBG(266, 0, np, np->n_flag, np->n_hflag);
456
457 /* lock the new nfsnode */
458 lck_mtx_init(&np->n_lock, nfs_node_lck_grp, LCK_ATTR_NULL);
459 lck_rw_init(&np->n_datalock, nfs_data_lck_grp, LCK_ATTR_NULL);
460 lck_mtx_init(&np->n_openlock, nfs_open_grp, LCK_ATTR_NULL);
461 lck_mtx_lock(&np->n_lock);
462
463 /* release lock on hash table */
464 lck_mtx_unlock(nfs_node_hash_mutex);
465
466 /* do initial loading of attributes */
467 NACLINVALIDATE(np);
468 NACCESSINVALIDATE(np);
469 error = nfs_loadattrcache(np, nvap, xidp, 1);
470 if (error) {
471 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
472 nfs_node_unlock(np);
473 lck_mtx_lock(nfs_node_hash_mutex);
474 LIST_REMOVE(np, n_hash);
475 np->n_hflag &= ~(NHHASHED | NHINIT | NHLOCKED);
476 if (np->n_hflag & NHLOCKWANT) {
477 np->n_hflag &= ~NHLOCKWANT;
478 wakeup(np);
479 }
480 lck_mtx_unlock(nfs_node_hash_mutex);
481 if (np->n_parent) {
482 if (!vnode_get(np->n_parent)) {
483 vnode_rele(np->n_parent);
484 vnode_put(np->n_parent);
485 }
486 np->n_parent = NULL;
487 }
488 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
489 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
490 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
491 if (np->n_fhsize > NFS_SMALLFH) {
492 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
493 }
494 FREE_ZONE(np, sizeof *np, M_NFSNODE);
495 *npp = 0;
496 FSDBG_BOT(263, dnp, *npp, 0x80000003, error);
497 return error;
498 }
499 NFS_CHANGED_UPDATE(nfsvers, np, nvap);
500 if (nvap->nva_type == VDIR) {
501 NFS_CHANGED_UPDATE_NC(nfsvers, np, nvap);
502 }
503
504 /* now, attempt to get a new vnode */
505 vfsp.vnfs_mp = mp;
506 vfsp.vnfs_vtype = nvap->nva_type;
507 vfsp.vnfs_str = "nfs";
508 vfsp.vnfs_dvp = dnp ? NFSTOV(dnp) : NULL;
509 vfsp.vnfs_fsnode = np;
510 #if CONFIG_NFS4
511 if (nfsvers == NFS_VER4) {
512 #if FIFO
513 if (nvap->nva_type == VFIFO) {
514 vfsp.vnfs_vops = fifo_nfsv4nodeop_p;
515 } else
516 #endif /* FIFO */
517 if (nvap->nva_type == VBLK || nvap->nva_type == VCHR) {
518 vfsp.vnfs_vops = spec_nfsv4nodeop_p;
519 } else {
520 vfsp.vnfs_vops = nfsv4_vnodeop_p;
521 }
522 } else
523 #endif /* CONFIG_NFS4 */
524 {
525 #if FIFO
526 if (nvap->nva_type == VFIFO) {
527 vfsp.vnfs_vops = fifo_nfsv2nodeop_p;
528 } else
529 #endif /* FIFO */
530 if (nvap->nva_type == VBLK || nvap->nva_type == VCHR) {
531 vfsp.vnfs_vops = spec_nfsv2nodeop_p;
532 } else {
533 vfsp.vnfs_vops = nfsv2_vnodeop_p;
534 }
535 }
536 vfsp.vnfs_markroot = (flags & NG_MARKROOT) ? 1 : 0;
537 vfsp.vnfs_marksystem = 0;
538 vfsp.vnfs_rdev = 0;
539 vfsp.vnfs_filesize = nvap->nva_size;
540 vfsp.vnfs_cnp = cnp;
541 vfsp.vnfs_flags = VNFS_ADDFSREF;
542 if (!dnp || !cnp || !(flags & NG_MAKEENTRY)) {
543 vfsp.vnfs_flags |= VNFS_NOCACHE;
544 }
545
546 #if CONFIG_TRIGGERS
547 if (((nfsvers >= NFS_VER4)
548 )
549 && (nvap->nva_type == VDIR) && (np->n_vattr.nva_flags & NFS_FFLAG_TRIGGER)
550 && !(flags & NG_MARKROOT)) {
551 struct vnode_trigger_param vtp;
552 bzero(&vtp, sizeof(vtp));
553 bcopy(&vfsp, &vtp.vnt_params, sizeof(vfsp));
554 vtp.vnt_resolve_func = nfs_mirror_mount_trigger_resolve;
555 vtp.vnt_unresolve_func = nfs_mirror_mount_trigger_unresolve;
556 vtp.vnt_rearm_func = nfs_mirror_mount_trigger_rearm;
557 vtp.vnt_flags = VNT_AUTO_REARM | VNT_KERN_RESOLVE;
558 error = vnode_create(VNCREATE_TRIGGER, VNCREATE_TRIGGER_SIZE, &vtp, &np->n_vnode);
559 } else
560 #endif
561 {
562 error = vnode_create(VNCREATE_FLAVOR, VCREATESIZE, &vfsp, &np->n_vnode);
563 }
564 if (error) {
565 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
566 nfs_node_unlock(np);
567 lck_mtx_lock(nfs_node_hash_mutex);
568 LIST_REMOVE(np, n_hash);
569 np->n_hflag &= ~(NHHASHED | NHINIT | NHLOCKED);
570 if (np->n_hflag & NHLOCKWANT) {
571 np->n_hflag &= ~NHLOCKWANT;
572 wakeup(np);
573 }
574 lck_mtx_unlock(nfs_node_hash_mutex);
575 if (np->n_parent) {
576 if (!vnode_get(np->n_parent)) {
577 vnode_rele(np->n_parent);
578 vnode_put(np->n_parent);
579 }
580 np->n_parent = NULL;
581 }
582 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
583 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
584 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
585 if (np->n_fhsize > NFS_SMALLFH) {
586 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
587 }
588 FREE_ZONE(np, sizeof *np, M_NFSNODE);
589 *npp = 0;
590 FSDBG_BOT(263, dnp, *npp, 0x80000004, error);
591 return error;
592 }
593 vp = np->n_vnode;
594 vnode_settag(vp, VT_NFS);
595 /* node is now initialized */
596
597 /* check if anyone's waiting on this node */
598 lck_mtx_lock(nfs_node_hash_mutex);
599 np->n_hflag &= ~(NHINIT | NHLOCKED);
600 if (np->n_hflag & NHLOCKWANT) {
601 np->n_hflag &= ~NHLOCKWANT;
602 wakeup(np);
603 }
604 lck_mtx_unlock(nfs_node_hash_mutex);
605
606 *npp = np;
607
608 FSDBG_BOT(263, dnp, vp, *npp, error);
609 return error;
610 }
611
612
613 int
614 nfs_vnop_inactive(
615 struct vnop_inactive_args /* {
616 * struct vnodeop_desc *a_desc;
617 * vnode_t a_vp;
618 * vfs_context_t a_context;
619 * } */*ap)
620 {
621 vnode_t vp = ap->a_vp;
622 vfs_context_t ctx = ap->a_context;
623 nfsnode_t np;
624 struct nfs_sillyrename *nsp;
625 struct nfs_vattr nvattr;
626 int unhash, attrerr, busyerror, error, inuse, busied, force;
627 struct nfs_open_file *nofp;
628 struct componentname cn;
629 struct nfsmount *nmp;
630 mount_t mp;
631
632 if (vp == NULL) {
633 panic("nfs_vnop_inactive: vp == NULL");
634 }
635 np = VTONFS(vp);
636 if (np == NULL) {
637 panic("nfs_vnop_inactive: np == NULL");
638 }
639
640 nmp = NFSTONMP(np);
641 mp = vnode_mount(vp);
642
643 restart:
644 force = (!mp || vfs_isforce(mp));
645 error = 0;
646 inuse = (nfs_mount_state_in_use_start(nmp, NULL) == 0);
647
648 /* There shouldn't be any open or lock state at this point */
649 lck_mtx_lock(&np->n_openlock);
650 if (np->n_openrefcnt && !force) {
651 /*
652 * vnode_rele and vnode_put drop the vnode lock before
653 * calling VNOP_INACTIVE, so there is a race were the
654 * vnode could become active again. Perhaps there are
655 * other places where this can happen, so if we've got
656 * here we need to get out.
657 */
658 #ifdef NFS_NODE_DEBUG
659 NP(np, "nfs_vnop_inactive: still open: %d", np->n_openrefcnt);
660 #endif
661 lck_mtx_unlock(&np->n_openlock);
662 return 0;
663 }
664
665 TAILQ_FOREACH(nofp, &np->n_opens, nof_link) {
666 lck_mtx_lock(&nofp->nof_lock);
667 if (nofp->nof_flags & NFS_OPEN_FILE_BUSY) {
668 if (!force) {
669 NP(np, "nfs_vnop_inactive: open file busy");
670 }
671 busied = 0;
672 } else {
673 nofp->nof_flags |= NFS_OPEN_FILE_BUSY;
674 busied = 1;
675 }
676 lck_mtx_unlock(&nofp->nof_lock);
677 if ((np->n_flag & NREVOKE) || (nofp->nof_flags & NFS_OPEN_FILE_LOST)) {
678 if (busied) {
679 nfs_open_file_clear_busy(nofp);
680 }
681 continue;
682 }
683 /*
684 * If we just created the file, we already had it open in
685 * anticipation of getting a subsequent open call. If the
686 * node has gone inactive without being open, we need to
687 * clean up (close) the open done in the create.
688 */
689 #if CONFIG_NFS4
690 if ((nofp->nof_flags & NFS_OPEN_FILE_CREATE) && nofp->nof_creator && !force) {
691 if (nofp->nof_flags & NFS_OPEN_FILE_REOPEN) {
692 lck_mtx_unlock(&np->n_openlock);
693 if (busied) {
694 nfs_open_file_clear_busy(nofp);
695 }
696 if (inuse) {
697 nfs_mount_state_in_use_end(nmp, 0);
698 }
699 if (!nfs4_reopen(nofp, NULL)) {
700 goto restart;
701 }
702 }
703 nofp->nof_flags &= ~NFS_OPEN_FILE_CREATE;
704 lck_mtx_unlock(&np->n_openlock);
705 error = nfs_close(np, nofp, NFS_OPEN_SHARE_ACCESS_BOTH, NFS_OPEN_SHARE_DENY_NONE, ctx);
706 if (error) {
707 NP(np, "nfs_vnop_inactive: create close error: %d", error);
708 nofp->nof_flags |= NFS_OPEN_FILE_CREATE;
709 }
710 if (busied) {
711 nfs_open_file_clear_busy(nofp);
712 }
713 if (inuse) {
714 nfs_mount_state_in_use_end(nmp, error);
715 }
716 goto restart;
717 }
718 #endif
719 if (nofp->nof_flags & NFS_OPEN_FILE_NEEDCLOSE) {
720 /*
721 * If the file is marked as needing reopen, but this was the only
722 * open on the file, just drop the open.
723 */
724 nofp->nof_flags &= ~NFS_OPEN_FILE_NEEDCLOSE;
725 if ((nofp->nof_flags & NFS_OPEN_FILE_REOPEN) && (nofp->nof_opencnt == 1)) {
726 nofp->nof_flags &= ~NFS_OPEN_FILE_REOPEN;
727 nofp->nof_r--;
728 nofp->nof_opencnt--;
729 nofp->nof_access = 0;
730 } else if (!force) {
731 lck_mtx_unlock(&np->n_openlock);
732 if (nofp->nof_flags & NFS_OPEN_FILE_REOPEN) {
733 if (busied) {
734 nfs_open_file_clear_busy(nofp);
735 }
736 if (inuse) {
737 nfs_mount_state_in_use_end(nmp, 0);
738 }
739 #if CONFIG_NFS4
740 if (!nfs4_reopen(nofp, NULL)) {
741 goto restart;
742 }
743 #endif
744 }
745 error = nfs_close(np, nofp, NFS_OPEN_SHARE_ACCESS_READ, NFS_OPEN_SHARE_DENY_NONE, ctx);
746 if (error) {
747 NP(np, "nfs_vnop_inactive: need close error: %d", error);
748 nofp->nof_flags |= NFS_OPEN_FILE_NEEDCLOSE;
749 }
750 if (busied) {
751 nfs_open_file_clear_busy(nofp);
752 }
753 if (inuse) {
754 nfs_mount_state_in_use_end(nmp, error);
755 }
756 goto restart;
757 }
758 }
759 if (nofp->nof_opencnt && !force) {
760 NP(np, "nfs_vnop_inactive: file still open: %d", nofp->nof_opencnt);
761 }
762 if (!force && (nofp->nof_access || nofp->nof_deny ||
763 nofp->nof_mmap_access || nofp->nof_mmap_deny ||
764 nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
765 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
766 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw ||
767 nofp->nof_d_r || nofp->nof_d_w || nofp->nof_d_rw ||
768 nofp->nof_d_r_dw || nofp->nof_d_w_dw || nofp->nof_d_rw_dw ||
769 nofp->nof_d_r_drw || nofp->nof_d_w_drw || nofp->nof_d_rw_drw)) {
770 NP(np, "nfs_vnop_inactive: non-zero access: %d %d %d %d # %u.%u %u.%u %u.%u dw %u.%u %u.%u %u.%u drw %u.%u %u.%u %u.%u",
771 nofp->nof_access, nofp->nof_deny,
772 nofp->nof_mmap_access, nofp->nof_mmap_deny,
773 nofp->nof_r, nofp->nof_d_r,
774 nofp->nof_w, nofp->nof_d_w,
775 nofp->nof_rw, nofp->nof_d_rw,
776 nofp->nof_r_dw, nofp->nof_d_r_dw,
777 nofp->nof_w_dw, nofp->nof_d_w_dw,
778 nofp->nof_rw_dw, nofp->nof_d_rw_dw,
779 nofp->nof_r_drw, nofp->nof_d_r_drw,
780 nofp->nof_w_drw, nofp->nof_d_w_drw,
781 nofp->nof_rw_drw, nofp->nof_d_rw_drw);
782 }
783 if (busied) {
784 nfs_open_file_clear_busy(nofp);
785 }
786 }
787 lck_mtx_unlock(&np->n_openlock);
788
789 if (inuse && nfs_mount_state_in_use_end(nmp, error)) {
790 goto restart;
791 }
792
793 nfs_node_lock_force(np);
794
795 if (vnode_vtype(vp) != VDIR) {
796 nsp = np->n_sillyrename;
797 np->n_sillyrename = NULL;
798 } else {
799 nsp = NULL;
800 }
801
802 FSDBG_TOP(264, vp, np, np->n_flag, nsp);
803
804 if (!nsp) {
805 /* no silly file to clean up... */
806 /* clear all flags other than these */
807 np->n_flag &= (NMODIFIED);
808 nfs_node_unlock(np);
809 FSDBG_BOT(264, vp, np, np->n_flag, 0);
810 return 0;
811 }
812 nfs_node_unlock(np);
813
814 /* Remove the silly file that was rename'd earlier */
815
816 /* flush all the buffers */
817 nfs_vinvalbuf2(vp, V_SAVE, vfs_context_thread(ctx), nsp->nsr_cred, 1);
818
819 /* try to get the latest attributes */
820 attrerr = nfs_getattr(np, &nvattr, ctx, NGA_UNCACHED);
821
822 /* Check if we should remove it from the node hash. */
823 /* Leave it if inuse or it has multiple hard links. */
824 if (vnode_isinuse(vp, 0) || (!attrerr && (nvattr.nva_nlink > 1))) {
825 unhash = 0;
826 } else {
827 unhash = 1;
828 ubc_setsize(vp, 0);
829 }
830
831 /* mark this node and the directory busy while we do the remove */
832 busyerror = nfs_node_set_busy2(nsp->nsr_dnp, np, vfs_context_thread(ctx));
833
834 /* lock the node while we remove the silly file */
835 lck_mtx_lock(nfs_node_hash_mutex);
836 while (np->n_hflag & NHLOCKED) {
837 np->n_hflag |= NHLOCKWANT;
838 msleep(np, nfs_node_hash_mutex, PINOD, "nfs_inactive", NULL);
839 }
840 np->n_hflag |= NHLOCKED;
841 lck_mtx_unlock(nfs_node_hash_mutex);
842
843 /* purge the name cache to deter others from finding it */
844 bzero(&cn, sizeof(cn));
845 cn.cn_nameptr = nsp->nsr_name;
846 cn.cn_namelen = nsp->nsr_namlen;
847 nfs_name_cache_purge(nsp->nsr_dnp, np, &cn, ctx);
848
849 FSDBG(264, np, np->n_size, np->n_vattr.nva_size, 0xf00d00f1);
850
851 /* now remove the silly file */
852 nfs_removeit(nsp);
853
854 /* clear all flags other than these */
855 nfs_node_lock_force(np);
856 np->n_flag &= (NMODIFIED);
857 nfs_node_unlock(np);
858
859 if (!busyerror) {
860 nfs_node_clear_busy2(nsp->nsr_dnp, np);
861 }
862
863 if (unhash && vnode_isinuse(vp, 0)) {
864 /* vnode now inuse after silly remove? */
865 unhash = 0;
866 ubc_setsize(vp, np->n_size);
867 }
868
869 lck_mtx_lock(nfs_node_hash_mutex);
870 if (unhash) {
871 /*
872 * remove nfsnode from hash now so we can't accidentally find it
873 * again if another object gets created with the same filehandle
874 * before this vnode gets reclaimed
875 */
876 if (np->n_hflag & NHHASHED) {
877 LIST_REMOVE(np, n_hash);
878 np->n_hflag &= ~NHHASHED;
879 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
880 }
881 vnode_recycle(vp);
882 }
883 /* unlock the node */
884 np->n_hflag &= ~NHLOCKED;
885 if (np->n_hflag & NHLOCKWANT) {
886 np->n_hflag &= ~NHLOCKWANT;
887 wakeup(np);
888 }
889 lck_mtx_unlock(nfs_node_hash_mutex);
890
891 /* cleanup sillyrename info */
892 if (nsp->nsr_cred != NOCRED) {
893 kauth_cred_unref(&nsp->nsr_cred);
894 }
895 vnode_rele(NFSTOV(nsp->nsr_dnp));
896 FREE_ZONE(nsp, sizeof(*nsp), M_NFSREQ);
897
898 FSDBG_BOT(264, vp, np, np->n_flag, 0);
899 return 0;
900 }
901
902 /*
903 * Reclaim an nfsnode so that it can be used for other purposes.
904 */
905 int
906 nfs_vnop_reclaim(
907 struct vnop_reclaim_args /* {
908 * struct vnodeop_desc *a_desc;
909 * vnode_t a_vp;
910 * vfs_context_t a_context;
911 * } */*ap)
912 {
913 vnode_t vp = ap->a_vp;
914 nfsnode_t np = VTONFS(vp);
915 struct nfs_open_file *nofp, *nextnofp;
916 struct nfs_file_lock *nflp, *nextnflp;
917 struct nfs_lock_owner *nlop, *nextnlop;
918 struct nfsmount *nmp = np->n_mount ? VFSTONFS(np->n_mount) : NFSTONMP(np);
919 mount_t mp = vnode_mount(vp);
920 int force;
921
922 FSDBG_TOP(265, vp, np, np->n_flag, 0);
923 force = (!mp || vfs_isforce(mp) || nfs_mount_gone(nmp));
924
925
926 /* There shouldn't be any open or lock state at this point */
927 lck_mtx_lock(&np->n_openlock);
928
929 #if CONFIG_NFS4
930 if (nmp && (nmp->nm_vers >= NFS_VER4)) {
931 /* need to drop a delegation */
932 if (np->n_dreturn.tqe_next != NFSNOLIST) {
933 /* remove this node from the delegation return list */
934 lck_mtx_lock(&nmp->nm_lock);
935 if (np->n_dreturn.tqe_next != NFSNOLIST) {
936 TAILQ_REMOVE(&nmp->nm_dreturnq, np, n_dreturn);
937 np->n_dreturn.tqe_next = NFSNOLIST;
938 }
939 lck_mtx_unlock(&nmp->nm_lock);
940 }
941 if (np->n_dlink.tqe_next != NFSNOLIST) {
942 /* remove this node from the delegation list */
943 lck_mtx_lock(&nmp->nm_lock);
944 if (np->n_dlink.tqe_next != NFSNOLIST) {
945 TAILQ_REMOVE(&nmp->nm_delegations, np, n_dlink);
946 np->n_dlink.tqe_next = NFSNOLIST;
947 }
948 lck_mtx_unlock(&nmp->nm_lock);
949 }
950 if ((np->n_openflags & N_DELEG_MASK) && !force) {
951 /* try to return the delegation */
952 np->n_openflags &= ~N_DELEG_MASK;
953 nfs4_delegreturn_rpc(nmp, np->n_fhp, np->n_fhsize, &np->n_dstateid,
954 R_RECOVER, vfs_context_thread(ctx), vfs_context_ucred(ctx));
955 }
956 if (np->n_attrdirfh) {
957 FREE(np->n_attrdirfh, M_TEMP);
958 np->n_attrdirfh = NULL;
959 }
960 }
961 #endif
962
963 /* clean up file locks */
964 TAILQ_FOREACH_SAFE(nflp, &np->n_locks, nfl_link, nextnflp) {
965 if (!(nflp->nfl_flags & NFS_FILE_LOCK_DEAD) && !force) {
966 NP(np, "nfs_vnop_reclaim: lock 0x%llx 0x%llx 0x%x (bc %d)",
967 nflp->nfl_start, nflp->nfl_end, nflp->nfl_flags, nflp->nfl_blockcnt);
968 }
969 if (!(nflp->nfl_flags & (NFS_FILE_LOCK_BLOCKED | NFS_FILE_LOCK_DEAD))) {
970 /* try sending an unlock RPC if it wasn't delegated */
971 if (!(nflp->nfl_flags & NFS_FILE_LOCK_DELEGATED) && !force) {
972 nmp->nm_funcs->nf_unlock_rpc(np, nflp->nfl_owner, F_WRLCK, nflp->nfl_start, nflp->nfl_end, R_RECOVER,
973 NULL, nflp->nfl_owner->nlo_open_owner->noo_cred);
974 }
975 lck_mtx_lock(&nflp->nfl_owner->nlo_lock);
976 TAILQ_REMOVE(&nflp->nfl_owner->nlo_locks, nflp, nfl_lolink);
977 lck_mtx_unlock(&nflp->nfl_owner->nlo_lock);
978 }
979 TAILQ_REMOVE(&np->n_locks, nflp, nfl_link);
980 nfs_file_lock_destroy(nflp);
981 }
982 /* clean up lock owners */
983 TAILQ_FOREACH_SAFE(nlop, &np->n_lock_owners, nlo_link, nextnlop) {
984 if (!TAILQ_EMPTY(&nlop->nlo_locks) && !force) {
985 NP(np, "nfs_vnop_reclaim: lock owner with locks");
986 }
987 TAILQ_REMOVE(&np->n_lock_owners, nlop, nlo_link);
988 nfs_lock_owner_destroy(nlop);
989 }
990 /* clean up open state */
991 if (np->n_openrefcnt && !force) {
992 NP(np, "nfs_vnop_reclaim: still open: %d", np->n_openrefcnt);
993 }
994 TAILQ_FOREACH_SAFE(nofp, &np->n_opens, nof_link, nextnofp) {
995 if (nofp->nof_flags & NFS_OPEN_FILE_BUSY) {
996 NP(np, "nfs_vnop_reclaim: open file busy");
997 }
998 if (!(np->n_flag & NREVOKE) && !(nofp->nof_flags & NFS_OPEN_FILE_LOST)) {
999 if (nofp->nof_opencnt && !force) {
1000 NP(np, "nfs_vnop_reclaim: file still open: %d", nofp->nof_opencnt);
1001 }
1002 if (!force && (nofp->nof_access || nofp->nof_deny ||
1003 nofp->nof_mmap_access || nofp->nof_mmap_deny ||
1004 nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
1005 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
1006 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw ||
1007 nofp->nof_d_r || nofp->nof_d_w || nofp->nof_d_rw ||
1008 nofp->nof_d_r_dw || nofp->nof_d_w_dw || nofp->nof_d_rw_dw ||
1009 nofp->nof_d_r_drw || nofp->nof_d_w_drw || nofp->nof_d_rw_drw)) {
1010 NP(np, "nfs_vnop_reclaim: non-zero access: %d %d %d %d # %u.%u %u.%u %u.%u dw %u.%u %u.%u %u.%u drw %u.%u %u.%u %u.%u",
1011 nofp->nof_access, nofp->nof_deny,
1012 nofp->nof_mmap_access, nofp->nof_mmap_deny,
1013 nofp->nof_r, nofp->nof_d_r,
1014 nofp->nof_w, nofp->nof_d_w,
1015 nofp->nof_rw, nofp->nof_d_rw,
1016 nofp->nof_r_dw, nofp->nof_d_r_dw,
1017 nofp->nof_w_dw, nofp->nof_d_w_dw,
1018 nofp->nof_rw_dw, nofp->nof_d_rw_dw,
1019 nofp->nof_r_drw, nofp->nof_d_r_drw,
1020 nofp->nof_w_drw, nofp->nof_d_w_drw,
1021 nofp->nof_rw_drw, nofp->nof_d_rw_drw);
1022 #if CONFIG_NFS4
1023 /* try sending a close RPC if it wasn't delegated */
1024 if (nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
1025 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
1026 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw) {
1027 nfs4_close_rpc(np, nofp, NULL, nofp->nof_owner->noo_cred, R_RECOVER);
1028 }
1029 #endif
1030 }
1031 }
1032 TAILQ_REMOVE(&np->n_opens, nofp, nof_link);
1033 nfs_open_file_destroy(nofp);
1034 }
1035 lck_mtx_unlock(&np->n_openlock);
1036
1037 if (np->n_monlink.le_next != NFSNOLIST) {
1038 /* Wait for any in-progress getattr to complete, */
1039 /* then remove this node from the monitored node list. */
1040 lck_mtx_lock(&nmp->nm_lock);
1041 while (np->n_mflag & NMMONSCANINPROG) {
1042 struct timespec ts = { .tv_sec = 1, .tv_nsec = 0 };
1043 np->n_mflag |= NMMONSCANWANT;
1044 msleep(&np->n_mflag, &nmp->nm_lock, PZERO - 1, "nfswaitmonscan", &ts);
1045 }
1046 if (np->n_monlink.le_next != NFSNOLIST) {
1047 LIST_REMOVE(np, n_monlink);
1048 np->n_monlink.le_next = NFSNOLIST;
1049 }
1050 lck_mtx_unlock(&nmp->nm_lock);
1051 }
1052
1053 lck_mtx_lock(nfs_buf_mutex);
1054 if (!force && (!LIST_EMPTY(&np->n_dirtyblkhd) || !LIST_EMPTY(&np->n_cleanblkhd))) {
1055 NP(np, "nfs_reclaim: dropping %s buffers", (!LIST_EMPTY(&np->n_dirtyblkhd) ? "dirty" : "clean"));
1056 }
1057 lck_mtx_unlock(nfs_buf_mutex);
1058 nfs_vinvalbuf(vp, V_IGNORE_WRITEERR, ap->a_context, 0);
1059
1060 lck_mtx_lock(nfs_node_hash_mutex);
1061
1062 if ((vnode_vtype(vp) != VDIR) && np->n_sillyrename) {
1063 if (!force) {
1064 NP(np, "nfs_reclaim: leaving unlinked file %s", np->n_sillyrename->nsr_name);
1065 }
1066 if (np->n_sillyrename->nsr_cred != NOCRED) {
1067 kauth_cred_unref(&np->n_sillyrename->nsr_cred);
1068 }
1069 vnode_rele(NFSTOV(np->n_sillyrename->nsr_dnp));
1070 FREE_ZONE(np->n_sillyrename, sizeof(*np->n_sillyrename), M_NFSREQ);
1071 }
1072
1073 vnode_removefsref(vp);
1074
1075 if (np->n_hflag & NHHASHED) {
1076 LIST_REMOVE(np, n_hash);
1077 np->n_hflag &= ~NHHASHED;
1078 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
1079 }
1080 lck_mtx_unlock(nfs_node_hash_mutex);
1081
1082 /*
1083 * Free up any directory cookie structures and large file handle
1084 * structures that might be associated with this nfs node.
1085 */
1086 nfs_node_lock_force(np);
1087 if ((vnode_vtype(vp) == VDIR) && np->n_cookiecache) {
1088 FREE_ZONE(np->n_cookiecache, sizeof(struct nfsdmap), M_NFSDIROFF);
1089 }
1090 if (np->n_fhsize > NFS_SMALLFH) {
1091 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
1092 }
1093 if (np->n_vattr.nva_acl) {
1094 kauth_acl_free(np->n_vattr.nva_acl);
1095 }
1096 nfs_node_unlock(np);
1097 vnode_clearfsnode(vp);
1098
1099 if (np->n_parent) {
1100 if (!vnode_get(np->n_parent)) {
1101 vnode_rele(np->n_parent);
1102 vnode_put(np->n_parent);
1103 }
1104 np->n_parent = NULL;
1105 }
1106
1107 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
1108 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
1109 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
1110
1111 FSDBG_BOT(265, vp, np, np->n_flag, 0xd1ed1e);
1112 FREE_ZONE(np, sizeof(struct nfsnode), M_NFSNODE);
1113 return 0;
1114 }
1115
1116 /*
1117 * Acquire an NFS node lock
1118 */
1119
1120 int
1121 nfs_node_lock_internal(nfsnode_t np, int force)
1122 {
1123 FSDBG_TOP(268, np, force, 0, 0);
1124 lck_mtx_lock(&np->n_lock);
1125 if (!force && !(np->n_hflag && NHHASHED)) {
1126 FSDBG_BOT(268, np, 0xdead, 0, 0);
1127 lck_mtx_unlock(&np->n_lock);
1128 return ENOENT;
1129 }
1130 FSDBG_BOT(268, np, force, 0, 0);
1131 return 0;
1132 }
1133
1134 int
1135 nfs_node_lock(nfsnode_t np)
1136 {
1137 return nfs_node_lock_internal(np, 0);
1138 }
1139
1140 void
1141 nfs_node_lock_force(nfsnode_t np)
1142 {
1143 nfs_node_lock_internal(np, 1);
1144 }
1145
1146 /*
1147 * Release an NFS node lock
1148 */
1149 void
1150 nfs_node_unlock(nfsnode_t np)
1151 {
1152 FSDBG(269, np, current_thread(), 0, 0);
1153 lck_mtx_unlock(&np->n_lock);
1154 }
1155
1156 /*
1157 * Acquire 2 NFS node locks
1158 * - locks taken in reverse address order
1159 * - both or neither of the locks are taken
1160 * - only one lock taken per node (dup nodes are skipped)
1161 */
1162 int
1163 nfs_node_lock2(nfsnode_t np1, nfsnode_t np2)
1164 {
1165 nfsnode_t first, second;
1166 int error;
1167
1168 first = (np1 > np2) ? np1 : np2;
1169 second = (np1 > np2) ? np2 : np1;
1170 if ((error = nfs_node_lock(first))) {
1171 return error;
1172 }
1173 if (np1 == np2) {
1174 return error;
1175 }
1176 if ((error = nfs_node_lock(second))) {
1177 nfs_node_unlock(first);
1178 }
1179 return error;
1180 }
1181
1182 void
1183 nfs_node_unlock2(nfsnode_t np1, nfsnode_t np2)
1184 {
1185 nfs_node_unlock(np1);
1186 if (np1 != np2) {
1187 nfs_node_unlock(np2);
1188 }
1189 }
1190
1191 /*
1192 * Manage NFS node busy state.
1193 * (Similar to NFS node locks above)
1194 */
1195 int
1196 nfs_node_set_busy(nfsnode_t np, thread_t thd)
1197 {
1198 struct timespec ts = { .tv_sec = 2, .tv_nsec = 0 };
1199 int error;
1200
1201 if ((error = nfs_node_lock(np))) {
1202 return error;
1203 }
1204 while (ISSET(np->n_flag, NBUSY)) {
1205 SET(np->n_flag, NBUSYWANT);
1206 msleep(np, &np->n_lock, PZERO - 1, "nfsbusywant", &ts);
1207 if ((error = nfs_sigintr(NFSTONMP(np), NULL, thd, 0))) {
1208 break;
1209 }
1210 }
1211 if (!error) {
1212 SET(np->n_flag, NBUSY);
1213 }
1214 nfs_node_unlock(np);
1215 return error;
1216 }
1217
1218 void
1219 nfs_node_clear_busy(nfsnode_t np)
1220 {
1221 int wanted;
1222
1223 nfs_node_lock_force(np);
1224 wanted = ISSET(np->n_flag, NBUSYWANT);
1225 CLR(np->n_flag, NBUSY | NBUSYWANT);
1226 nfs_node_unlock(np);
1227 if (wanted) {
1228 wakeup(np);
1229 }
1230 }
1231
1232 int
1233 nfs_node_set_busy2(nfsnode_t np1, nfsnode_t np2, thread_t thd)
1234 {
1235 nfsnode_t first, second;
1236 int error;
1237
1238 first = (np1 > np2) ? np1 : np2;
1239 second = (np1 > np2) ? np2 : np1;
1240 if ((error = nfs_node_set_busy(first, thd))) {
1241 return error;
1242 }
1243 if (np1 == np2) {
1244 return error;
1245 }
1246 if ((error = nfs_node_set_busy(second, thd))) {
1247 nfs_node_clear_busy(first);
1248 }
1249 return error;
1250 }
1251
1252 void
1253 nfs_node_clear_busy2(nfsnode_t np1, nfsnode_t np2)
1254 {
1255 nfs_node_clear_busy(np1);
1256 if (np1 != np2) {
1257 nfs_node_clear_busy(np2);
1258 }
1259 }
1260
1261 /* helper function to sort four nodes in reverse address order (no dupes) */
1262 static void
1263 nfs_node_sort4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4, nfsnode_t *list, int *lcntp)
1264 {
1265 nfsnode_t na[2], nb[2];
1266 int a, b, i, lcnt;
1267
1268 /* sort pairs then merge */
1269 na[0] = (np1 > np2) ? np1 : np2;
1270 na[1] = (np1 > np2) ? np2 : np1;
1271 nb[0] = (np3 > np4) ? np3 : np4;
1272 nb[1] = (np3 > np4) ? np4 : np3;
1273 for (a = b = i = lcnt = 0; i < 4; i++) {
1274 if (a >= 2) {
1275 list[lcnt] = nb[b++];
1276 } else if ((b >= 2) || (na[a] >= nb[b])) {
1277 list[lcnt] = na[a++];
1278 } else {
1279 list[lcnt] = nb[b++];
1280 }
1281 if ((lcnt <= 0) || (list[lcnt] != list[lcnt - 1])) {
1282 lcnt++; /* omit dups */
1283 }
1284 }
1285 if (list[lcnt - 1] == NULL) {
1286 lcnt--;
1287 }
1288 *lcntp = lcnt;
1289 }
1290
1291 int
1292 nfs_node_set_busy4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4, thread_t thd)
1293 {
1294 nfsnode_t list[4];
1295 int i, lcnt, error;
1296
1297 nfs_node_sort4(np1, np2, np3, np4, list, &lcnt);
1298
1299 /* Now we can lock using list[0 - lcnt-1] */
1300 for (i = 0; i < lcnt; ++i) {
1301 if ((error = nfs_node_set_busy(list[i], thd))) {
1302 /* Drop any locks we acquired. */
1303 while (--i >= 0) {
1304 nfs_node_clear_busy(list[i]);
1305 }
1306 return error;
1307 }
1308 }
1309 return 0;
1310 }
1311
1312 void
1313 nfs_node_clear_busy4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4)
1314 {
1315 nfsnode_t list[4];
1316 int lcnt;
1317
1318 nfs_node_sort4(np1, np2, np3, np4, list, &lcnt);
1319 while (--lcnt >= 0) {
1320 nfs_node_clear_busy(list[lcnt]);
1321 }
1322 }
1323
1324 /*
1325 * Acquire an NFS node data lock
1326 */
1327 void
1328 nfs_data_lock(nfsnode_t np, int locktype)
1329 {
1330 nfs_data_lock_internal(np, locktype, 1);
1331 }
1332 void
1333 nfs_data_lock_noupdate(nfsnode_t np, int locktype)
1334 {
1335 nfs_data_lock_internal(np, locktype, 0);
1336 }
1337 void
1338 nfs_data_lock_internal(nfsnode_t np, int locktype, int updatesize)
1339 {
1340 FSDBG_TOP(270, np, locktype, np->n_datalockowner, 0);
1341 if (locktype == NFS_DATA_LOCK_SHARED) {
1342 if (updatesize && ISSET(np->n_flag, NUPDATESIZE)) {
1343 nfs_data_update_size(np, 0);
1344 }
1345 lck_rw_lock_shared(&np->n_datalock);
1346 } else {
1347 lck_rw_lock_exclusive(&np->n_datalock);
1348 np->n_datalockowner = current_thread();
1349 if (updatesize && ISSET(np->n_flag, NUPDATESIZE)) {
1350 nfs_data_update_size(np, 1);
1351 }
1352 }
1353 FSDBG_BOT(270, np, locktype, np->n_datalockowner, 0);
1354 }
1355
1356 /*
1357 * Release an NFS node data lock
1358 */
1359 void
1360 nfs_data_unlock(nfsnode_t np)
1361 {
1362 nfs_data_unlock_internal(np, 1);
1363 }
1364 void
1365 nfs_data_unlock_noupdate(nfsnode_t np)
1366 {
1367 nfs_data_unlock_internal(np, 0);
1368 }
1369 void
1370 nfs_data_unlock_internal(nfsnode_t np, int updatesize)
1371 {
1372 int mine = (np->n_datalockowner == current_thread());
1373 FSDBG_TOP(271, np, np->n_datalockowner, current_thread(), 0);
1374 if (updatesize && mine && ISSET(np->n_flag, NUPDATESIZE)) {
1375 nfs_data_update_size(np, 1);
1376 }
1377 np->n_datalockowner = NULL;
1378 lck_rw_done(&np->n_datalock);
1379 if (updatesize && !mine && ISSET(np->n_flag, NUPDATESIZE)) {
1380 nfs_data_update_size(np, 0);
1381 }
1382 FSDBG_BOT(271, np, np->n_datalockowner, current_thread(), 0);
1383 }
1384
1385
1386 /*
1387 * update an NFS node's size
1388 */
1389 void
1390 nfs_data_update_size(nfsnode_t np, int datalocked)
1391 {
1392 int error;
1393
1394 FSDBG_TOP(272, np, np->n_flag, np->n_size, np->n_newsize);
1395 if (!datalocked) {
1396 nfs_data_lock(np, NFS_DATA_LOCK_EXCLUSIVE);
1397 /* grabbing data lock will automatically update size */
1398 nfs_data_unlock(np);
1399 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1400 return;
1401 }
1402 error = nfs_node_lock(np);
1403 if (error || !ISSET(np->n_flag, NUPDATESIZE)) {
1404 if (!error) {
1405 nfs_node_unlock(np);
1406 }
1407 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1408 return;
1409 }
1410 CLR(np->n_flag, NUPDATESIZE);
1411 np->n_size = np->n_newsize;
1412 /* make sure we invalidate buffers the next chance we get */
1413 SET(np->n_flag, NNEEDINVALIDATE);
1414 nfs_node_unlock(np);
1415 ubc_setsize(NFSTOV(np), (off_t)np->n_size); /* XXX error? */
1416 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1417 }
1418
1419 #define DODEBUG 1
1420
1421 int
1422 nfs_mount_is_dirty(mount_t mp)
1423 {
1424 u_long i;
1425 nfsnode_t np;
1426 #ifdef DODEBUG
1427 struct timeval now, then, diff;
1428 u_long ncnt = 0;
1429 microuptime(&now);
1430 #endif
1431 lck_mtx_lock(nfs_node_hash_mutex);
1432 for (i = 0; i <= nfsnodehash; i++) {
1433 LIST_FOREACH(np, &nfsnodehashtbl[i], n_hash) {
1434 #ifdef DODEBUG
1435 ncnt++;
1436 #endif
1437 if (np->n_mount == mp && !LIST_EMPTY(&np->n_dirtyblkhd)) {
1438 goto out;
1439 }
1440 }
1441 }
1442 out:
1443 lck_mtx_unlock(nfs_node_hash_mutex);
1444 #ifdef DODEBUG
1445 microuptime(&then);
1446 timersub(&then, &now, &diff);
1447
1448 NFS_DBG(NFS_FAC_SOCK, 7, "mount_is_dirty for %s took %lld mics for %ld slots and %ld nodes return %d\n",
1449 vfs_statfs(mp)->f_mntfromname, (uint64_t)diff.tv_sec * 1000000LL + diff.tv_usec, i, ncnt, (i <= nfsnodehash));
1450 #endif
1451
1452 return i <= nfsnodehash;
1453 }