]> git.saurik.com Git - apple/xnu.git/blob - bsd/nfs/nfs_node.c
9563cc5de1b4aad486ae4617d4b3673521f09937
[apple/xnu.git] / bsd / nfs / nfs_node.c
1 /*
2 * Copyright (c) 2000-2013 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29 /*
30 * Copyright (c) 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 *
33 * This code is derived from software contributed to Berkeley by
34 * Rick Macklem at The University of Guelph.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
51 *
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
63 *
64 * @(#)nfs_node.c 8.6 (Berkeley) 5/22/95
65 * FreeBSD-Id: nfs_node.c,v 1.22 1997/10/28 14:06:20 bde Exp $
66 */
67
68
69 #include <sys/param.h>
70 #include <sys/kernel.h>
71 #include <sys/systm.h>
72 #include <sys/proc.h>
73 #include <sys/kauth.h>
74 #include <sys/mount_internal.h>
75 #include <sys/vnode_internal.h>
76 #include <sys/vnode.h>
77 #include <sys/ubc.h>
78 #include <sys/malloc.h>
79 #include <sys/fcntl.h>
80 #include <sys/time.h>
81
82 #include <nfs/rpcv2.h>
83 #include <nfs/nfsproto.h>
84 #include <nfs/nfs.h>
85 #include <nfs/nfsnode.h>
86 #include <nfs/nfs_gss.h>
87 #include <nfs/nfsmount.h>
88
89 #define NFSNOHASH(fhsum) \
90 (&nfsnodehashtbl[(fhsum) & nfsnodehash])
91 static LIST_HEAD(nfsnodehashhead, nfsnode) *nfsnodehashtbl;
92 static u_long nfsnodehash;
93
94 static lck_grp_t *nfs_node_hash_lck_grp;
95 static lck_grp_t *nfs_node_lck_grp;
96 static lck_grp_t *nfs_data_lck_grp;
97 lck_mtx_t *nfs_node_hash_mutex;
98
99 /*
100 * Initialize hash links for nfsnodes
101 * and build nfsnode free list.
102 */
103 void
104 nfs_nhinit(void)
105 {
106 nfs_node_hash_lck_grp = lck_grp_alloc_init("nfs_node_hash", LCK_GRP_ATTR_NULL);
107 nfs_node_hash_mutex = lck_mtx_alloc_init(nfs_node_hash_lck_grp, LCK_ATTR_NULL);
108 nfs_node_lck_grp = lck_grp_alloc_init("nfs_node", LCK_GRP_ATTR_NULL);
109 nfs_data_lck_grp = lck_grp_alloc_init("nfs_data", LCK_GRP_ATTR_NULL);
110 }
111
112 void
113 nfs_nhinit_finish(void)
114 {
115 lck_mtx_lock(nfs_node_hash_mutex);
116 if (!nfsnodehashtbl)
117 nfsnodehashtbl = hashinit(desiredvnodes, M_NFSNODE, &nfsnodehash);
118 lck_mtx_unlock(nfs_node_hash_mutex);
119 }
120
/*
 * Compute the checksum used to pick an nfsnode hash bucket: the plain
 * sum of the first fhsize bytes of the file handle.
 *
 * fhp     file handle bytes
 * fhsize  number of bytes to sum; zero or a negative value yields 0
 *
 * Returns the byte sum.  Callers reduce it to a bucket with NFSNOHASH().
 */
u_long
nfs_hash(u_char *fhp, int fhsize)
{
	u_long total = 0;
	int idx = 0;

	while (idx < fhsize) {
		total += fhp[idx];
		idx++;
	}
	return (total);
}
135
136
137 int nfs_case_insensitive(mount_t);
138
139 int
140 nfs_case_insensitive(mount_t mp)
141 {
142 struct nfsmount *nmp = VFSTONFS(mp);
143 int answer = 0;
144 int skip = 0;
145
146 if (nmp == NULL) {
147 return (0);
148 }
149
150 if (nmp->nm_vers == NFS_VER2) {
151 /* V2 has no way to know */
152 return (0);
153 }
154
155 lck_mtx_lock(&nmp->nm_lock);
156 if (nmp->nm_vers == NFS_VER3) {
157 if (!(nmp->nm_state & NFSSTA_GOTPATHCONF)) {
158 /* We're holding the node lock so we just return
159 * with answer as case sensitive. Is very rare
160 * for file systems not to be homogenous w.r.t. pathconf
161 */
162 skip = 1;
163 }
164 } else if (!(nmp->nm_fsattr.nfsa_flags & NFS_FSFLAG_HOMOGENEOUS)) {
165 /* no pathconf info cached */
166 skip = 1;
167 }
168
169 if (!skip && NFS_BITMAP_ISSET(nmp->nm_fsattr.nfsa_bitmap, NFS_FATTR_CASE_INSENSITIVE))
170 answer = 1;
171
172 lck_mtx_unlock(&nmp->nm_lock);
173
174 return (answer);
175 }
176
177
178 /*
179 * Look up a vnode/nfsnode by file handle.
180 * Callers must check for mount points!!
181 * In all cases, a pointer to a
182 * nfsnode structure is returned.
183 */
184 int
185 nfs_nget(
186 mount_t mp,
187 nfsnode_t dnp,
188 struct componentname *cnp,
189 u_char *fhp,
190 int fhsize,
191 struct nfs_vattr *nvap,
192 u_int64_t *xidp,
193 uint32_t auth,
194 int flags,
195 nfsnode_t *npp)
196 {
197 nfsnode_t np;
198 struct nfsnodehashhead *nhpp;
199 vnode_t vp;
200 int error, nfsvers;
201 mount_t mp2;
202 struct vnode_fsparam vfsp;
203 uint32_t vid;
204
205 FSDBG_TOP(263, mp, dnp, flags, npp);
206
207 /* Check for unmount in progress */
208 if (!mp || (mp->mnt_kern_flag & MNTK_FRCUNMOUNT)) {
209 *npp = NULL;
210 error = ENXIO;
211 FSDBG_BOT(263, mp, dnp, 0xd1e, error);
212 return (error);
213 }
214 nfsvers = VFSTONFS(mp)->nm_vers;
215
216 nhpp = NFSNOHASH(nfs_hash(fhp, fhsize));
217 loop:
218 lck_mtx_lock(nfs_node_hash_mutex);
219 for (np = nhpp->lh_first; np != 0; np = np->n_hash.le_next) {
220 mp2 = (np->n_hflag & NHINIT) ? np->n_mount : NFSTOMP(np);
221 if (mp != mp2 || np->n_fhsize != fhsize ||
222 bcmp(fhp, np->n_fhp, fhsize))
223 continue;
224 if (nvap && (nvap->nva_flags & NFS_FFLAG_TRIGGER_REFERRAL) &&
225 cnp && (cnp->cn_namelen > (fhsize - (int)sizeof(dnp)))) {
226 /* The name was too long to fit in the file handle. Check it against the node's name. */
227 int namecmp = 0;
228 const char *vname = vnode_getname(NFSTOV(np));
229 if (vname) {
230 if (cnp->cn_namelen != (int)strlen(vname))
231 namecmp = 1;
232 else
233 namecmp = strncmp(vname, cnp->cn_nameptr, cnp->cn_namelen);
234 vnode_putname(vname);
235 }
236 if (namecmp) /* full name didn't match */
237 continue;
238 }
239 FSDBG(263, dnp, np, np->n_flag, 0xcace0000);
240 /* if the node is locked, sleep on it */
241 if ((np->n_hflag & NHLOCKED) && !(flags & NG_NOCREATE)) {
242 np->n_hflag |= NHLOCKWANT;
243 FSDBG(263, dnp, np, np->n_flag, 0xcace2222);
244 msleep(np, nfs_node_hash_mutex, PDROP | PINOD, "nfs_nget", NULL);
245 FSDBG(263, dnp, np, np->n_flag, 0xcace3333);
246 goto loop;
247 }
248 vp = NFSTOV(np);
249 vid = vnode_vid(vp);
250 lck_mtx_unlock(nfs_node_hash_mutex);
251 if ((error = vnode_getwithvid(vp, vid))) {
252 /*
253 * If vnode is being reclaimed or has already
254 * changed identity, no need to wait.
255 */
256 FSDBG_BOT(263, dnp, *npp, 0xcace0d1e, error);
257 return (error);
258 }
259 if ((error = nfs_node_lock(np))) {
260 /* this only fails if the node is now unhashed */
261 /* so let's see if we can find/create it again */
262 FSDBG(263, dnp, *npp, 0xcaced1e2, error);
263 vnode_put(vp);
264 if (flags & NG_NOCREATE) {
265 *npp = 0;
266 FSDBG_BOT(263, dnp, *npp, 0xcaced1e0, ENOENT);
267 return (ENOENT);
268 }
269 goto loop;
270 }
271 /* update attributes */
272 if (nvap)
273 error = nfs_loadattrcache(np, nvap, xidp, 0);
274 if (error) {
275 nfs_node_unlock(np);
276 vnode_put(vp);
277 } else {
278 if (dnp && cnp && (flags & NG_MAKEENTRY))
279 cache_enter(NFSTOV(dnp), vp, cnp);
280 /*
281 * Update the vnode if the name/and or the parent has
282 * changed. We need to do this so that if getattrlist is
283 * called asking for ATTR_CMN_NAME, that the "most"
284 * correct name is being returned if we're not making an
285 * entry. In addition for monitored vnodes we need to
286 * kick the vnode out of the name cache. We do this so
287 * that if there are hard links in the same directory
288 * the link will not be found and a lookup will get us
289 * here to return the name of the current link. In
290 * addition by removing the name from the name cache the
291 * old name will not be found after a rename done on
292 * another client or the server. The principle reason
293 * to do this is because Finder is asking for
294 * notifications on a directory. The directory changes,
295 * Finder gets notified, reads the directory (which we
296 * have purged) and for each entry returned calls
297 * getattrlist with the name returned from
298 * readdir. gettattrlist has to call namei/lookup to
299 * resolve the name, because its not in the cache we end
300 * up here. We need to update the name so Finder will
301 * get the name it called us with.
302 *
303 * We had an imperfect solution with respect to case
304 * sensitivity. There is a test that is run in
305 * FileBuster that does renames from some name to
306 * another name differing only in case. It then reads
307 * the directory looking for the new name, after it
308 * finds that new name, it ask gettattrlist to verify
309 * that the name is the new name. Usually that works,
310 * but renames generate fsevents and fseventsd will do a
311 * lookup on the name via lstat. Since that test renames
312 * old name to new name back and forth there is a race
313 * that an fsevent will be behind and will access the
314 * file by the old name, on a case insensitive file
315 * system that will work. Problem is if we do a case
316 * sensitive compare, we're going to change the name,
317 * which the test's getattrlist verification step is
318 * going to fail. So we will check the case sensitivity
319 * of the file system and do the appropriate compare. In
320 * a rare instance for non homogeneous file systems
321 * w.r.t. pathconf we will use case sensitive compares.
322 * That could break if the file system is actually case
323 * insensitive.
324 *
325 * Note that V2 does not know the case, so we just
326 * assume case sensitivity.
327 *
328 * This is clearly not perfect due to races, but this is
329 * as good as its going to get. You can defeat the
330 * handling of hard links simply by doing:
331 *
332 * while :; do ls -l > /dev/null; done
333 *
334 * in a terminal window. Even a single ls -l can cause a
335 * race.
336 *
337 * <rant>What we really need is for the caller, that
338 * knows the name being used is valid since it got it
339 * from a readdir to use that name and not ask for the
340 * ATTR_CMN_NAME</rant>
341 */
342 if (dnp && cnp && (vp != NFSTOV(dnp))) {
343 int update_flags = vnode_ismonitored((NFSTOV(dnp))) ? VNODE_UPDATE_CACHE : 0;
344 int (*cmp)(const char *s1, const char *s2, size_t n);
345
346 cmp = nfs_case_insensitive(mp) ? strncasecmp : strncmp;
347
348 if (vp->v_name && cnp->cn_namelen && (*cmp)(cnp->cn_nameptr, vp->v_name, cnp->cn_namelen))
349 update_flags |= VNODE_UPDATE_NAME;
350 if ((vp->v_name == NULL && cnp->cn_namelen != 0) || (vp->v_name != NULL && cnp->cn_namelen == 0))
351 update_flags |= VNODE_UPDATE_NAME;
352 if (vnode_parent(vp) != NFSTOV(dnp))
353 update_flags |= VNODE_UPDATE_PARENT;
354 if (update_flags)
355 vnode_update_identity(vp, NFSTOV(dnp), cnp->cn_nameptr, cnp->cn_namelen, 0, update_flags);
356 }
357
358 *npp = np;
359 }
360 FSDBG_BOT(263, dnp, *npp, 0xcace0000, error);
361 return(error);
362 }
363
364 FSDBG(263, mp, dnp, npp, 0xaaaaaaaa);
365
366 if (flags & NG_NOCREATE) {
367 lck_mtx_unlock(nfs_node_hash_mutex);
368 *npp = 0;
369 FSDBG_BOT(263, dnp, *npp, 0x80000001, ENOENT);
370 return (ENOENT);
371 }
372
373 /*
374 * allocate and initialize nfsnode and stick it in the hash
375 * before calling getnewvnode(). Anyone finding it in the
376 * hash before initialization is complete will wait for it.
377 */
378 MALLOC_ZONE(np, nfsnode_t, sizeof *np, M_NFSNODE, M_WAITOK);
379 if (!np) {
380 lck_mtx_unlock(nfs_node_hash_mutex);
381 *npp = 0;
382 FSDBG_BOT(263, dnp, *npp, 0x80000001, ENOMEM);
383 return (ENOMEM);
384 }
385 bzero(np, sizeof *np);
386 np->n_hflag |= (NHINIT | NHLOCKED);
387 np->n_mount = mp;
388 np->n_auth = auth;
389 TAILQ_INIT(&np->n_opens);
390 TAILQ_INIT(&np->n_lock_owners);
391 TAILQ_INIT(&np->n_locks);
392 np->n_dlink.tqe_next = NFSNOLIST;
393 np->n_dreturn.tqe_next = NFSNOLIST;
394 np->n_monlink.le_next = NFSNOLIST;
395
396 /* ugh... need to keep track of ".zfs" directories to workaround server bugs */
397 if ((nvap->nva_type == VDIR) && cnp && (cnp->cn_namelen == 4) &&
398 (cnp->cn_nameptr[0] == '.') && (cnp->cn_nameptr[1] == 'z') &&
399 (cnp->cn_nameptr[2] == 'f') && (cnp->cn_nameptr[3] == 's'))
400 np->n_flag |= NISDOTZFS;
401 if (dnp && (dnp->n_flag & NISDOTZFS))
402 np->n_flag |= NISDOTZFSCHILD;
403
404 if (dnp && cnp && ((cnp->cn_namelen != 2) ||
405 (cnp->cn_nameptr[0] != '.') || (cnp->cn_nameptr[1] != '.'))) {
406 vnode_t dvp = NFSTOV(dnp);
407 if (!vnode_get(dvp)) {
408 if (!vnode_ref(dvp))
409 np->n_parent = dvp;
410 vnode_put(dvp);
411 }
412 }
413
414 /* setup node's file handle */
415 if (fhsize > NFS_SMALLFH) {
416 MALLOC_ZONE(np->n_fhp, u_char *,
417 fhsize, M_NFSBIGFH, M_WAITOK);
418 if (!np->n_fhp) {
419 lck_mtx_unlock(nfs_node_hash_mutex);
420 FREE_ZONE(np, sizeof *np, M_NFSNODE);
421 *npp = 0;
422 FSDBG_BOT(263, dnp, *npp, 0x80000002, ENOMEM);
423 return (ENOMEM);
424 }
425 } else {
426 np->n_fhp = &np->n_fh[0];
427 }
428 bcopy(fhp, np->n_fhp, fhsize);
429 np->n_fhsize = fhsize;
430
431 /* Insert the nfsnode in the hash queue for its new file handle */
432 LIST_INSERT_HEAD(nhpp, np, n_hash);
433 np->n_hflag |= NHHASHED;
434 FSDBG(266, 0, np, np->n_flag, np->n_hflag);
435
436 /* lock the new nfsnode */
437 lck_mtx_init(&np->n_lock, nfs_node_lck_grp, LCK_ATTR_NULL);
438 lck_rw_init(&np->n_datalock, nfs_data_lck_grp, LCK_ATTR_NULL);
439 lck_mtx_init(&np->n_openlock, nfs_open_grp, LCK_ATTR_NULL);
440 lck_mtx_lock(&np->n_lock);
441
442 /* release lock on hash table */
443 lck_mtx_unlock(nfs_node_hash_mutex);
444
445 /* do initial loading of attributes */
446 NACLINVALIDATE(np);
447 NACCESSINVALIDATE(np);
448 error = nfs_loadattrcache(np, nvap, xidp, 1);
449 if (error) {
450 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
451 nfs_node_unlock(np);
452 lck_mtx_lock(nfs_node_hash_mutex);
453 LIST_REMOVE(np, n_hash);
454 np->n_hflag &= ~(NHHASHED|NHINIT|NHLOCKED);
455 if (np->n_hflag & NHLOCKWANT) {
456 np->n_hflag &= ~NHLOCKWANT;
457 wakeup(np);
458 }
459 lck_mtx_unlock(nfs_node_hash_mutex);
460 if (np->n_parent) {
461 if (!vnode_get(np->n_parent)) {
462 vnode_rele(np->n_parent);
463 vnode_put(np->n_parent);
464 }
465 np->n_parent = NULL;
466 }
467 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
468 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
469 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
470 if (np->n_fhsize > NFS_SMALLFH)
471 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
472 FREE_ZONE(np, sizeof *np, M_NFSNODE);
473 *npp = 0;
474 FSDBG_BOT(263, dnp, *npp, 0x80000003, error);
475 return (error);
476 }
477 NFS_CHANGED_UPDATE(nfsvers, np, nvap);
478 if (nvap->nva_type == VDIR)
479 NFS_CHANGED_UPDATE_NC(nfsvers, np, nvap);
480
481 /* now, attempt to get a new vnode */
482 vfsp.vnfs_mp = mp;
483 vfsp.vnfs_vtype = nvap->nva_type;
484 vfsp.vnfs_str = "nfs";
485 vfsp.vnfs_dvp = dnp ? NFSTOV(dnp) : NULL;
486 vfsp.vnfs_fsnode = np;
487 if (nfsvers == NFS_VER4) {
488 #if FIFO
489 if (nvap->nva_type == VFIFO)
490 vfsp.vnfs_vops = fifo_nfsv4nodeop_p;
491 else
492 #endif /* FIFO */
493 if (nvap->nva_type == VBLK || nvap->nva_type == VCHR)
494 vfsp.vnfs_vops = spec_nfsv4nodeop_p;
495 else
496 vfsp.vnfs_vops = nfsv4_vnodeop_p;
497 } else {
498 #if FIFO
499 if (nvap->nva_type == VFIFO)
500 vfsp.vnfs_vops = fifo_nfsv2nodeop_p;
501 else
502 #endif /* FIFO */
503 if (nvap->nva_type == VBLK || nvap->nva_type == VCHR)
504 vfsp.vnfs_vops = spec_nfsv2nodeop_p;
505 else
506 vfsp.vnfs_vops = nfsv2_vnodeop_p;
507 }
508 vfsp.vnfs_markroot = (flags & NG_MARKROOT) ? 1 : 0;
509 vfsp.vnfs_marksystem = 0;
510 vfsp.vnfs_rdev = 0;
511 vfsp.vnfs_filesize = nvap->nva_size;
512 vfsp.vnfs_cnp = cnp;
513 vfsp.vnfs_flags = VNFS_ADDFSREF;
514 if (!dnp || !cnp || !(flags & NG_MAKEENTRY))
515 vfsp.vnfs_flags |= VNFS_NOCACHE;
516
517 #if CONFIG_TRIGGERS
518 if ((nfsvers >= NFS_VER4) && (nvap->nva_type == VDIR) && (np->n_vattr.nva_flags & NFS_FFLAG_TRIGGER)) {
519 struct vnode_trigger_param vtp;
520 bzero(&vtp, sizeof(vtp));
521 bcopy(&vfsp, &vtp.vnt_params, sizeof(vfsp));
522 vtp.vnt_resolve_func = nfs_mirror_mount_trigger_resolve;
523 vtp.vnt_unresolve_func = nfs_mirror_mount_trigger_unresolve;
524 vtp.vnt_rearm_func = nfs_mirror_mount_trigger_rearm;
525 vtp.vnt_flags = VNT_AUTO_REARM;
526 error = vnode_create(VNCREATE_TRIGGER, VNCREATE_TRIGGER_SIZE, &vtp, &np->n_vnode);
527 } else
528 #endif
529 {
530 error = vnode_create(VNCREATE_FLAVOR, VCREATESIZE, &vfsp, &np->n_vnode);
531 }
532 if (error) {
533 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
534 nfs_node_unlock(np);
535 lck_mtx_lock(nfs_node_hash_mutex);
536 LIST_REMOVE(np, n_hash);
537 np->n_hflag &= ~(NHHASHED|NHINIT|NHLOCKED);
538 if (np->n_hflag & NHLOCKWANT) {
539 np->n_hflag &= ~NHLOCKWANT;
540 wakeup(np);
541 }
542 lck_mtx_unlock(nfs_node_hash_mutex);
543 if (np->n_parent) {
544 if (!vnode_get(np->n_parent)) {
545 vnode_rele(np->n_parent);
546 vnode_put(np->n_parent);
547 }
548 np->n_parent = NULL;
549 }
550 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
551 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
552 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
553 if (np->n_fhsize > NFS_SMALLFH)
554 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
555 FREE_ZONE(np, sizeof *np, M_NFSNODE);
556 *npp = 0;
557 FSDBG_BOT(263, dnp, *npp, 0x80000004, error);
558 return (error);
559 }
560 vp = np->n_vnode;
561 vnode_settag(vp, VT_NFS);
562 /* node is now initialized */
563
564 /* check if anyone's waiting on this node */
565 lck_mtx_lock(nfs_node_hash_mutex);
566 np->n_hflag &= ~(NHINIT|NHLOCKED);
567 if (np->n_hflag & NHLOCKWANT) {
568 np->n_hflag &= ~NHLOCKWANT;
569 wakeup(np);
570 }
571 lck_mtx_unlock(nfs_node_hash_mutex);
572
573 *npp = np;
574
575 FSDBG_BOT(263, dnp, vp, *npp, error);
576 return (error);
577 }
578
579
/*
 * Vnode "inactive" operation for NFS vnodes.
 *
 * First walks the node's open files (n_opens): an open left over from
 * a create, or one flagged NFS_OPEN_FILE_NEEDCLOSE, is closed with
 * nfs_close(); any other leftover open state is only logged.  Each
 * close drops n_openlock, so the walk starts over ("restart") afterward.
 * Logging and closing are skipped when the mount is gone or being
 * forcibly unmounted ("force").
 *
 * Then, for a non-directory with a pending silly rename, flushes its
 * buffers, removes the silly-renamed file and, when the vnode is not
 * in use and the file had no other hard links, unhashes the node and
 * asks for the vnode to be recycled.
 *
 * Always returns 0.
 */
580 int
581 nfs_vnop_inactive(ap)
582 struct vnop_inactive_args /* {
583 struct vnodeop_desc *a_desc;
584 vnode_t a_vp;
585 vfs_context_t a_context;
586 } */ *ap;
587 {
588 vnode_t vp = ap->a_vp;
589 vfs_context_t ctx = ap->a_context;
590 nfsnode_t np = VTONFS(ap->a_vp);
591 struct nfs_sillyrename *nsp;
592 struct nfs_vattr nvattr;
593 int unhash, attrerr, busyerror, error, inuse, busied, force;
594 struct nfs_open_file *nofp;
595 struct componentname cn;
596 struct nfsmount *nmp = NFSTONMP(np);
597 mount_t mp = vnode_mount(vp);
598
599 restart:
/* force: no mount, or a forced unmount is in progress -- skip RPCs and complaints */
600 force = (!mp || (mp->mnt_kern_flag & MNTK_FRCUNMOUNT));
601 error = 0;
/* inuse records whether a matching nfs_mount_state_in_use_end() is owed */
602 inuse = (nfs_mount_state_in_use_start(nmp, NULL) == 0);
603
604 /* There shouldn't be any open or lock state at this point */
605 lck_mtx_lock(&np->n_openlock);
606 if (np->n_openrefcnt && !force)
607 NP(np, "nfs_vnop_inactive: still open: %d", np->n_openrefcnt);
608 TAILQ_FOREACH(nofp, &np->n_opens, nof_link) {
/* try to mark the open file busy; busied records whether we own the busy flag */
609 lck_mtx_lock(&nofp->nof_lock);
610 if (nofp->nof_flags & NFS_OPEN_FILE_BUSY) {
611 if (!force)
612 NP(np, "nfs_vnop_inactive: open file busy");
613 busied = 0;
614 } else {
615 nofp->nof_flags |= NFS_OPEN_FILE_BUSY;
616 busied = 1;
617 }
618 lck_mtx_unlock(&nofp->nof_lock);
/* nothing to clean up for revoked nodes or lost opens */
619 if ((np->n_flag & NREVOKE) || (nofp->nof_flags & NFS_OPEN_FILE_LOST)) {
620 if (busied)
621 nfs_open_file_clear_busy(nofp);
622 continue;
623 }
624 /*
625 * If we just created the file, we already had it open in
626 * anticipation of getting a subsequent open call. If the
627 * node has gone inactive without being open, we need to
628 * clean up (close) the open done in the create.
629 */
630 if ((nofp->nof_flags & NFS_OPEN_FILE_CREATE) && nofp->nof_creator && !force) {
631 if (nofp->nof_flags & NFS_OPEN_FILE_REOPEN) {
632 lck_mtx_unlock(&np->n_openlock);
633 if (busied)
634 nfs_open_file_clear_busy(nofp);
635 if (inuse)
636 nfs_mount_state_in_use_end(nmp, 0);
637 if (!nfs4_reopen(nofp, NULL))
638 goto restart;
/*
 * NOTE(review): if nfs4_reopen() fails we fall through here having
 * already dropped n_openlock, the busy flag and the in-use state,
 * yet the code below unlocks n_openlock and releases the other two
 * again.  Looks like a double unlock/release -- confirm and fix.
 */
639 }
640 nofp->nof_flags &= ~NFS_OPEN_FILE_CREATE;
641 lck_mtx_unlock(&np->n_openlock);
642 error = nfs_close(np, nofp, NFS_OPEN_SHARE_ACCESS_BOTH, NFS_OPEN_SHARE_DENY_NONE, ctx);
643 if (error) {
644 NP(np, "nfs_vnop_inactive: create close error: %d", error);
/* close failed: put the flag back so the open is still seen as a create-open */
645 nofp->nof_flags |= NFS_OPEN_FILE_CREATE;
646 }
647 if (busied)
648 nfs_open_file_clear_busy(nofp);
649 if (inuse)
650 nfs_mount_state_in_use_end(nmp, error);
/* n_openlock was dropped, so the list walk must start over */
651 goto restart;
652 }
653 if (nofp->nof_flags & NFS_OPEN_FILE_NEEDCLOSE) {
654 /*
655 * If the file is marked as needing reopen, but this was the only
656 * open on the file, just drop the open.
657 */
658 nofp->nof_flags &= ~NFS_OPEN_FILE_NEEDCLOSE;
659 if ((nofp->nof_flags & NFS_OPEN_FILE_REOPEN) && (nofp->nof_opencnt == 1)) {
660 nofp->nof_flags &= ~NFS_OPEN_FILE_REOPEN;
661 nofp->nof_r--;
662 nofp->nof_opencnt--;
663 nofp->nof_access = 0;
664 } else if (!force) {
665 lck_mtx_unlock(&np->n_openlock);
666 if (nofp->nof_flags & NFS_OPEN_FILE_REOPEN) {
667 if (busied)
668 nfs_open_file_clear_busy(nofp);
669 if (inuse)
670 nfs_mount_state_in_use_end(nmp, 0);
671 if (!nfs4_reopen(nofp, NULL))
672 goto restart;
/*
 * NOTE(review): on nfs4_reopen() failure the busy flag and in-use
 * state released just above are released a second time below.
 */
673 }
674 error = nfs_close(np, nofp, NFS_OPEN_SHARE_ACCESS_READ, NFS_OPEN_SHARE_DENY_NONE, ctx);
675 if (error) {
676 NP(np, "nfs_vnop_inactive: need close error: %d", error);
677 nofp->nof_flags |= NFS_OPEN_FILE_NEEDCLOSE;
678 }
679 if (busied)
680 nfs_open_file_clear_busy(nofp);
681 if (inuse)
682 nfs_mount_state_in_use_end(nmp, error);
683 goto restart;
684 }
685 }
/* anything still recorded on the open file is unexpected: log it (unless forced) */
686 if (nofp->nof_opencnt && !force)
687 NP(np, "nfs_vnop_inactive: file still open: %d", nofp->nof_opencnt);
688 if (!force && (nofp->nof_access || nofp->nof_deny ||
689 nofp->nof_mmap_access || nofp->nof_mmap_deny ||
690 nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
691 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
692 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw ||
693 nofp->nof_d_r || nofp->nof_d_w || nofp->nof_d_rw ||
694 nofp->nof_d_r_dw || nofp->nof_d_w_dw || nofp->nof_d_rw_dw ||
695 nofp->nof_d_r_drw || nofp->nof_d_w_drw || nofp->nof_d_rw_drw)) {
696 NP(np, "nfs_vnop_inactive: non-zero access: %d %d %d %d # %u.%u %u.%u %u.%u dw %u.%u %u.%u %u.%u drw %u.%u %u.%u %u.%u",
697 nofp->nof_access, nofp->nof_deny,
698 nofp->nof_mmap_access, nofp->nof_mmap_deny,
699 nofp->nof_r, nofp->nof_d_r,
700 nofp->nof_w, nofp->nof_d_w,
701 nofp->nof_rw, nofp->nof_d_rw,
702 nofp->nof_r_dw, nofp->nof_d_r_dw,
703 nofp->nof_w_dw, nofp->nof_d_w_dw,
704 nofp->nof_rw_dw, nofp->nof_d_rw_dw,
705 nofp->nof_r_drw, nofp->nof_d_r_drw,
706 nofp->nof_w_drw, nofp->nof_d_w_drw,
707 nofp->nof_rw_drw, nofp->nof_d_rw_drw);
708 }
709 if (busied)
710 nfs_open_file_clear_busy(nofp);
711 }
712 lck_mtx_unlock(&np->n_openlock);
713
/* a non-zero return from nfs_mount_state_in_use_end() sends us back to redo the walk */
714 if (inuse && nfs_mount_state_in_use_end(nmp, error))
715 goto restart;
716
717 nfs_node_lock_force(np);
718
/* take ownership of any pending silly rename; directories are never handled here */
719 if (vnode_vtype(vp) != VDIR) {
720 nsp = np->n_sillyrename;
721 np->n_sillyrename = NULL;
722 } else {
723 nsp = NULL;
724 }
725
726 FSDBG_TOP(264, vp, np, np->n_flag, nsp);
727
728 if (!nsp) {
729 /* no silly file to clean up... */
730 /* clear all flags other than these */
731 np->n_flag &= (NMODIFIED);
732 nfs_node_unlock(np);
733 FSDBG_BOT(264, vp, np, np->n_flag, 0);
734 return (0);
735 }
736 nfs_node_unlock(np);
737
738 /* Remove the silly file that was rename'd earlier */
739
740 /* flush all the buffers */
741 nfs_vinvalbuf2(vp, V_SAVE, vfs_context_thread(ctx), nsp->nsr_cred, 1);
742
743 /* try to get the latest attributes */
744 attrerr = nfs_getattr(np, &nvattr, ctx, NGA_UNCACHED);
745
746 /* Check if we should remove it from the node hash. */
747 /* Leave it if inuse or it has multiple hard links. */
748 if (vnode_isinuse(vp, 0) || (!attrerr && (nvattr.nva_nlink > 1))) {
749 unhash = 0;
750 } else {
751 unhash = 1;
752 ubc_setsize(vp, 0);
753 }
754
755 /* mark this node and the directory busy while we do the remove */
756 busyerror = nfs_node_set_busy2(nsp->nsr_dnp, np, vfs_context_thread(ctx));
757
758 /* lock the node while we remove the silly file */
/* (this is the NHLOCKED hash flag that nfs_nget() sleeps on, not n_lock) */
759 lck_mtx_lock(nfs_node_hash_mutex);
760 while (np->n_hflag & NHLOCKED) {
761 np->n_hflag |= NHLOCKWANT;
762 msleep(np, nfs_node_hash_mutex, PINOD, "nfs_inactive", NULL);
763 }
764 np->n_hflag |= NHLOCKED;
765 lck_mtx_unlock(nfs_node_hash_mutex);
766
767 /* purge the name cache to deter others from finding it */
768 bzero(&cn, sizeof(cn));
769 cn.cn_nameptr = nsp->nsr_name;
770 cn.cn_namelen = nsp->nsr_namlen;
771 nfs_name_cache_purge(nsp->nsr_dnp, np, &cn, ctx);
772
773 FSDBG(264, np, np->n_size, np->n_vattr.nva_size, 0xf00d00f1);
774
775 /* now remove the silly file */
776 nfs_removeit(nsp);
777
778 /* clear all flags other than these */
779 nfs_node_lock_force(np);
780 np->n_flag &= (NMODIFIED);
781 nfs_node_unlock(np);
782
/* only clear the busy state if setting it succeeded above */
783 if (!busyerror)
784 nfs_node_clear_busy2(nsp->nsr_dnp, np);
785
786 if (unhash && vnode_isinuse(vp, 0)) {
787 /* vnode now inuse after silly remove? */
788 unhash = 0;
789 ubc_setsize(vp, np->n_size);
790 }
791
792 lck_mtx_lock(nfs_node_hash_mutex);
793 if (unhash) {
794 /*
795 * remove nfsnode from hash now so we can't accidentally find it
796 * again if another object gets created with the same filehandle
797 * before this vnode gets reclaimed
798 */
799 if (np->n_hflag & NHHASHED) {
800 LIST_REMOVE(np, n_hash);
801 np->n_hflag &= ~NHHASHED;
802 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
803 }
804 vnode_recycle(vp);
805 }
806 /* unlock the node */
807 np->n_hflag &= ~NHLOCKED;
808 if (np->n_hflag & NHLOCKWANT) {
809 np->n_hflag &= ~NHLOCKWANT;
810 wakeup(np);
811 }
812 lck_mtx_unlock(nfs_node_hash_mutex);
813
814 /* cleanup sillyrename info */
815 if (nsp->nsr_cred != NOCRED)
816 kauth_cred_unref(&nsp->nsr_cred);
817 vnode_rele(NFSTOV(nsp->nsr_dnp));
818 FREE_ZONE(nsp, sizeof(*nsp), M_NFSREQ);
819
820 FSDBG_BOT(264, vp, np, np->n_flag, 0);
821 return (0);
822 }
823
824 /*
825 * Reclaim an nfsnode so that it can be used for other purposes.
826 */
827 int
828 nfs_vnop_reclaim(ap)
829 struct vnop_reclaim_args /* {
830 struct vnodeop_desc *a_desc;
831 vnode_t a_vp;
832 vfs_context_t a_context;
833 } */ *ap;
834 {
835 vnode_t vp = ap->a_vp;
836 nfsnode_t np = VTONFS(vp);
837 vfs_context_t ctx = ap->a_context;
838 struct nfs_open_file *nofp, *nextnofp;
839 struct nfs_file_lock *nflp, *nextnflp;
840 struct nfs_lock_owner *nlop, *nextnlop;
841 struct nfsmount *nmp = np->n_mount ? VFSTONFS(np->n_mount) : NFSTONMP(np);
842 mount_t mp = vnode_mount(vp);
843 int force;
844
845 FSDBG_TOP(265, vp, np, np->n_flag, 0);
846 force = (!mp || (mp->mnt_kern_flag & MNTK_FRCUNMOUNT));
847
848 /* There shouldn't be any open or lock state at this point */
849 lck_mtx_lock(&np->n_openlock);
850
851 if (nmp && (nmp->nm_vers >= NFS_VER4)) {
852 /* need to drop a delegation */
853 if (np->n_dreturn.tqe_next != NFSNOLIST) {
854 /* remove this node from the delegation return list */
855 lck_mtx_lock(&nmp->nm_lock);
856 if (np->n_dreturn.tqe_next != NFSNOLIST) {
857 TAILQ_REMOVE(&nmp->nm_dreturnq, np, n_dreturn);
858 np->n_dreturn.tqe_next = NFSNOLIST;
859 }
860 lck_mtx_unlock(&nmp->nm_lock);
861 }
862 if (np->n_dlink.tqe_next != NFSNOLIST) {
863 /* remove this node from the delegation list */
864 lck_mtx_lock(&nmp->nm_lock);
865 if (np->n_dlink.tqe_next != NFSNOLIST) {
866 TAILQ_REMOVE(&nmp->nm_delegations, np, n_dlink);
867 np->n_dlink.tqe_next = NFSNOLIST;
868 }
869 lck_mtx_unlock(&nmp->nm_lock);
870 }
871 if ((np->n_openflags & N_DELEG_MASK) && !force) {
872 /* try to return the delegation */
873 np->n_openflags &= ~N_DELEG_MASK;
874 nfs4_delegreturn_rpc(nmp, np->n_fhp, np->n_fhsize, &np->n_dstateid,
875 R_RECOVER, vfs_context_thread(ctx), vfs_context_ucred(ctx));
876 }
877 if (np->n_attrdirfh) {
878 FREE(np->n_attrdirfh, M_TEMP);
879 np->n_attrdirfh = NULL;
880 }
881 }
882
883 /* clean up file locks */
884 TAILQ_FOREACH_SAFE(nflp, &np->n_locks, nfl_link, nextnflp) {
885 if (!(nflp->nfl_flags & NFS_FILE_LOCK_DEAD) && !force) {
886 NP(np, "nfs_vnop_reclaim: lock 0x%llx 0x%llx 0x%x (bc %d)",
887 nflp->nfl_start, nflp->nfl_end, nflp->nfl_flags, nflp->nfl_blockcnt);
888 }
889 if (!(nflp->nfl_flags & (NFS_FILE_LOCK_BLOCKED|NFS_FILE_LOCK_DEAD))) {
890 /* try sending an unlock RPC if it wasn't delegated */
891 if (!(nflp->nfl_flags & NFS_FILE_LOCK_DELEGATED) && !force)
892 nmp->nm_funcs->nf_unlock_rpc(np, nflp->nfl_owner, F_WRLCK, nflp->nfl_start, nflp->nfl_end, R_RECOVER,
893 NULL, nflp->nfl_owner->nlo_open_owner->noo_cred);
894 lck_mtx_lock(&nflp->nfl_owner->nlo_lock);
895 TAILQ_REMOVE(&nflp->nfl_owner->nlo_locks, nflp, nfl_lolink);
896 lck_mtx_unlock(&nflp->nfl_owner->nlo_lock);
897 }
898 TAILQ_REMOVE(&np->n_locks, nflp, nfl_link);
899 nfs_file_lock_destroy(nflp);
900 }
901 /* clean up lock owners */
902 TAILQ_FOREACH_SAFE(nlop, &np->n_lock_owners, nlo_link, nextnlop) {
903 if (!TAILQ_EMPTY(&nlop->nlo_locks) && !force)
904 NP(np, "nfs_vnop_reclaim: lock owner with locks");
905 TAILQ_REMOVE(&np->n_lock_owners, nlop, nlo_link);
906 nfs_lock_owner_destroy(nlop);
907 }
908 /* clean up open state */
909 if (np->n_openrefcnt && !force)
910 NP(np, "nfs_vnop_reclaim: still open: %d", np->n_openrefcnt);
911 TAILQ_FOREACH_SAFE(nofp, &np->n_opens, nof_link, nextnofp) {
912 if (nofp->nof_flags & NFS_OPEN_FILE_BUSY)
913 NP(np, "nfs_vnop_reclaim: open file busy");
914 if (!(np->n_flag & NREVOKE) && !(nofp->nof_flags & NFS_OPEN_FILE_LOST)) {
915 if (nofp->nof_opencnt && !force)
916 NP(np, "nfs_vnop_reclaim: file still open: %d", nofp->nof_opencnt);
917 if (!force && (nofp->nof_access || nofp->nof_deny ||
918 nofp->nof_mmap_access || nofp->nof_mmap_deny ||
919 nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
920 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
921 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw ||
922 nofp->nof_d_r || nofp->nof_d_w || nofp->nof_d_rw ||
923 nofp->nof_d_r_dw || nofp->nof_d_w_dw || nofp->nof_d_rw_dw ||
924 nofp->nof_d_r_drw || nofp->nof_d_w_drw || nofp->nof_d_rw_drw)) {
925 NP(np, "nfs_vnop_reclaim: non-zero access: %d %d %d %d # %u.%u %u.%u %u.%u dw %u.%u %u.%u %u.%u drw %u.%u %u.%u %u.%u",
926 nofp->nof_access, nofp->nof_deny,
927 nofp->nof_mmap_access, nofp->nof_mmap_deny,
928 nofp->nof_r, nofp->nof_d_r,
929 nofp->nof_w, nofp->nof_d_w,
930 nofp->nof_rw, nofp->nof_d_rw,
931 nofp->nof_r_dw, nofp->nof_d_r_dw,
932 nofp->nof_w_dw, nofp->nof_d_w_dw,
933 nofp->nof_rw_dw, nofp->nof_d_rw_dw,
934 nofp->nof_r_drw, nofp->nof_d_r_drw,
935 nofp->nof_w_drw, nofp->nof_d_w_drw,
936 nofp->nof_rw_drw, nofp->nof_d_rw_drw);
937 /* try sending a close RPC if it wasn't delegated */
938 if (nofp->nof_r || nofp->nof_w || nofp->nof_rw ||
939 nofp->nof_r_dw || nofp->nof_w_dw || nofp->nof_rw_dw ||
940 nofp->nof_r_drw || nofp->nof_w_drw || nofp->nof_rw_drw)
941 nfs4_close_rpc(np, nofp, NULL, nofp->nof_owner->noo_cred, R_RECOVER);
942 }
943 }
944 TAILQ_REMOVE(&np->n_opens, nofp, nof_link);
945 nfs_open_file_destroy(nofp);
946 }
947 lck_mtx_unlock(&np->n_openlock);
948
949 if (np->n_monlink.le_next != NFSNOLIST) {
950 /* Wait for any in-progress getattr to complete, */
951 /* then remove this node from the monitored node list. */
952 lck_mtx_lock(&nmp->nm_lock);
953 while (np->n_mflag & NMMONSCANINPROG) {
954 struct timespec ts = { 1, 0 };
955 np->n_mflag |= NMMONSCANWANT;
956 msleep(&np->n_mflag, &nmp->nm_lock, PZERO-1, "nfswaitmonscan", &ts);
957 }
958 if (np->n_monlink.le_next != NFSNOLIST) {
959 LIST_REMOVE(np, n_monlink);
960 np->n_monlink.le_next = NFSNOLIST;
961 }
962 lck_mtx_unlock(&nmp->nm_lock);
963 }
964
965 lck_mtx_lock(nfs_buf_mutex);
966 if (!force && (!LIST_EMPTY(&np->n_dirtyblkhd) || !LIST_EMPTY(&np->n_cleanblkhd)))
967 NP(np, "nfs_reclaim: dropping %s buffers", (!LIST_EMPTY(&np->n_dirtyblkhd) ? "dirty" : "clean"));
968 lck_mtx_unlock(nfs_buf_mutex);
969 nfs_vinvalbuf(vp, V_IGNORE_WRITEERR, ap->a_context, 0);
970
971 lck_mtx_lock(nfs_node_hash_mutex);
972
973 if ((vnode_vtype(vp) != VDIR) && np->n_sillyrename) {
974 if (!force)
975 NP(np, "nfs_reclaim: leaving unlinked file %s", np->n_sillyrename->nsr_name);
976 if (np->n_sillyrename->nsr_cred != NOCRED)
977 kauth_cred_unref(&np->n_sillyrename->nsr_cred);
978 vnode_rele(NFSTOV(np->n_sillyrename->nsr_dnp));
979 FREE_ZONE(np->n_sillyrename, sizeof(*np->n_sillyrename), M_NFSREQ);
980 }
981
982 vnode_removefsref(vp);
983
984 if (np->n_hflag & NHHASHED) {
985 LIST_REMOVE(np, n_hash);
986 np->n_hflag &= ~NHHASHED;
987 FSDBG(266, 0, np, np->n_flag, 0xb1eb1e);
988 }
989 lck_mtx_unlock(nfs_node_hash_mutex);
990
991 /*
992 * Free up any directory cookie structures and large file handle
993 * structures that might be associated with this nfs node.
994 */
995 nfs_node_lock_force(np);
996 if ((vnode_vtype(vp) == VDIR) && np->n_cookiecache)
997 FREE_ZONE(np->n_cookiecache, sizeof(struct nfsdmap), M_NFSDIROFF);
998 if (np->n_fhsize > NFS_SMALLFH)
999 FREE_ZONE(np->n_fhp, np->n_fhsize, M_NFSBIGFH);
1000 if (np->n_vattr.nva_acl)
1001 kauth_acl_free(np->n_vattr.nva_acl);
1002 nfs_node_unlock(np);
1003 vnode_clearfsnode(vp);
1004
1005 if (np->n_parent) {
1006 if (!vnode_get(np->n_parent)) {
1007 vnode_rele(np->n_parent);
1008 vnode_put(np->n_parent);
1009 }
1010 np->n_parent = NULL;
1011 }
1012
1013 lck_mtx_destroy(&np->n_lock, nfs_node_lck_grp);
1014 lck_rw_destroy(&np->n_datalock, nfs_data_lck_grp);
1015 lck_mtx_destroy(&np->n_openlock, nfs_open_grp);
1016
1017 FSDBG_BOT(265, vp, np, np->n_flag, 0xd1ed1e);
1018 FREE_ZONE(np, sizeof(struct nfsnode), M_NFSNODE);
1019 return (0);
1020 }
1021
1022 /*
1023 * Acquire an NFS node lock
1024 */
1025
1026 int
1027 nfs_node_lock_internal(nfsnode_t np, int force)
1028 {
1029 FSDBG_TOP(268, np, force, 0, 0);
1030 lck_mtx_lock(&np->n_lock);
1031 if (!force && !(np->n_hflag && NHHASHED)) {
1032 FSDBG_BOT(268, np, 0xdead, 0, 0);
1033 lck_mtx_unlock(&np->n_lock);
1034 return (ENOENT);
1035 }
1036 FSDBG_BOT(268, np, force, 0, 0);
1037 return (0);
1038 }
1039
1040 int
1041 nfs_node_lock(nfsnode_t np)
1042 {
1043 return nfs_node_lock_internal(np, 0);
1044 }
1045
1046 void
1047 nfs_node_lock_force(nfsnode_t np)
1048 {
1049 nfs_node_lock_internal(np, 1);
1050 }
1051
1052 /*
1053 * Release an NFS node lock
1054 */
1055 void
1056 nfs_node_unlock(nfsnode_t np)
1057 {
1058 FSDBG(269, np, current_thread(), 0, 0);
1059 lck_mtx_unlock(&np->n_lock);
1060 }
1061
1062 /*
1063 * Acquire 2 NFS node locks
1064 * - locks taken in reverse address order
1065 * - both or neither of the locks are taken
1066 * - only one lock taken per node (dup nodes are skipped)
1067 */
1068 int
1069 nfs_node_lock2(nfsnode_t np1, nfsnode_t np2)
1070 {
1071 nfsnode_t first, second;
1072 int error;
1073
1074 first = (np1 > np2) ? np1 : np2;
1075 second = (np1 > np2) ? np2 : np1;
1076 if ((error = nfs_node_lock(first)))
1077 return (error);
1078 if (np1 == np2)
1079 return (error);
1080 if ((error = nfs_node_lock(second)))
1081 nfs_node_unlock(first);
1082 return (error);
1083 }
1084
1085 void
1086 nfs_node_unlock2(nfsnode_t np1, nfsnode_t np2)
1087 {
1088 nfs_node_unlock(np1);
1089 if (np1 != np2)
1090 nfs_node_unlock(np2);
1091 }
1092
1093 /*
1094 * Manage NFS node busy state.
1095 * (Similar to NFS node locks above)
1096 */
1097 int
1098 nfs_node_set_busy(nfsnode_t np, thread_t thd)
1099 {
1100 struct timespec ts = { 2, 0 };
1101 int error;
1102
1103 if ((error = nfs_node_lock(np)))
1104 return (error);
1105 while (ISSET(np->n_flag, NBUSY)) {
1106 SET(np->n_flag, NBUSYWANT);
1107 msleep(np, &np->n_lock, PZERO-1, "nfsbusywant", &ts);
1108 if ((error = nfs_sigintr(NFSTONMP(np), NULL, thd, 0)))
1109 break;
1110 }
1111 if (!error)
1112 SET(np->n_flag, NBUSY);
1113 nfs_node_unlock(np);
1114 return (error);
1115 }
1116
1117 void
1118 nfs_node_clear_busy(nfsnode_t np)
1119 {
1120 int wanted;
1121
1122 nfs_node_lock_force(np);
1123 wanted = ISSET(np->n_flag, NBUSYWANT);
1124 CLR(np->n_flag, NBUSY|NBUSYWANT);
1125 nfs_node_unlock(np);
1126 if (wanted)
1127 wakeup(np);
1128 }
1129
1130 int
1131 nfs_node_set_busy2(nfsnode_t np1, nfsnode_t np2, thread_t thd)
1132 {
1133 nfsnode_t first, second;
1134 int error;
1135
1136 first = (np1 > np2) ? np1 : np2;
1137 second = (np1 > np2) ? np2 : np1;
1138 if ((error = nfs_node_set_busy(first, thd)))
1139 return (error);
1140 if (np1 == np2)
1141 return (error);
1142 if ((error = nfs_node_set_busy(second, thd)))
1143 nfs_node_clear_busy(first);
1144 return (error);
1145 }
1146
1147 void
1148 nfs_node_clear_busy2(nfsnode_t np1, nfsnode_t np2)
1149 {
1150 nfs_node_clear_busy(np1);
1151 if (np1 != np2)
1152 nfs_node_clear_busy(np2);
1153 }
1154
1155 /* helper function to sort four nodes in reverse address order (no dupes) */
1156 static void
1157 nfs_node_sort4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4, nfsnode_t *list, int *lcntp)
1158 {
1159 nfsnode_t na[2], nb[2];
1160 int a, b, i, lcnt;
1161
1162 /* sort pairs then merge */
1163 na[0] = (np1 > np2) ? np1 : np2;
1164 na[1] = (np1 > np2) ? np2 : np1;
1165 nb[0] = (np3 > np4) ? np3 : np4;
1166 nb[1] = (np3 > np4) ? np4 : np3;
1167 for (a = b = i = lcnt = 0; i < 4; i++) {
1168 if (a >= 2)
1169 list[lcnt] = nb[b++];
1170 else if ((b >= 2) || (na[a] >= nb[b]))
1171 list[lcnt] = na[a++];
1172 else
1173 list[lcnt] = nb[b++];
1174 if ((lcnt <= 0) || (list[lcnt] != list[lcnt-1]))
1175 lcnt++; /* omit dups */
1176 }
1177 if (list[lcnt-1] == NULL)
1178 lcnt--;
1179 *lcntp = lcnt;
1180 }
1181
1182 int
1183 nfs_node_set_busy4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4, thread_t thd)
1184 {
1185 nfsnode_t list[4];
1186 int i, lcnt, error;
1187
1188 nfs_node_sort4(np1, np2, np3, np4, list, &lcnt);
1189
1190 /* Now we can lock using list[0 - lcnt-1] */
1191 for (i = 0; i < lcnt; ++i)
1192 if ((error = nfs_node_set_busy(list[i], thd))) {
1193 /* Drop any locks we acquired. */
1194 while (--i >= 0)
1195 nfs_node_clear_busy(list[i]);
1196 return (error);
1197 }
1198 return (0);
1199 }
1200
1201 void
1202 nfs_node_clear_busy4(nfsnode_t np1, nfsnode_t np2, nfsnode_t np3, nfsnode_t np4)
1203 {
1204 nfsnode_t list[4];
1205 int lcnt;
1206
1207 nfs_node_sort4(np1, np2, np3, np4, list, &lcnt);
1208 while (--lcnt >= 0)
1209 nfs_node_clear_busy(list[lcnt]);
1210 }
1211
1212 /*
1213 * Acquire an NFS node data lock
1214 */
1215 void
1216 nfs_data_lock(nfsnode_t np, int locktype)
1217 {
1218 nfs_data_lock_internal(np, locktype, 1);
1219 }
1220 void
1221 nfs_data_lock_noupdate(nfsnode_t np, int locktype)
1222 {
1223 nfs_data_lock_internal(np, locktype, 0);
1224 }
1225 void
1226 nfs_data_lock_internal(nfsnode_t np, int locktype, int updatesize)
1227 {
1228 FSDBG_TOP(270, np, locktype, np->n_datalockowner, 0);
1229 if (locktype == NFS_DATA_LOCK_SHARED) {
1230 if (updatesize && ISSET(np->n_flag, NUPDATESIZE))
1231 nfs_data_update_size(np, 0);
1232 lck_rw_lock_shared(&np->n_datalock);
1233 } else {
1234 lck_rw_lock_exclusive(&np->n_datalock);
1235 np->n_datalockowner = current_thread();
1236 if (updatesize && ISSET(np->n_flag, NUPDATESIZE))
1237 nfs_data_update_size(np, 1);
1238 }
1239 FSDBG_BOT(270, np, locktype, np->n_datalockowner, 0);
1240 }
1241
1242 /*
1243 * Release an NFS node data lock
1244 */
1245 void
1246 nfs_data_unlock(nfsnode_t np)
1247 {
1248 nfs_data_unlock_internal(np, 1);
1249 }
1250 void
1251 nfs_data_unlock_noupdate(nfsnode_t np)
1252 {
1253 nfs_data_unlock_internal(np, 0);
1254 }
1255 void
1256 nfs_data_unlock_internal(nfsnode_t np, int updatesize)
1257 {
1258 int mine = (np->n_datalockowner == current_thread());
1259 FSDBG_TOP(271, np, np->n_datalockowner, current_thread(), 0);
1260 if (updatesize && mine && ISSET(np->n_flag, NUPDATESIZE))
1261 nfs_data_update_size(np, 1);
1262 np->n_datalockowner = NULL;
1263 lck_rw_done(&np->n_datalock);
1264 if (updatesize && !mine && ISSET(np->n_flag, NUPDATESIZE))
1265 nfs_data_update_size(np, 0);
1266 FSDBG_BOT(271, np, np->n_datalockowner, current_thread(), 0);
1267 }
1268
1269
1270 /*
1271 * update an NFS node's size
1272 */
1273 void
1274 nfs_data_update_size(nfsnode_t np, int datalocked)
1275 {
1276 int error;
1277
1278 FSDBG_TOP(272, np, np->n_flag, np->n_size, np->n_newsize);
1279 if (!datalocked) {
1280 nfs_data_lock(np, NFS_DATA_LOCK_EXCLUSIVE);
1281 /* grabbing data lock will automatically update size */
1282 nfs_data_unlock(np);
1283 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1284 return;
1285 }
1286 error = nfs_node_lock(np);
1287 if (error || !ISSET(np->n_flag, NUPDATESIZE)) {
1288 if (!error)
1289 nfs_node_unlock(np);
1290 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1291 return;
1292 }
1293 CLR(np->n_flag, NUPDATESIZE);
1294 np->n_size = np->n_newsize;
1295 /* make sure we invalidate buffers the next chance we get */
1296 SET(np->n_flag, NNEEDINVALIDATE);
1297 nfs_node_unlock(np);
1298 ubc_setsize(NFSTOV(np), (off_t)np->n_size); /* XXX error? */
1299 FSDBG_BOT(272, np, np->n_flag, np->n_size, np->n_newsize);
1300 }
1301
1302 #define DODEBUG 1
1303 int
1304 nfs_mount_is_dirty(mount_t mp)
1305 {
1306 u_long i;
1307 nfsnode_t np;
1308 #ifdef DODEBUG
1309 struct timeval now, then, diff;
1310 u_long ncnt = 0;
1311 microuptime(&now);
1312 #endif
1313 lck_mtx_lock(nfs_node_hash_mutex);
1314 for (i = 0; i <= nfsnodehash; i++) {
1315 LIST_FOREACH(np, &nfsnodehashtbl[i], n_hash) {
1316 #ifdef DODEBUG
1317 ncnt++;
1318 #endif
1319 if (np->n_mount == mp && !LIST_EMPTY(&np->n_dirtyblkhd))
1320 goto out;
1321 }
1322 }
1323 out:
1324 lck_mtx_unlock(nfs_node_hash_mutex);
1325 #ifdef DODEBUG
1326 microuptime(&then);
1327 timersub(&then, &now, &diff);
1328
1329 printf("nfs_mount_is_dirty took %lld mics for %ld slots and %ld nodes return %d\n",
1330 (uint64_t)diff.tv_sec * 1000000LL + diff.tv_usec, i, ncnt, (i <= nfsnodehash));
1331 #endif
1332
1333 return (i <= nfsnodehash);
1334 }