2 * Copyright (c) 2000-2010 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
30 * Copyright (c) 1989, 1993
31 * The Regents of the University of California. All rights reserved.
33 * This code is derived from software contributed to Berkeley by
34 * Rick Macklem at The University of Guelph.
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
64 * @(#)nfs_srvcache.c 8.3 (Berkeley) 3/30/95
65 * FreeBSD-Id: nfs_srvcache.c,v 1.15 1997/10/12 20:25:46 phk Exp $
70 * Reference: Chet Juszczak, "Improving the Performance and Correctness
71 * of an NFS Server", in Proc. Winter 1989 USENIX Conference,
72 * pages 53-63. San Diego, February 1989.
74 #include <sys/param.h>
75 #include <sys/vnode.h>
76 #include <sys/mount_internal.h>
77 #include <sys/kernel.h>
78 #include <sys/systm.h>
80 #include <sys/kpi_mbuf.h>
81 #include <sys/malloc.h>
82 #include <sys/socket.h>
83 #include <libkern/OSAtomic.h>
85 #include <netinet/in.h>
86 #include <nfs/rpcv2.h>
87 #include <nfs/nfsproto.h>
89 #include <nfs/nfsrvcache.h>
91 extern int nfsv2_procid
[NFS_NPROCS
];
92 static int nfsrv_reqcache_count
;
93 int nfsrv_reqcache_size
= NFSRVCACHESIZ
;
95 #define NFSRCHASH(xid) \
96 (&nfsrv_reqcache_hashtbl[((xid) + ((xid) >> 24)) & nfsrv_reqcache_hash])
97 LIST_HEAD(nfsrv_reqcache_hash
, nfsrvcache
) *nfsrv_reqcache_hashtbl
;
98 TAILQ_HEAD(nfsrv_reqcache_lru
, nfsrvcache
) nfsrv_reqcache_lruhead
;
99 u_long nfsrv_reqcache_hash
;
101 lck_grp_t
*nfsrv_reqcache_lck_grp
;
102 lck_mtx_t
*nfsrv_reqcache_mutex
;
105 * Static array that defines which nfs rpc's are nonidempotent
107 static int nonidempotent
[NFS_NPROCS
] = {
133 /* True iff the rpc reply is an nfs status ONLY! */
134 static int nfsv2_repstat
[NFS_NPROCS
] = {
156 * Initialize the server request cache list
159 nfsrv_initcache(void)
161 if (nfsrv_reqcache_size
<= 0)
164 lck_mtx_lock(nfsrv_reqcache_mutex
);
165 /* init nfs server request cache hash table */
166 nfsrv_reqcache_hashtbl
= hashinit(nfsrv_reqcache_size
, M_NFSD
, &nfsrv_reqcache_hash
);
167 TAILQ_INIT(&nfsrv_reqcache_lruhead
);
168 lck_mtx_unlock(nfsrv_reqcache_mutex
);
172 * This function compares two net addresses by family and returns TRUE
173 * if they are the same host.
174 * If there is any doubt, return FALSE.
175 * The AF_INET family is handled as a special case so that address mbufs
176 * don't need to be saved to store "struct in_addr", which is only 4 bytes.
177 * Ditto for AF_INET6 which is only 16 bytes.
182 union nethostaddr
*haddr
,
185 struct sockaddr_in
*inetaddr
;
186 struct sockaddr_in6
*inet6addr
;
190 inetaddr
= mbuf_data(nam
);
191 if ((inetaddr
->sin_family
== AF_INET
) &&
192 (inetaddr
->sin_addr
.s_addr
== haddr
->had_inetaddr
))
196 inet6addr
= mbuf_data(nam
);
197 if ((inet6addr
->sin6_family
== AF_INET6
) &&
198 !bcmp(&inet6addr
->sin6_addr
, &haddr
->had_inet6addr
, sizeof(inet6addr
->sin6_addr
)))
206 * Look for the request in the cache
208 * return action and optionally reply
210 * insert it in the cache
212 * The rules are as follows:
213 * - if in progress, return DROP request
214 * - if completed within DELAY of the current time, return DROP it
215 * - if completed a longer time ago return REPLY if the reply was cached or
217 * Update/add new request at end of lru list
221 struct nfsrv_descript
*nd
,
222 struct nfsrv_sock
*slp
,
225 struct nfsrvcache
*rp
;
226 struct nfsm_chain nmrep
;
227 struct sockaddr
*saddr
;
231 * Don't cache recent requests for reliable transport protocols.
232 * (Maybe we should for the case of a reconnect, but..)
236 lck_mtx_lock(nfsrv_reqcache_mutex
);
238 for (rp
= NFSRCHASH(nd
->nd_retxid
)->lh_first
; rp
!= 0;
239 rp
= rp
->rc_hash
.le_next
) {
240 if (nd
->nd_retxid
== rp
->rc_xid
&& nd
->nd_procnum
== rp
->rc_proc
&&
241 netaddr_match(rp
->rc_family
, &rp
->rc_haddr
, nd
->nd_nam
)) {
242 if ((rp
->rc_flag
& RC_LOCKED
) != 0) {
243 rp
->rc_flag
|= RC_WANTED
;
244 msleep(rp
, nfsrv_reqcache_mutex
, PZERO
-1, "nfsrc", NULL
);
247 rp
->rc_flag
|= RC_LOCKED
;
248 /* If not at end of LRU chain, move it there */
249 if (rp
->rc_lru
.tqe_next
) {
250 TAILQ_REMOVE(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
251 TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
253 if (rp
->rc_state
== RC_UNUSED
)
254 panic("nfsrv cache");
255 if (rp
->rc_state
== RC_INPROG
) {
256 OSAddAtomic64(1, &nfsstats
.srvcache_inproghits
);
258 } else if (rp
->rc_flag
& RC_REPSTATUS
) {
259 OSAddAtomic64(1, &nfsstats
.srvcache_nonidemdonehits
);
260 nd
->nd_repstat
= rp
->rc_status
;
261 error
= nfsrv_rephead(nd
, slp
, &nmrep
, 0);
263 printf("nfsrv cache: reply alloc failed for nonidem request hit\n");
268 *mrepp
= nmrep
.nmc_mhead
;
270 } else if (rp
->rc_flag
& RC_REPMBUF
) {
271 OSAddAtomic64(1, &nfsstats
.srvcache_nonidemdonehits
);
272 error
= mbuf_copym(rp
->rc_reply
, 0, MBUF_COPYALL
, MBUF_WAITOK
, mrepp
);
274 printf("nfsrv cache: reply copym failed for nonidem request hit\n");
280 OSAddAtomic64(1, &nfsstats
.srvcache_idemdonehits
);
281 rp
->rc_state
= RC_INPROG
;
284 rp
->rc_flag
&= ~RC_LOCKED
;
285 if (rp
->rc_flag
& RC_WANTED
) {
286 rp
->rc_flag
&= ~RC_WANTED
;
289 lck_mtx_unlock(nfsrv_reqcache_mutex
);
293 OSAddAtomic64(1, &nfsstats
.srvcache_misses
);
294 if (nfsrv_reqcache_count
< nfsrv_reqcache_size
) {
295 /* try to allocate a new entry */
296 MALLOC(rp
, struct nfsrvcache
*, sizeof *rp
, M_NFSD
, M_WAITOK
);
298 bzero((char *)rp
, sizeof *rp
);
299 nfsrv_reqcache_count
++;
300 rp
->rc_flag
= RC_LOCKED
;
306 /* try to reuse the least recently used entry */
307 rp
= nfsrv_reqcache_lruhead
.tqh_first
;
309 /* no entry to reuse? */
310 /* OK, we just won't be able to cache this request */
311 lck_mtx_unlock(nfsrv_reqcache_mutex
);
314 while ((rp
->rc_flag
& RC_LOCKED
) != 0) {
315 rp
->rc_flag
|= RC_WANTED
;
316 msleep(rp
, nfsrv_reqcache_mutex
, PZERO
-1, "nfsrc", NULL
);
317 rp
= nfsrv_reqcache_lruhead
.tqh_first
;
319 rp
->rc_flag
|= RC_LOCKED
;
320 LIST_REMOVE(rp
, rc_hash
);
321 TAILQ_REMOVE(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
322 if (rp
->rc_flag
& RC_REPMBUF
)
323 mbuf_freem(rp
->rc_reply
);
324 if (rp
->rc_flag
& RC_NAM
)
325 mbuf_freem(rp
->rc_nam
);
326 rp
->rc_flag
&= (RC_LOCKED
| RC_WANTED
);
328 TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
329 rp
->rc_state
= RC_INPROG
;
330 rp
->rc_xid
= nd
->nd_retxid
;
331 saddr
= mbuf_data(nd
->nd_nam
);
332 rp
->rc_family
= saddr
->sa_family
;
333 switch (saddr
->sa_family
) {
335 rp
->rc_flag
|= RC_INETADDR
;
336 rp
->rc_inetaddr
= ((struct sockaddr_in
*)saddr
)->sin_addr
.s_addr
;
339 rp
->rc_flag
|= RC_INETADDR
;
340 rp
->rc_inet6addr
= ((struct sockaddr_in6
*)saddr
)->sin6_addr
;
343 error
= mbuf_copym(nd
->nd_nam
, 0, MBUF_COPYALL
, MBUF_WAITOK
, &rp
->rc_nam
);
345 printf("nfsrv cache: nam copym failed\n");
347 rp
->rc_flag
|= RC_NAM
;
350 rp
->rc_proc
= nd
->nd_procnum
;
351 LIST_INSERT_HEAD(NFSRCHASH(nd
->nd_retxid
), rp
, rc_hash
);
352 rp
->rc_flag
&= ~RC_LOCKED
;
353 if (rp
->rc_flag
& RC_WANTED
) {
354 rp
->rc_flag
&= ~RC_WANTED
;
357 lck_mtx_unlock(nfsrv_reqcache_mutex
);
362 * Update a request cache entry after the rpc has been done
366 struct nfsrv_descript
*nd
,
370 struct nfsrvcache
*rp
;
375 lck_mtx_lock(nfsrv_reqcache_mutex
);
377 for (rp
= NFSRCHASH(nd
->nd_retxid
)->lh_first
; rp
!= 0;
378 rp
= rp
->rc_hash
.le_next
) {
379 if (nd
->nd_retxid
== rp
->rc_xid
&& nd
->nd_procnum
== rp
->rc_proc
&&
380 netaddr_match(rp
->rc_family
, &rp
->rc_haddr
, nd
->nd_nam
)) {
381 if ((rp
->rc_flag
& RC_LOCKED
) != 0) {
382 rp
->rc_flag
|= RC_WANTED
;
383 msleep(rp
, nfsrv_reqcache_mutex
, PZERO
-1, "nfsrc", NULL
);
386 rp
->rc_flag
|= RC_LOCKED
;
387 if (rp
->rc_state
== RC_DONE
) {
389 * This can occur if the cache is too small.
390 * Retransmits of the same request aren't
391 * dropped so we may see the operation
392 * complete more then once.
394 if (rp
->rc_flag
& RC_REPMBUF
) {
395 mbuf_freem(rp
->rc_reply
);
396 rp
->rc_flag
&= ~RC_REPMBUF
;
399 rp
->rc_state
= RC_DONE
;
401 * If we have a valid reply update status and save
402 * the reply for non-idempotent rpc's.
404 if (repvalid
&& nonidempotent
[nd
->nd_procnum
]) {
405 if ((nd
->nd_vers
== NFS_VER2
) &&
406 nfsv2_repstat
[nfsv2_procid
[nd
->nd_procnum
]]) {
407 rp
->rc_status
= nd
->nd_repstat
;
408 rp
->rc_flag
|= RC_REPSTATUS
;
410 error
= mbuf_copym(repmbuf
, 0, MBUF_COPYALL
, MBUF_WAITOK
, &rp
->rc_reply
);
412 rp
->rc_flag
|= RC_REPMBUF
;
415 rp
->rc_flag
&= ~RC_LOCKED
;
416 if (rp
->rc_flag
& RC_WANTED
) {
417 rp
->rc_flag
&= ~RC_WANTED
;
420 lck_mtx_unlock(nfsrv_reqcache_mutex
);
424 lck_mtx_unlock(nfsrv_reqcache_mutex
);
428 * Clean out the cache. Called when the last nfsd terminates.
431 nfsrv_cleancache(void)
433 struct nfsrvcache
*rp
, *nextrp
;
435 lck_mtx_lock(nfsrv_reqcache_mutex
);
436 for (rp
= nfsrv_reqcache_lruhead
.tqh_first
; rp
!= 0; rp
= nextrp
) {
437 nextrp
= rp
->rc_lru
.tqe_next
;
438 LIST_REMOVE(rp
, rc_hash
);
439 TAILQ_REMOVE(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
442 nfsrv_reqcache_count
= 0;
443 FREE(nfsrv_reqcache_hashtbl
, M_TEMP
);
444 lck_mtx_unlock(nfsrv_reqcache_mutex
);
447 #endif /* NFSSERVER */