2 * Copyright (c) 2000-2010 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
30 * Copyright (c) 1989, 1993
31 * The Regents of the University of California. All rights reserved.
33 * This code is derived from software contributed to Berkeley by
34 * Rick Macklem at The University of Guelph.
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
64 * @(#)nfs_srvcache.c 8.3 (Berkeley) 3/30/95
65 * FreeBSD-Id: nfs_srvcache.c,v 1.15 1997/10/12 20:25:46 phk Exp $
68 #include <nfs/nfs_conf.h>
72 * Reference: Chet Juszczak, "Improving the Performance and Correctness
73 * of an NFS Server", in Proc. Winter 1989 USENIX Conference,
74 * pages 53-63. San Diego, February 1989.
76 #include <sys/param.h>
77 #include <sys/vnode.h>
78 #include <sys/mount_internal.h>
79 #include <sys/kernel.h>
80 #include <sys/systm.h>
82 #include <sys/kpi_mbuf.h>
83 #include <sys/malloc.h>
84 #include <sys/socket.h>
85 #include <libkern/OSAtomic.h>
87 #include <netinet/in.h>
88 #include <nfs/rpcv2.h>
89 #include <nfs/nfsproto.h>
91 #include <nfs/nfsrvcache.h>
/*
 * File-scope state for the NFS server request (duplicate) cache.
 */

/*
 * Defined elsewhere.  In this file it is indexed by nd->nd_procnum and the
 * result is used as an index into nfsv2_repstat[].
 */
93 extern int nfsv2_procid
[NFS_NPROCS
];
/*
 * Number of cache entries allocated so far.  It is incremented when a new
 * entry is allocated, compared against nfsrv_reqcache_size before
 * allocating, and reset to 0 by nfsrv_cleancache().
 */
94 static int nfsrv_reqcache_count
;
/*
 * Upper bound on the number of cache entries; also the size argument
 * passed to hashinit() in nfsrv_initcache().
 */
95 int nfsrv_reqcache_size
= NFSRVCACHESIZ
;
/*
 * Yield the address of the hash bucket for a transaction id: the xid is
 * added to its own top bits (xid >> 24) and the sum is masked with
 * nfsrv_reqcache_hash to index nfsrv_reqcache_hashtbl.
 */
97 #define NFSRCHASH(xid) \
98 (&nfsrv_reqcache_hashtbl[((xid) + ((xid) >> 24)) & nfsrv_reqcache_hash])
/* Hash bucket array; assigned from hashinit() in nfsrv_initcache(). */
99 LIST_HEAD(nfsrv_reqcache_hash
, nfsrvcache
) * nfsrv_reqcache_hashtbl
;
/*
 * LRU queue of cache entries: entries are (re)inserted at the tail and
 * the head entry is the one picked for reuse.
 */
100 TAILQ_HEAD(nfsrv_reqcache_lru
, nfsrvcache
) nfsrv_reqcache_lruhead
;
/*
 * Mask applied by NFSRCHASH.  Its address is handed to hashinit();
 * presumably hashinit() stores the table mask here -- TODO confirm.
 */
101 u_long nfsrv_reqcache_hash
;
/* Lock group used when declaring nfsrv_reqcache_mutex below. */
103 static LCK_GRP_DECLARE(nfsrv_reqcache_lck_grp
, "nfsrv_reqcache");
/*
 * Mutex taken around hash table and LRU queue manipulation by the
 * functions in this file; also the mutex passed to msleep() while
 * waiting on an RC_LOCKED entry.
 */
104 LCK_MTX_DECLARE(nfsrv_reqcache_mutex
, &nfsrv_reqcache_lck_grp
);
107 * Static array that defines which nfs rpc's are nonidempotent
109 static int nonidempotent
[NFS_NPROCS
] = {
135 /* True iff the rpc reply is an nfs status ONLY! */
136 static int nfsv2_repstat
[NFS_NPROCS
] = {
158 * Initialize the server request cache list
161 nfsrv_initcache(void)
163 if (nfsrv_reqcache_size
<= 0) {
167 lck_mtx_lock(&nfsrv_reqcache_mutex
);
168 /* init nfs server request cache hash table */
169 nfsrv_reqcache_hashtbl
= hashinit(nfsrv_reqcache_size
, M_NFSD
, &nfsrv_reqcache_hash
);
170 TAILQ_INIT(&nfsrv_reqcache_lruhead
);
171 lck_mtx_unlock(&nfsrv_reqcache_mutex
);
175 * This function compares two net addresses by family and returns TRUE
176 * if they are the same host.
177 * If there is any doubt, return FALSE.
178 * The AF_INET family is handled as a special case so that address mbufs
179 * don't need to be saved to store "struct in_addr", which is only 4 bytes.
180 * Ditto for AF_INET6 which is only 16 bytes.
185 union nethostaddr
*haddr
,
188 struct sockaddr_in
*inetaddr
;
189 struct sockaddr_in6
*inet6addr
;
193 inetaddr
= mbuf_data(nam
);
194 if ((inetaddr
->sin_family
== AF_INET
) &&
195 (inetaddr
->sin_addr
.s_addr
== haddr
->had_inetaddr
)) {
200 inet6addr
= mbuf_data(nam
);
201 if ((inet6addr
->sin6_family
== AF_INET6
) &&
202 !bcmp(&inet6addr
->sin6_addr
, &haddr
->had_inet6addr
, sizeof(inet6addr
->sin6_addr
))) {
211 * Look for the request in the cache
213 * return action and optionally reply
215 * insert it in the cache
217 * The rules are as follows:
218 * - if in progress, return DROP request
219 * - if completed within DELAY of the current time, return DROP it
220 * - if completed a longer time ago return REPLY if the reply was cached or
222 * Update/add new request at end of lru list
226 struct nfsrv_descript
*nd
,
227 struct nfsrv_sock
*slp
,
230 struct nfsrvcache
*rp
;
231 struct nfsm_chain nmrep
;
232 struct sockaddr
*saddr
;
236 * Don't cache recent requests for reliable transport protocols.
237 * (Maybe we should for the case of a reconnect, but..)
242 lck_mtx_lock(&nfsrv_reqcache_mutex
);
244 for (rp
= NFSRCHASH(nd
->nd_retxid
)->lh_first
; rp
!= 0;
245 rp
= rp
->rc_hash
.le_next
) {
246 if (nd
->nd_retxid
== rp
->rc_xid
&& nd
->nd_procnum
== rp
->rc_proc
&&
247 netaddr_match(rp
->rc_family
, &rp
->rc_haddr
, nd
->nd_nam
)) {
248 if ((rp
->rc_flag
& RC_LOCKED
) != 0) {
249 rp
->rc_flag
|= RC_WANTED
;
250 msleep(rp
, &nfsrv_reqcache_mutex
, PZERO
- 1, "nfsrc", NULL
);
253 rp
->rc_flag
|= RC_LOCKED
;
254 /* If not at end of LRU chain, move it there */
255 if (rp
->rc_lru
.tqe_next
) {
256 TAILQ_REMOVE(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
257 TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
259 if (rp
->rc_state
== RC_UNUSED
) {
260 panic("nfsrv cache");
262 if (rp
->rc_state
== RC_INPROG
) {
263 OSAddAtomic64(1, &nfsstats
.srvcache_inproghits
);
265 } else if (rp
->rc_flag
& RC_REPSTATUS
) {
266 OSAddAtomic64(1, &nfsstats
.srvcache_nonidemdonehits
);
267 nd
->nd_repstat
= rp
->rc_status
;
268 error
= nfsrv_rephead(nd
, slp
, &nmrep
, 0);
270 printf("nfsrv cache: reply alloc failed for nonidem request hit\n");
275 *mrepp
= nmrep
.nmc_mhead
;
277 } else if (rp
->rc_flag
& RC_REPMBUF
) {
278 OSAddAtomic64(1, &nfsstats
.srvcache_nonidemdonehits
);
279 error
= mbuf_copym(rp
->rc_reply
, 0, MBUF_COPYALL
, MBUF_WAITOK
, mrepp
);
281 printf("nfsrv cache: reply copym failed for nonidem request hit\n");
287 OSAddAtomic64(1, &nfsstats
.srvcache_idemdonehits
);
288 rp
->rc_state
= RC_INPROG
;
291 rp
->rc_flag
&= ~RC_LOCKED
;
292 if (rp
->rc_flag
& RC_WANTED
) {
293 rp
->rc_flag
&= ~RC_WANTED
;
296 lck_mtx_unlock(&nfsrv_reqcache_mutex
);
300 OSAddAtomic64(1, &nfsstats
.srvcache_misses
);
301 if (nfsrv_reqcache_count
< nfsrv_reqcache_size
) {
302 /* try to allocate a new entry */
303 MALLOC(rp
, struct nfsrvcache
*, sizeof *rp
, M_NFSD
, M_WAITOK
);
305 bzero((char *)rp
, sizeof *rp
);
306 nfsrv_reqcache_count
++;
307 rp
->rc_flag
= RC_LOCKED
;
313 /* try to reuse the least recently used entry */
314 rp
= nfsrv_reqcache_lruhead
.tqh_first
;
316 /* no entry to reuse? */
317 /* OK, we just won't be able to cache this request */
318 lck_mtx_unlock(&nfsrv_reqcache_mutex
);
321 while ((rp
->rc_flag
& RC_LOCKED
) != 0) {
322 rp
->rc_flag
|= RC_WANTED
;
323 msleep(rp
, &nfsrv_reqcache_mutex
, PZERO
- 1, "nfsrc", NULL
);
324 rp
= nfsrv_reqcache_lruhead
.tqh_first
;
326 rp
->rc_flag
|= RC_LOCKED
;
327 LIST_REMOVE(rp
, rc_hash
);
328 TAILQ_REMOVE(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
329 if (rp
->rc_flag
& RC_REPMBUF
) {
330 mbuf_freem(rp
->rc_reply
);
332 if (rp
->rc_flag
& RC_NAM
) {
333 mbuf_freem(rp
->rc_nam
);
335 rp
->rc_flag
&= (RC_LOCKED
| RC_WANTED
);
337 TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
338 rp
->rc_state
= RC_INPROG
;
339 rp
->rc_xid
= nd
->nd_retxid
;
340 saddr
= mbuf_data(nd
->nd_nam
);
341 rp
->rc_family
= saddr
->sa_family
;
342 switch (saddr
->sa_family
) {
344 rp
->rc_flag
|= RC_INETADDR
;
345 rp
->rc_inetaddr
= ((struct sockaddr_in
*)saddr
)->sin_addr
.s_addr
;
348 rp
->rc_flag
|= RC_INETADDR
;
349 rp
->rc_inet6addr
= ((struct sockaddr_in6
*)saddr
)->sin6_addr
;
352 error
= mbuf_copym(nd
->nd_nam
, 0, MBUF_COPYALL
, MBUF_WAITOK
, &rp
->rc_nam
);
354 printf("nfsrv cache: nam copym failed\n");
356 rp
->rc_flag
|= RC_NAM
;
361 rp
->rc_proc
= nd
->nd_procnum
;
362 LIST_INSERT_HEAD(NFSRCHASH(nd
->nd_retxid
), rp
, rc_hash
);
363 rp
->rc_flag
&= ~RC_LOCKED
;
364 if (rp
->rc_flag
& RC_WANTED
) {
365 rp
->rc_flag
&= ~RC_WANTED
;
368 lck_mtx_unlock(&nfsrv_reqcache_mutex
);
373 * Update a request cache entry after the rpc has been done
377 struct nfsrv_descript
*nd
,
381 struct nfsrvcache
*rp
;
387 lck_mtx_lock(&nfsrv_reqcache_mutex
);
389 for (rp
= NFSRCHASH(nd
->nd_retxid
)->lh_first
; rp
!= 0;
390 rp
= rp
->rc_hash
.le_next
) {
391 if (nd
->nd_retxid
== rp
->rc_xid
&& nd
->nd_procnum
== rp
->rc_proc
&&
392 netaddr_match(rp
->rc_family
, &rp
->rc_haddr
, nd
->nd_nam
)) {
393 if ((rp
->rc_flag
& RC_LOCKED
) != 0) {
394 rp
->rc_flag
|= RC_WANTED
;
395 msleep(rp
, &nfsrv_reqcache_mutex
, PZERO
- 1, "nfsrc", NULL
);
398 rp
->rc_flag
|= RC_LOCKED
;
399 if (rp
->rc_state
== RC_DONE
) {
401 * This can occur if the cache is too small.
402 * Retransmits of the same request aren't
403 * dropped so we may see the operation
404 * complete more than once.
406 if (rp
->rc_flag
& RC_REPMBUF
) {
407 mbuf_freem(rp
->rc_reply
);
408 rp
->rc_flag
&= ~RC_REPMBUF
;
411 rp
->rc_state
= RC_DONE
;
413 * If we have a valid reply update status and save
414 * the reply for non-idempotent rpc's.
416 if (repvalid
&& nonidempotent
[nd
->nd_procnum
]) {
417 if ((nd
->nd_vers
== NFS_VER2
) &&
418 nfsv2_repstat
[nfsv2_procid
[nd
->nd_procnum
]]) {
419 rp
->rc_status
= nd
->nd_repstat
;
420 rp
->rc_flag
|= RC_REPSTATUS
;
422 error
= mbuf_copym(repmbuf
, 0, MBUF_COPYALL
, MBUF_WAITOK
, &rp
->rc_reply
);
424 rp
->rc_flag
|= RC_REPMBUF
;
428 rp
->rc_flag
&= ~RC_LOCKED
;
429 if (rp
->rc_flag
& RC_WANTED
) {
430 rp
->rc_flag
&= ~RC_WANTED
;
433 lck_mtx_unlock(&nfsrv_reqcache_mutex
);
437 lck_mtx_unlock(&nfsrv_reqcache_mutex
);
441 * Clean out the cache. Called when the last nfsd terminates.
444 nfsrv_cleancache(void)
446 struct nfsrvcache
*rp
, *nextrp
;
448 lck_mtx_lock(&nfsrv_reqcache_mutex
);
449 for (rp
= nfsrv_reqcache_lruhead
.tqh_first
; rp
!= 0; rp
= nextrp
) {
450 nextrp
= rp
->rc_lru
.tqe_next
;
451 LIST_REMOVE(rp
, rc_hash
);
452 TAILQ_REMOVE(&nfsrv_reqcache_lruhead
, rp
, rc_lru
);
455 nfsrv_reqcache_count
= 0;
456 FREE(nfsrv_reqcache_hashtbl
, M_TEMP
);
457 lck_mtx_unlock(&nfsrv_reqcache_mutex
);
460 #endif /* CONFIG_NFS_SERVER */