]> git.saurik.com Git - apple/xnu.git/blob - bsd/nfs/nfs_srvcache.c
xnu-4570.71.2.tar.gz
[apple/xnu.git] / bsd / nfs / nfs_srvcache.c
1 /*
2 * Copyright (c) 2000-2010 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */
29 /*
30 * Copyright (c) 1989, 1993
31 * The Regents of the University of California. All rights reserved.
32 *
33 * This code is derived from software contributed to Berkeley by
34 * Rick Macklem at The University of Guelph.
35 *
36 * Redistribution and use in source and binary forms, with or without
37 * modification, are permitted provided that the following conditions
38 * are met:
39 * 1. Redistributions of source code must retain the above copyright
40 * notice, this list of conditions and the following disclaimer.
41 * 2. Redistributions in binary form must reproduce the above copyright
42 * notice, this list of conditions and the following disclaimer in the
43 * documentation and/or other materials provided with the distribution.
44 * 3. All advertising materials mentioning features or use of this software
45 * must display the following acknowledgement:
46 * This product includes software developed by the University of
47 * California, Berkeley and its contributors.
48 * 4. Neither the name of the University nor the names of its contributors
49 * may be used to endorse or promote products derived from this software
50 * without specific prior written permission.
51 *
52 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
53 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
54 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
55 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
56 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
57 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
58 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
59 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
60 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
61 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
62 * SUCH DAMAGE.
63 *
64 * @(#)nfs_srvcache.c 8.3 (Berkeley) 3/30/95
65 * FreeBSD-Id: nfs_srvcache.c,v 1.15 1997/10/12 20:25:46 phk Exp $
66 */
67
68 #if NFSSERVER
69 /*
70 * Reference: Chet Juszczak, "Improving the Performance and Correctness
71 * of an NFS Server", in Proc. Winter 1989 USENIX Conference,
72 * pages 53-63. San Diego, February 1989.
73 */
74 #include <sys/param.h>
75 #include <sys/vnode.h>
76 #include <sys/mount_internal.h>
77 #include <sys/kernel.h>
78 #include <sys/systm.h>
79 #include <sys/proc.h>
80 #include <sys/kpi_mbuf.h>
81 #include <sys/malloc.h>
82 #include <sys/socket.h>
83 #include <libkern/OSAtomic.h>
84
85 #include <netinet/in.h>
86 #include <nfs/rpcv2.h>
87 #include <nfs/nfsproto.h>
88 #include <nfs/nfs.h>
89 #include <nfs/nfsrvcache.h>
90
91 extern int nfsv2_procid[NFS_NPROCS];
92 static int nfsrv_reqcache_count;
93 int nfsrv_reqcache_size = NFSRVCACHESIZ;
94
95 #define NFSRCHASH(xid) \
96 (&nfsrv_reqcache_hashtbl[((xid) + ((xid) >> 24)) & nfsrv_reqcache_hash])
97 LIST_HEAD(nfsrv_reqcache_hash, nfsrvcache) *nfsrv_reqcache_hashtbl;
98 TAILQ_HEAD(nfsrv_reqcache_lru, nfsrvcache) nfsrv_reqcache_lruhead;
99 u_long nfsrv_reqcache_hash;
100
101 lck_grp_t *nfsrv_reqcache_lck_grp;
102 lck_mtx_t *nfsrv_reqcache_mutex;
103
104 /*
105 * Static array that defines which nfs rpc's are nonidempotent
106 */
107 static int nonidempotent[NFS_NPROCS] = {
108 FALSE,
109 FALSE,
110 TRUE,
111 FALSE,
112 FALSE,
113 FALSE,
114 FALSE,
115 TRUE,
116 TRUE,
117 TRUE,
118 TRUE,
119 TRUE,
120 TRUE,
121 TRUE,
122 TRUE,
123 TRUE,
124 FALSE,
125 FALSE,
126 FALSE,
127 FALSE,
128 FALSE,
129 FALSE,
130 FALSE,
131 };
132
133 /* True iff the rpc reply is an nfs status ONLY! */
134 static int nfsv2_repstat[NFS_NPROCS] = {
135 FALSE,
136 FALSE,
137 FALSE,
138 FALSE,
139 FALSE,
140 FALSE,
141 FALSE,
142 FALSE,
143 FALSE,
144 FALSE,
145 TRUE,
146 TRUE,
147 TRUE,
148 TRUE,
149 FALSE,
150 TRUE,
151 FALSE,
152 FALSE,
153 };
154
155 /*
156 * Initialize the server request cache list
157 */
158 void
159 nfsrv_initcache(void)
160 {
161 if (nfsrv_reqcache_size <= 0)
162 return;
163
164 lck_mtx_lock(nfsrv_reqcache_mutex);
165 /* init nfs server request cache hash table */
166 nfsrv_reqcache_hashtbl = hashinit(nfsrv_reqcache_size, M_NFSD, &nfsrv_reqcache_hash);
167 TAILQ_INIT(&nfsrv_reqcache_lruhead);
168 lck_mtx_unlock(nfsrv_reqcache_mutex);
169 }
170
171 /*
172 * This function compares two net addresses by family and returns TRUE
173 * if they are the same host.
174 * If there is any doubt, return FALSE.
175 * The AF_INET family is handled as a special case so that address mbufs
176 * don't need to be saved to store "struct in_addr", which is only 4 bytes.
177 * Ditto for AF_INET6 which is only 16 bytes.
178 */
179 static int
180 netaddr_match(
181 int family,
182 union nethostaddr *haddr,
183 mbuf_t nam)
184 {
185 struct sockaddr_in *inetaddr;
186 struct sockaddr_in6 *inet6addr;
187
188 switch (family) {
189 case AF_INET:
190 inetaddr = mbuf_data(nam);
191 if ((inetaddr->sin_family == AF_INET) &&
192 (inetaddr->sin_addr.s_addr == haddr->had_inetaddr))
193 return (1);
194 break;
195 case AF_INET6:
196 inet6addr = mbuf_data(nam);
197 if ((inet6addr->sin6_family == AF_INET6) &&
198 !bcmp(&inet6addr->sin6_addr, &haddr->had_inet6addr, sizeof(inet6addr->sin6_addr)))
199 return (1);
200 break;
201 }
202 return (0);
203 }
204
205 /*
206 * Look for the request in the cache
207 * If found then
208 * return action and optionally reply
209 * else
210 * insert it in the cache
211 *
212 * The rules are as follows:
213 * - if in progress, return DROP request
214 * - if completed within DELAY of the current time, return DROP it
215 * - if completed a longer time ago return REPLY if the reply was cached or
216 * return DOIT
217 * Update/add new request at end of lru list
218 */
219 int
220 nfsrv_getcache(
221 struct nfsrv_descript *nd,
222 struct nfsrv_sock *slp,
223 mbuf_t *mrepp)
224 {
225 struct nfsrvcache *rp;
226 struct nfsm_chain nmrep;
227 struct sockaddr *saddr;
228 int ret, error;
229
230 /*
231 * Don't cache recent requests for reliable transport protocols.
232 * (Maybe we should for the case of a reconnect, but..)
233 */
234 if (!nd->nd_nam2)
235 return (RC_DOIT);
236 lck_mtx_lock(nfsrv_reqcache_mutex);
237 loop:
238 for (rp = NFSRCHASH(nd->nd_retxid)->lh_first; rp != 0;
239 rp = rp->rc_hash.le_next) {
240 if (nd->nd_retxid == rp->rc_xid && nd->nd_procnum == rp->rc_proc &&
241 netaddr_match(rp->rc_family, &rp->rc_haddr, nd->nd_nam)) {
242 if ((rp->rc_flag & RC_LOCKED) != 0) {
243 rp->rc_flag |= RC_WANTED;
244 msleep(rp, nfsrv_reqcache_mutex, PZERO-1, "nfsrc", NULL);
245 goto loop;
246 }
247 rp->rc_flag |= RC_LOCKED;
248 /* If not at end of LRU chain, move it there */
249 if (rp->rc_lru.tqe_next) {
250 TAILQ_REMOVE(&nfsrv_reqcache_lruhead, rp, rc_lru);
251 TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead, rp, rc_lru);
252 }
253 if (rp->rc_state == RC_UNUSED)
254 panic("nfsrv cache");
255 if (rp->rc_state == RC_INPROG) {
256 OSAddAtomic64(1, &nfsstats.srvcache_inproghits);
257 ret = RC_DROPIT;
258 } else if (rp->rc_flag & RC_REPSTATUS) {
259 OSAddAtomic64(1, &nfsstats.srvcache_nonidemdonehits);
260 nd->nd_repstat = rp->rc_status;
261 error = nfsrv_rephead(nd, slp, &nmrep, 0);
262 if (error) {
263 printf("nfsrv cache: reply alloc failed for nonidem request hit\n");
264 ret = RC_DROPIT;
265 *mrepp = NULL;
266 } else {
267 ret = RC_REPLY;
268 *mrepp = nmrep.nmc_mhead;
269 }
270 } else if (rp->rc_flag & RC_REPMBUF) {
271 OSAddAtomic64(1, &nfsstats.srvcache_nonidemdonehits);
272 error = mbuf_copym(rp->rc_reply, 0, MBUF_COPYALL, MBUF_WAITOK, mrepp);
273 if (error) {
274 printf("nfsrv cache: reply copym failed for nonidem request hit\n");
275 ret = RC_DROPIT;
276 } else {
277 ret = RC_REPLY;
278 }
279 } else {
280 OSAddAtomic64(1, &nfsstats.srvcache_idemdonehits);
281 rp->rc_state = RC_INPROG;
282 ret = RC_DOIT;
283 }
284 rp->rc_flag &= ~RC_LOCKED;
285 if (rp->rc_flag & RC_WANTED) {
286 rp->rc_flag &= ~RC_WANTED;
287 wakeup(rp);
288 }
289 lck_mtx_unlock(nfsrv_reqcache_mutex);
290 return (ret);
291 }
292 }
293 OSAddAtomic64(1, &nfsstats.srvcache_misses);
294 if (nfsrv_reqcache_count < nfsrv_reqcache_size) {
295 /* try to allocate a new entry */
296 MALLOC(rp, struct nfsrvcache *, sizeof *rp, M_NFSD, M_WAITOK);
297 if (rp) {
298 bzero((char *)rp, sizeof *rp);
299 nfsrv_reqcache_count++;
300 rp->rc_flag = RC_LOCKED;
301 }
302 } else {
303 rp = NULL;
304 }
305 if (!rp) {
306 /* try to reuse the least recently used entry */
307 rp = nfsrv_reqcache_lruhead.tqh_first;
308 if (!rp) {
309 /* no entry to reuse? */
310 /* OK, we just won't be able to cache this request */
311 lck_mtx_unlock(nfsrv_reqcache_mutex);
312 return (RC_DOIT);
313 }
314 while ((rp->rc_flag & RC_LOCKED) != 0) {
315 rp->rc_flag |= RC_WANTED;
316 msleep(rp, nfsrv_reqcache_mutex, PZERO-1, "nfsrc", NULL);
317 rp = nfsrv_reqcache_lruhead.tqh_first;
318 }
319 rp->rc_flag |= RC_LOCKED;
320 LIST_REMOVE(rp, rc_hash);
321 TAILQ_REMOVE(&nfsrv_reqcache_lruhead, rp, rc_lru);
322 if (rp->rc_flag & RC_REPMBUF)
323 mbuf_freem(rp->rc_reply);
324 if (rp->rc_flag & RC_NAM)
325 mbuf_freem(rp->rc_nam);
326 rp->rc_flag &= (RC_LOCKED | RC_WANTED);
327 }
328 TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead, rp, rc_lru);
329 rp->rc_state = RC_INPROG;
330 rp->rc_xid = nd->nd_retxid;
331 saddr = mbuf_data(nd->nd_nam);
332 rp->rc_family = saddr->sa_family;
333 switch (saddr->sa_family) {
334 case AF_INET:
335 rp->rc_flag |= RC_INETADDR;
336 rp->rc_inetaddr = ((struct sockaddr_in*)saddr)->sin_addr.s_addr;
337 break;
338 case AF_INET6:
339 rp->rc_flag |= RC_INETADDR;
340 rp->rc_inet6addr = ((struct sockaddr_in6*)saddr)->sin6_addr;
341 break;
342 default:
343 error = mbuf_copym(nd->nd_nam, 0, MBUF_COPYALL, MBUF_WAITOK, &rp->rc_nam);
344 if (error)
345 printf("nfsrv cache: nam copym failed\n");
346 else
347 rp->rc_flag |= RC_NAM;
348 break;
349 };
350 rp->rc_proc = nd->nd_procnum;
351 LIST_INSERT_HEAD(NFSRCHASH(nd->nd_retxid), rp, rc_hash);
352 rp->rc_flag &= ~RC_LOCKED;
353 if (rp->rc_flag & RC_WANTED) {
354 rp->rc_flag &= ~RC_WANTED;
355 wakeup(rp);
356 }
357 lck_mtx_unlock(nfsrv_reqcache_mutex);
358 return (RC_DOIT);
359 }
360
361 /*
362 * Update a request cache entry after the rpc has been done
363 */
364 void
365 nfsrv_updatecache(
366 struct nfsrv_descript *nd,
367 int repvalid,
368 mbuf_t repmbuf)
369 {
370 struct nfsrvcache *rp;
371 int error;
372
373 if (!nd->nd_nam2)
374 return;
375 lck_mtx_lock(nfsrv_reqcache_mutex);
376 loop:
377 for (rp = NFSRCHASH(nd->nd_retxid)->lh_first; rp != 0;
378 rp = rp->rc_hash.le_next) {
379 if (nd->nd_retxid == rp->rc_xid && nd->nd_procnum == rp->rc_proc &&
380 netaddr_match(rp->rc_family, &rp->rc_haddr, nd->nd_nam)) {
381 if ((rp->rc_flag & RC_LOCKED) != 0) {
382 rp->rc_flag |= RC_WANTED;
383 msleep(rp, nfsrv_reqcache_mutex, PZERO-1, "nfsrc", NULL);
384 goto loop;
385 }
386 rp->rc_flag |= RC_LOCKED;
387 if (rp->rc_state == RC_DONE) {
388 /*
389 * This can occur if the cache is too small.
390 * Retransmits of the same request aren't
391 * dropped so we may see the operation
392 * complete more then once.
393 */
394 if (rp->rc_flag & RC_REPMBUF) {
395 mbuf_freem(rp->rc_reply);
396 rp->rc_flag &= ~RC_REPMBUF;
397 }
398 }
399 rp->rc_state = RC_DONE;
400 /*
401 * If we have a valid reply update status and save
402 * the reply for non-idempotent rpc's.
403 */
404 if (repvalid && nonidempotent[nd->nd_procnum]) {
405 if ((nd->nd_vers == NFS_VER2) &&
406 nfsv2_repstat[nfsv2_procid[nd->nd_procnum]]) {
407 rp->rc_status = nd->nd_repstat;
408 rp->rc_flag |= RC_REPSTATUS;
409 } else {
410 error = mbuf_copym(repmbuf, 0, MBUF_COPYALL, MBUF_WAITOK, &rp->rc_reply);
411 if (!error)
412 rp->rc_flag |= RC_REPMBUF;
413 }
414 }
415 rp->rc_flag &= ~RC_LOCKED;
416 if (rp->rc_flag & RC_WANTED) {
417 rp->rc_flag &= ~RC_WANTED;
418 wakeup(rp);
419 }
420 lck_mtx_unlock(nfsrv_reqcache_mutex);
421 return;
422 }
423 }
424 lck_mtx_unlock(nfsrv_reqcache_mutex);
425 }
426
427 /*
428 * Clean out the cache. Called when the last nfsd terminates.
429 */
430 void
431 nfsrv_cleancache(void)
432 {
433 struct nfsrvcache *rp, *nextrp;
434
435 lck_mtx_lock(nfsrv_reqcache_mutex);
436 for (rp = nfsrv_reqcache_lruhead.tqh_first; rp != 0; rp = nextrp) {
437 nextrp = rp->rc_lru.tqe_next;
438 LIST_REMOVE(rp, rc_hash);
439 TAILQ_REMOVE(&nfsrv_reqcache_lruhead, rp, rc_lru);
440 _FREE(rp, M_NFSD);
441 }
442 nfsrv_reqcache_count = 0;
443 FREE(nfsrv_reqcache_hashtbl, M_TEMP);
444 lck_mtx_unlock(nfsrv_reqcache_mutex);
445 }
446
447 #endif /* NFSSERVER */