2 * Copyright (c) 1989, 1993
3 * The Regents of the University of California. All rights reserved.
5 * This code is derived from software contributed to Berkeley by
6 * Rick Macklem at The University of Guelph.
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. All advertising materials mentioning features or use of this software
17 * must display the following acknowledgement:
18 * This product includes software developed by the University of
19 * California, Berkeley and its contributors.
20 * 4. Neither the name of the University nor the names of its contributors
21 * may be used to endorse or promote products derived from this software
22 * without specific prior written permission.
24 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
25 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
28 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
29 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
30 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
32 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
33 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
36 * @(#)nfs_srvcache.c 8.3 (Berkeley) 3/30/95
37 * $FreeBSD: src/sys/nfs/nfs_srvcache.c,v 1.21 2000/02/13 03:32:06 peter Exp $
41 * Reference: Chet Juszczak, "Improving the Performance and Correctness
42 * of an NFS Server", in Proc. Winter 1989 USENIX Conference,
43 * pages 53-63. San Diego, February 1989.
45 #include <sys/param.h>
46 #include <sys/malloc.h>
47 #include <sys/mount.h>
48 #include <sys/systm.h>
50 #include <sys/socket.h>
51 #include <sys/socketvar.h> /* for dup_sockaddr */
53 #include <netinet/in.h>
57 #include "nfsrvcache.h"
/*
 * Entry count that nfsrv_getcache() compares against desirednfsrvcache to
 * choose between allocating a new entry and recycling an old one.
 * NOTE(review): the statements that update this counter are not visible
 * in this excerpt.
 */
60 static long numnfsrvcache;
/*
 * Target cache size; computed by nfsrvcache_size_change() and passed to
 * hashinit() as the hash table size.
 */
61 static long desirednfsrvcache;
/*
 * Map a transaction id to the address of its hash bucket: the xid is added
 * to itself shifted right by 24 bits and the sum is masked with nfsrvhash.
 */
63 #define NFSRCHASH(xid) \
64 (&nfsrvhashtbl[((xid) + ((xid) >> 24)) & nfsrvhash])
/* Hash bucket array; assigned from hashinit() in nfsrv_initcache(). */
65 static LIST_HEAD(nfsrvhash, nfsrvcache) *nfsrvhashtbl;
/* LRU queue of cache entries; hits and new entries are placed at the tail. */
66 static TAILQ_HEAD(nfsrvlru, nfsrvcache) nfsrvlruhead;
/* Mask applied by NFSRCHASH(); passed by address to hashinit(). */
67 static u_long nfsrvhash;
/*
 * Address family used when matching a cache entry against a client address:
 * AF_INET when the entry has RC_INETADDR set, AF_ISO otherwise.
 */
72 #define NETFAMILY(rp) \
73 (((rp)->rc_flag & RC_INETADDR) ? AF_INET : AF_ISO)
/*
 * Token acquired by nfsrv_getcache(), nfsrv_updatecache() and
 * nfsrv_cleancache() around their accesses to the cache.
 */
75 struct lwkt_token srvcache_token = LWKT_TOKEN_INITIALIZER(srvcache_token);
78 * Static array that defines which nfs rpc's are nonidempotent
/*
 * Indexed by nd_procnum in nfsrv_updatecache(); a non-zero entry (together
 * with a valid reply) makes that function save the reply status or mbufs.
 * NOTE(review): the initializer entries are not visible in this excerpt.
 */
80 static int nonidempotent[NFS_NPROCS] = {
109 /* True iff the rpc reply is an nfs status ONLY! */
/*
 * Indexed by nfsv2_procid[nd_procnum] in nfsrv_updatecache(), and only
 * consulted when ND_NFSV3 is not set on the request.
 * NOTE(review): the initializer entries are not visible in this excerpt.
 */
110 static int nfsv2_repstat[NFS_NPROCS] = {
132 * Size the NFS server's duplicate request cache at 1/2 the nmbclusters,
133 * within a (64, 2048) range. This is to prevent all mbuf clusters being
134 * tied up in the NFS dupreq cache for small values of nmbclusters.
/*
 * Recompute desirednfsrvcache from nmbclusters.
 *
 * Takes no arguments. The result is nmbclusters / 2, limited to at most
 * NFSRVCACHE_MAX_SIZE and then raised to at least NFSRVCACHE_MIN_SIZE.
 */
137 nfsrvcache_size_change(void)
139 desirednfsrvcache = nmbclusters / 2;
/* Apply the upper bound first, then the lower bound. */
140 desirednfsrvcache = MIN(desirednfsrvcache, NFSRVCACHE_MAX_SIZE);
141 desirednfsrvcache = MAX(desirednfsrvcache, NFSRVCACHE_MIN_SIZE);
145 * Initialize the server request cache list
/*
 * Set up the request cache: compute the desired size, allocate the hash
 * table, and initialize the (empty) LRU queue. Takes no arguments.
 */
148 nfsrv_initcache(void)
/* Establish desirednfsrvcache before it is used to size the hash table. */
150 nfsrvcache_size_change();
/* hashinit() returns the bucket array and stores its mask in nfsrvhash. */
151 nfsrvhashtbl = hashinit(desirednfsrvcache, M_NFSD, &nfsrvhash);
152 TAILQ_INIT(&nfsrvlruhead);
156 * Look for the request in the cache
158 * if found, return action and optionally reply
160 * otherwise insert it in the cache
162 * The rules are as follows:
163 * - if in progress, return DROP request
164 * - if completed within DELAY of the current time, DROP it
165 * - if completed a longer time ago return REPLY if the reply was cached, or else mark it in progress again
167 * Update/add new request at end of lru list
/*
 * Look up the request described by nd in the duplicate request cache and,
 * on a miss, enter it as an in-progress entry.
 *
 * nd   - request descriptor; nd_retxid, nd_procnum and nd_nam identify the
 *        request.
 * slp  - passed through to nfs_rephead() when a cached status is replayed.
 * NOTE(review): the rest of the parameter list, several locals, the else
 * arms, the case labels and the return statements are not visible in this
 * excerpt; a reply is stored through *repp on the cached-mbuf path.
 */
170 nfsrv_getcache(struct nfsrv_descript *nd, struct nfssvc_sock *slp,
173 struct nfsrvcache *rp;
175 struct sockaddr_in *saddr;
180 * Don't cache recent requests for reliable transport protocols.
181 * (Maybe we should for the case of a reconnect, but..)
/* All cache accesses below happen with srvcache_token held. */
186 lwkt_gettoken(&srvcache_token);
/*
 * Walk the hash chain for this xid; an entry matches when xid, procedure
 * number and client address all agree.
 */
188 for (rp = NFSRCHASH(nd->nd_retxid)->lh_first; rp != NULL;
189 rp = rp->rc_hash.le_next) {
190 if (nd->nd_retxid == rp->rc_xid && nd->nd_procnum == rp->rc_proc &&
191 netaddr_match(NETFAMILY(rp), &rp->rc_haddr, nd->nd_nam)) {
192 NFS_DPF(RC, ("H%03x", rp->rc_xid & 0xfff));
/*
 * Entry is locked by someone else: request a wakeup and sleep on it.
 * NOTE(review): what happens after waking is not visible here.
 */
193 if ((rp->rc_flag & RC_LOCKED) != 0) {
194 rp->rc_flag |= RC_WANTED;
195 tsleep((caddr_t)rp, 0, "nfsrc", 0);
198 rp->rc_flag |= RC_LOCKED;
199 /* If not at end of LRU chain, move it there */
200 if (TAILQ_NEXT(rp, rc_lru) != NULL) {
201 TAILQ_REMOVE(&nfsrvlruhead, rp, rc_lru);
202 TAILQ_INSERT_TAIL(&nfsrvlruhead, rp, rc_lru);
/* An entry found on a hash chain must never be in the RC_UNUSED state. */
204 if (rp->rc_state == RC_UNUSED)
205 panic("nfsrv cache");
/* Hit on a request that is still being processed. */
206 if (rp->rc_state == RC_INPROG) {
207 nfsstats.srvcache_inproghits++;
/* Only a status was cached: build a reply header from rc_status. */
209 } else if (rp->rc_flag & RC_REPSTATUS) {
210 nfsstats.srvcache_nonidemdonehits++;
211 nfs_rephead(0, nd, slp, rp->rc_status,
/* A full reply was cached: hand back a copy of the saved mbuf chain. */
214 } else if (rp->rc_flag & RC_REPMBUF) {
215 nfsstats.srvcache_nonidemdonehits++;
216 *repp = m_copym(rp->rc_reply, 0, M_COPYALL,
/*
 * Completed entry with nothing cached: count the hit and put the entry
 * back in progress.
 */
220 nfsstats.srvcache_idemdonehits++;
221 rp->rc_state = RC_INPROG;
/* Unlock the entry and clear any pending RC_WANTED request. */
224 rp->rc_flag &= ~RC_LOCKED;
225 if (rp->rc_flag & RC_WANTED) {
226 rp->rc_flag &= ~RC_WANTED;
229 lwkt_reltoken(&srvcache_token);
/* Miss: obtain an entry, either freshly allocated or recycled. */
234 nfsstats.srvcache_misses++;
235 NFS_DPF(RC, ("M%03x", nd->nd_retxid & 0xfff));
/* Below the desired size: allocate a zeroed entry and mark it locked. */
236 if (numnfsrvcache < desirednfsrvcache) {
237 rp = kmalloc((u_long)sizeof *rp, M_NFSD, M_WAITOK | M_ZERO);
239 rp->rc_flag = RC_LOCKED;
/*
 * Recycle the entry at the head of the LRU queue, waiting while it is
 * locked (presumably the else arm of the size check above - TODO confirm).
 */
241 rp = TAILQ_FIRST(&nfsrvlruhead);
242 while ((rp->rc_flag & RC_LOCKED) != 0) {
243 rp->rc_flag |= RC_WANTED;
244 tsleep((caddr_t)rp, 0, "nfsrc", 0);
245 rp = TAILQ_FIRST(&nfsrvlruhead);
/* Lock it, unhook it from both lists, and release what it still owns. */
247 rp->rc_flag |= RC_LOCKED;
248 LIST_REMOVE(rp, rc_hash);
249 TAILQ_REMOVE(&nfsrvlruhead, rp, rc_lru);
250 if (rp->rc_flag & RC_REPMBUF) {
251 m_freem(rp->rc_reply);
253 rp->rc_flag &= ~RC_REPMBUF;
255 if (rp->rc_flag & RC_NAM) {
256 kfree(rp->rc_nam, M_SONAME);
258 rp->rc_flag &= ~RC_NAM;
/* The entry goes to the tail of the LRU queue. */
261 TAILQ_INSERT_TAIL(&nfsrvlruhead, rp, rc_lru);
/* Fill in the entry's identity from the request and mark it in progress. */
263 rp->rc_state = RC_INPROG;
264 rp->rc_xid = nd->nd_retxid;
/*
 * Record the client address according to its family: either the IPv4
 * address stored inline (RC_INETADDR) or a duplicated sockaddr (RC_NAM).
 * NOTE(review): the case labels selecting each arm are not visible here.
 */
265 saddr = (struct sockaddr_in *)nd->nd_nam;
266 switch (saddr->sin_family) {
268 rp->rc_flag |= RC_INETADDR;
269 rp->rc_inetaddr = saddr->sin_addr.s_addr;
273 rp->rc_flag |= RC_NAM;
274 rp->rc_nam = dup_sockaddr(nd->nd_nam);
277 rp->rc_proc = nd->nd_procnum;
/* Make the entry findable, then unlock it and drop the token. */
278 LIST_INSERT_HEAD(NFSRCHASH(nd->nd_retxid), rp, rc_hash);
279 rp->rc_flag &= ~RC_LOCKED;
280 if (rp->rc_flag & RC_WANTED) {
281 rp->rc_flag &= ~RC_WANTED;
284 lwkt_reltoken(&srvcache_token);
290 * Update a request cache entry after the rpc has been done
/*
 * Record the outcome of a completed rpc in its cache entry.
 *
 * nd       - request descriptor; nd_retxid, nd_procnum and nd_nam locate the
 *            entry, nd_repstat supplies the status to save.
 * repvalid - non-zero when the reply may be saved.
 * repmbuf  - reply mbuf chain that is copied into the entry when a full
 *            reply is saved.
 * NOTE(review): the return type, some locals, else arms and early exits are
 * not visible in this excerpt.
 */
293 nfsrv_updatecache(struct nfsrv_descript *nd, int repvalid, struct mbuf *repmbuf)
295 struct nfsrvcache *rp;
/* All cache accesses below happen with srvcache_token held. */
300 lwkt_gettoken(&srvcache_token);
/* Same match rule as the lookup: xid, procedure number and client address. */
302 for (rp = NFSRCHASH(nd->nd_retxid)->lh_first; rp != NULL;
303 rp = rp->rc_hash.le_next) {
304 if (nd->nd_retxid == rp->rc_xid && nd->nd_procnum == rp->rc_proc &&
305 netaddr_match(NETFAMILY(rp), &rp->rc_haddr, nd->nd_nam)) {
306 NFS_DPF(RC, ("U%03x", rp->rc_xid & 0xfff));
/*
 * Entry is locked by someone else: request a wakeup and sleep on it.
 * NOTE(review): what happens after waking is not visible here.
 */
307 if ((rp->rc_flag & RC_LOCKED) != 0) {
308 rp->rc_flag |= RC_WANTED;
309 tsleep((caddr_t)rp, 0, "nfsrc", 0);
312 rp->rc_flag |= RC_LOCKED;
/* Already marked done: discard the previously saved reply, if any. */
313 if (rp->rc_state == RC_DONE) {
315 * This can occur if the cache is too small.
316 * Retransmits of the same request aren't
317 * dropped so we may see the operation
318 * complete more then once.
320 if (rp->rc_flag & RC_REPMBUF) {
321 m_freem(rp->rc_reply);
323 rp->rc_flag &= ~RC_REPMBUF;
326 rp->rc_state = RC_DONE;
329 * If we have a valid reply update status and save
330 * the reply for non-idempotent rpc's.
332 if (repvalid && nonidempotent[nd->nd_procnum]) {
/* Non-NFSv3 request whose reply is a status only: save just the status. */
333 if ((nd->nd_flag & ND_NFSV3) == 0 &&
334 nfsv2_repstat[nfsv2_procid[nd->nd_procnum]]) {
335 rp->rc_status = nd->nd_repstat;
336 rp->rc_flag |= RC_REPSTATUS;
/*
 * Save a copy of the whole reply, freeing any earlier copy first
 * (presumably the else arm of the status-only test - TODO confirm).
 */
338 if (rp->rc_flag & RC_REPMBUF) {
339 m_freem(rp->rc_reply);
341 rp->rc_flag &= ~RC_REPMBUF;
343 rp->rc_reply = m_copym(repmbuf, 0,
345 rp->rc_flag |= RC_REPMBUF;
/* Unlock the entry and clear any pending RC_WANTED request. */
348 rp->rc_flag &= ~RC_LOCKED;
349 if (rp->rc_flag & RC_WANTED) {
350 rp->rc_flag &= ~RC_WANTED;
356 lwkt_reltoken(&srvcache_token);
/* Debug trace emitted after the token has been released. */
357 NFS_DPF(RC, ("L%03x", nd->nd_retxid & 0xfff));
361 * Clean out the cache. Called when the last nfsd terminates.
/*
 * Tear down the cache: repeatedly take the entry at the head of the LRU
 * queue, unhook it from the hash chain and the queue, and release the
 * reply mbufs and saved address it holds. Takes no arguments.
 * NOTE(review): the return type, the handling after a sleep, and any
 * release of the entry itself are not visible in this excerpt.
 */
364 nfsrv_cleancache(void)
366 struct nfsrvcache *rp;
/* The whole sweep runs with srvcache_token held. */
368 lwkt_gettoken(&srvcache_token);
369 while ((rp = TAILQ_FIRST(&nfsrvlruhead)) != NULL) {
/* Locked entry: request a wakeup and sleep on it. */
370 if (rp->rc_flag & RC_LOCKED) {
371 rp->rc_flag |= RC_WANTED;
372 tsleep((caddr_t)rp, 0, "nfsrc", 0);
/* Remove the entry from both the hash chain and the LRU queue. */
375 LIST_REMOVE(rp, rc_hash);
376 TAILQ_REMOVE(&nfsrvlruhead, rp, rc_lru);
/* Free the cached reply, if one was saved. */
377 if (rp->rc_flag & RC_REPMBUF) {
378 m_freem(rp->rc_reply);
380 rp->rc_flag &= ~RC_REPMBUF;
/* Free the duplicated client sockaddr, if one was saved. */
382 if (rp->rc_flag & RC_NAM) {
383 kfree(rp->rc_nam, M_SONAME);
385 rp->rc_flag &= ~RC_NAM;
390 lwkt_reltoken(&srvcache_token);
393 #endif /* NFS_NOSERVER */