| 1 | /* |
| 2 | * Copyright (c) 2000-2010 Apple Inc. All rights reserved. |
| 3 | * |
| 4 | * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ |
| 5 | * |
| 6 | * This file contains Original Code and/or Modifications of Original Code |
| 7 | * as defined in and that are subject to the Apple Public Source License |
| 8 | * Version 2.0 (the 'License'). You may not use this file except in |
| 9 | * compliance with the License. The rights granted to you under the License |
| 10 | * may not be used to create, or enable the creation or redistribution of, |
| 11 | * unlawful or unlicensed copies of an Apple operating system, or to |
| 12 | * circumvent, violate, or enable the circumvention or violation of, any |
| 13 | * terms of an Apple operating system software license agreement. |
| 14 | * |
| 15 | * Please obtain a copy of the License at |
| 16 | * http://www.opensource.apple.com/apsl/ and read it before using this file. |
| 17 | * |
| 18 | * The Original Code and all software distributed under the License are |
| 19 | * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER |
| 20 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, |
| 21 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, |
| 22 | * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. |
| 23 | * Please see the License for the specific language governing rights and |
| 24 | * limitations under the License. |
| 25 | * |
| 26 | * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ |
| 27 | */ |
| 28 | /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */ |
| 29 | /* |
| 30 | * Copyright (c) 1989, 1993 |
| 31 | * The Regents of the University of California. All rights reserved. |
| 32 | * |
| 33 | * This code is derived from software contributed to Berkeley by |
| 34 | * Rick Macklem at The University of Guelph. |
| 35 | * |
| 36 | * Redistribution and use in source and binary forms, with or without |
| 37 | * modification, are permitted provided that the following conditions |
| 38 | * are met: |
| 39 | * 1. Redistributions of source code must retain the above copyright |
| 40 | * notice, this list of conditions and the following disclaimer. |
| 41 | * 2. Redistributions in binary form must reproduce the above copyright |
| 42 | * notice, this list of conditions and the following disclaimer in the |
| 43 | * documentation and/or other materials provided with the distribution. |
| 44 | * 3. All advertising materials mentioning features or use of this software |
| 45 | * must display the following acknowledgement: |
| 46 | * This product includes software developed by the University of |
| 47 | * California, Berkeley and its contributors. |
| 48 | * 4. Neither the name of the University nor the names of its contributors |
| 49 | * may be used to endorse or promote products derived from this software |
| 50 | * without specific prior written permission. |
| 51 | * |
| 52 | * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND |
| 53 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| 54 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| 55 | * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE |
| 56 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL |
| 57 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS |
| 58 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) |
| 59 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
| 60 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY |
| 61 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF |
| 62 | * SUCH DAMAGE. |
| 63 | * |
| 64 | * @(#)nfs_srvcache.c 8.3 (Berkeley) 3/30/95 |
| 65 | * FreeBSD-Id: nfs_srvcache.c,v 1.15 1997/10/12 20:25:46 phk Exp $ |
| 66 | */ |
| 67 | |
| 68 | #if NFSSERVER |
| 69 | /* |
| 70 | * Reference: Chet Juszczak, "Improving the Performance and Correctness |
| 71 | * of an NFS Server", in Proc. Winter 1989 USENIX Conference, |
| 72 | * pages 53-63. San Diego, February 1989. |
| 73 | */ |
| 74 | #include <sys/param.h> |
| 75 | #include <sys/vnode.h> |
| 76 | #include <sys/mount_internal.h> |
| 77 | #include <sys/kernel.h> |
| 78 | #include <sys/systm.h> |
| 79 | #include <sys/proc.h> |
| 80 | #include <sys/kpi_mbuf.h> |
| 81 | #include <sys/malloc.h> |
| 82 | #include <sys/socket.h> |
| 83 | #include <libkern/OSAtomic.h> |
| 84 | |
| 85 | #include <netinet/in.h> |
| 86 | #include <nfs/rpcv2.h> |
| 87 | #include <nfs/nfsproto.h> |
| 88 | #include <nfs/nfs.h> |
| 89 | #include <nfs/nfsrvcache.h> |
| 90 | |
| 91 | extern int nfsv2_procid[NFS_NPROCS]; |
| 92 | static int nfsrv_reqcache_count; |
| 93 | int nfsrv_reqcache_size = NFSRVCACHESIZ; |
| 94 | |
| 95 | #define NFSRCHASH(xid) \ |
| 96 | (&nfsrv_reqcache_hashtbl[((xid) + ((xid) >> 24)) & nfsrv_reqcache_hash]) |
| 97 | LIST_HEAD(nfsrv_reqcache_hash, nfsrvcache) *nfsrv_reqcache_hashtbl; |
| 98 | TAILQ_HEAD(nfsrv_reqcache_lru, nfsrvcache) nfsrv_reqcache_lruhead; |
| 99 | u_long nfsrv_reqcache_hash; |
| 100 | |
| 101 | lck_grp_t *nfsrv_reqcache_lck_grp; |
| 102 | lck_mtx_t *nfsrv_reqcache_mutex; |
| 103 | |
| 104 | /* |
| 105 | * Static array that defines which nfs rpc's are nonidempotent |
| 106 | */ |
| 107 | static int nonidempotent[NFS_NPROCS] = { |
| 108 | FALSE, |
| 109 | FALSE, |
| 110 | TRUE, |
| 111 | FALSE, |
| 112 | FALSE, |
| 113 | FALSE, |
| 114 | FALSE, |
| 115 | TRUE, |
| 116 | TRUE, |
| 117 | TRUE, |
| 118 | TRUE, |
| 119 | TRUE, |
| 120 | TRUE, |
| 121 | TRUE, |
| 122 | TRUE, |
| 123 | TRUE, |
| 124 | FALSE, |
| 125 | FALSE, |
| 126 | FALSE, |
| 127 | FALSE, |
| 128 | FALSE, |
| 129 | FALSE, |
| 130 | FALSE, |
| 131 | }; |
| 132 | |
| 133 | /* True iff the rpc reply is an nfs status ONLY! */ |
| 134 | static int nfsv2_repstat[NFS_NPROCS] = { |
| 135 | FALSE, |
| 136 | FALSE, |
| 137 | FALSE, |
| 138 | FALSE, |
| 139 | FALSE, |
| 140 | FALSE, |
| 141 | FALSE, |
| 142 | FALSE, |
| 143 | FALSE, |
| 144 | FALSE, |
| 145 | TRUE, |
| 146 | TRUE, |
| 147 | TRUE, |
| 148 | TRUE, |
| 149 | FALSE, |
| 150 | TRUE, |
| 151 | FALSE, |
| 152 | FALSE, |
| 153 | }; |
| 154 | |
| 155 | /* |
| 156 | * Initialize the server request cache list |
| 157 | */ |
| 158 | void |
| 159 | nfsrv_initcache(void) |
| 160 | { |
| 161 | if (nfsrv_reqcache_size <= 0) |
| 162 | return; |
| 163 | |
| 164 | lck_mtx_lock(nfsrv_reqcache_mutex); |
| 165 | /* init nfs server request cache hash table */ |
| 166 | nfsrv_reqcache_hashtbl = hashinit(nfsrv_reqcache_size, M_NFSD, &nfsrv_reqcache_hash); |
| 167 | TAILQ_INIT(&nfsrv_reqcache_lruhead); |
| 168 | lck_mtx_unlock(nfsrv_reqcache_mutex); |
| 169 | } |
| 170 | |
| 171 | /* |
| 172 | * This function compares two net addresses by family and returns TRUE |
| 173 | * if they are the same host. |
| 174 | * If there is any doubt, return FALSE. |
| 175 | * The AF_INET family is handled as a special case so that address mbufs |
| 176 | * don't need to be saved to store "struct in_addr", which is only 4 bytes. |
| 177 | * Ditto for AF_INET6 which is only 16 bytes. |
| 178 | */ |
| 179 | static int |
| 180 | netaddr_match( |
| 181 | int family, |
| 182 | union nethostaddr *haddr, |
| 183 | mbuf_t nam) |
| 184 | { |
| 185 | struct sockaddr_in *inetaddr; |
| 186 | struct sockaddr_in6 *inet6addr; |
| 187 | |
| 188 | switch (family) { |
| 189 | case AF_INET: |
| 190 | inetaddr = mbuf_data(nam); |
| 191 | if ((inetaddr->sin_family == AF_INET) && |
| 192 | (inetaddr->sin_addr.s_addr == haddr->had_inetaddr)) |
| 193 | return (1); |
| 194 | break; |
| 195 | case AF_INET6: |
| 196 | inet6addr = mbuf_data(nam); |
| 197 | if ((inet6addr->sin6_family == AF_INET6) && |
| 198 | !bcmp(&inet6addr->sin6_addr, &haddr->had_inet6addr, sizeof(inet6addr->sin6_addr))) |
| 199 | return (1); |
| 200 | break; |
| 201 | } |
| 202 | return (0); |
| 203 | } |
| 204 | |
| 205 | /* |
| 206 | * Look for the request in the cache |
| 207 | * If found then |
| 208 | * return action and optionally reply |
| 209 | * else |
| 210 | * insert it in the cache |
| 211 | * |
| 212 | * The rules are as follows: |
| 213 | * - if in progress, return DROP request |
| 214 | * - if completed within DELAY of the current time, return DROP it |
| 215 | * - if completed a longer time ago return REPLY if the reply was cached or |
| 216 | * return DOIT |
| 217 | * Update/add new request at end of lru list |
| 218 | */ |
| 219 | int |
| 220 | nfsrv_getcache( |
| 221 | struct nfsrv_descript *nd, |
| 222 | struct nfsrv_sock *slp, |
| 223 | mbuf_t *mrepp) |
| 224 | { |
| 225 | struct nfsrvcache *rp; |
| 226 | struct nfsm_chain nmrep; |
| 227 | struct sockaddr *saddr; |
| 228 | int ret, error; |
| 229 | |
| 230 | /* |
| 231 | * Don't cache recent requests for reliable transport protocols. |
| 232 | * (Maybe we should for the case of a reconnect, but..) |
| 233 | */ |
| 234 | if (!nd->nd_nam2) |
| 235 | return (RC_DOIT); |
| 236 | lck_mtx_lock(nfsrv_reqcache_mutex); |
| 237 | loop: |
| 238 | for (rp = NFSRCHASH(nd->nd_retxid)->lh_first; rp != 0; |
| 239 | rp = rp->rc_hash.le_next) { |
| 240 | if (nd->nd_retxid == rp->rc_xid && nd->nd_procnum == rp->rc_proc && |
| 241 | netaddr_match(rp->rc_family, &rp->rc_haddr, nd->nd_nam)) { |
| 242 | if ((rp->rc_flag & RC_LOCKED) != 0) { |
| 243 | rp->rc_flag |= RC_WANTED; |
| 244 | msleep(rp, nfsrv_reqcache_mutex, PZERO-1, "nfsrc" , NULL); |
| 245 | goto loop; |
| 246 | } |
| 247 | rp->rc_flag |= RC_LOCKED; |
| 248 | /* If not at end of LRU chain, move it there */ |
| 249 | if (rp->rc_lru.tqe_next) { |
| 250 | TAILQ_REMOVE(&nfsrv_reqcache_lruhead, rp, rc_lru); |
| 251 | TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead, rp, rc_lru); |
| 252 | } |
| 253 | if (rp->rc_state == RC_UNUSED) |
| 254 | panic("nfsrv cache" ); |
| 255 | if (rp->rc_state == RC_INPROG) { |
| 256 | OSAddAtomic64(1, &nfsstats.srvcache_inproghits); |
| 257 | ret = RC_DROPIT; |
| 258 | } else if (rp->rc_flag & RC_REPSTATUS) { |
| 259 | OSAddAtomic64(1, &nfsstats.srvcache_nonidemdonehits); |
| 260 | nd->nd_repstat = rp->rc_status; |
| 261 | error = nfsrv_rephead(nd, slp, &nmrep, 0); |
| 262 | if (error) { |
| 263 | printf("nfsrv cache: reply alloc failed for nonidem request hit\n" ); |
| 264 | ret = RC_DROPIT; |
| 265 | *mrepp = NULL; |
| 266 | } else { |
| 267 | ret = RC_REPLY; |
| 268 | *mrepp = nmrep.nmc_mhead; |
| 269 | } |
| 270 | } else if (rp->rc_flag & RC_REPMBUF) { |
| 271 | OSAddAtomic64(1, &nfsstats.srvcache_nonidemdonehits); |
| 272 | error = mbuf_copym(rp->rc_reply, 0, MBUF_COPYALL, MBUF_WAITOK, mrepp); |
| 273 | if (error) { |
| 274 | printf("nfsrv cache: reply copym failed for nonidem request hit\n" ); |
| 275 | ret = RC_DROPIT; |
| 276 | } else { |
| 277 | ret = RC_REPLY; |
| 278 | } |
| 279 | } else { |
| 280 | OSAddAtomic64(1, &nfsstats.srvcache_idemdonehits); |
| 281 | rp->rc_state = RC_INPROG; |
| 282 | ret = RC_DOIT; |
| 283 | } |
| 284 | rp->rc_flag &= ~RC_LOCKED; |
| 285 | if (rp->rc_flag & RC_WANTED) { |
| 286 | rp->rc_flag &= ~RC_WANTED; |
| 287 | wakeup(rp); |
| 288 | } |
| 289 | lck_mtx_unlock(nfsrv_reqcache_mutex); |
| 290 | return (ret); |
| 291 | } |
| 292 | } |
| 293 | OSAddAtomic64(1, &nfsstats.srvcache_misses); |
| 294 | if (nfsrv_reqcache_count < nfsrv_reqcache_size) { |
| 295 | /* try to allocate a new entry */ |
| 296 | MALLOC(rp, struct nfsrvcache *, sizeof *rp, M_NFSD, M_WAITOK); |
| 297 | if (rp) { |
| 298 | bzero((char *)rp, sizeof *rp); |
| 299 | nfsrv_reqcache_count++; |
| 300 | rp->rc_flag = RC_LOCKED; |
| 301 | } |
| 302 | } else { |
| 303 | rp = NULL; |
| 304 | } |
| 305 | if (!rp) { |
| 306 | /* try to reuse the least recently used entry */ |
| 307 | rp = nfsrv_reqcache_lruhead.tqh_first; |
| 308 | if (!rp) { |
| 309 | /* no entry to reuse? */ |
| 310 | /* OK, we just won't be able to cache this request */ |
| 311 | lck_mtx_unlock(nfsrv_reqcache_mutex); |
| 312 | return (RC_DOIT); |
| 313 | } |
| 314 | while ((rp->rc_flag & RC_LOCKED) != 0) { |
| 315 | rp->rc_flag |= RC_WANTED; |
| 316 | msleep(rp, nfsrv_reqcache_mutex, PZERO-1, "nfsrc" , NULL); |
| 317 | rp = nfsrv_reqcache_lruhead.tqh_first; |
| 318 | } |
| 319 | rp->rc_flag |= RC_LOCKED; |
| 320 | LIST_REMOVE(rp, rc_hash); |
| 321 | TAILQ_REMOVE(&nfsrv_reqcache_lruhead, rp, rc_lru); |
| 322 | if (rp->rc_flag & RC_REPMBUF) |
| 323 | mbuf_freem(rp->rc_reply); |
| 324 | if (rp->rc_flag & RC_NAM) |
| 325 | mbuf_freem(rp->rc_nam); |
| 326 | rp->rc_flag &= (RC_LOCKED | RC_WANTED); |
| 327 | } |
| 328 | TAILQ_INSERT_TAIL(&nfsrv_reqcache_lruhead, rp, rc_lru); |
| 329 | rp->rc_state = RC_INPROG; |
| 330 | rp->rc_xid = nd->nd_retxid; |
| 331 | saddr = mbuf_data(nd->nd_nam); |
| 332 | rp->rc_family = saddr->sa_family; |
| 333 | switch (saddr->sa_family) { |
| 334 | case AF_INET: |
| 335 | rp->rc_flag |= RC_INETADDR; |
| 336 | rp->rc_inetaddr = ((struct sockaddr_in*)saddr)->sin_addr.s_addr; |
| 337 | break; |
| 338 | case AF_INET6: |
| 339 | rp->rc_flag |= RC_INETADDR; |
| 340 | rp->rc_inet6addr = ((struct sockaddr_in6*)saddr)->sin6_addr; |
| 341 | break; |
| 342 | default: |
| 343 | error = mbuf_copym(nd->nd_nam, 0, MBUF_COPYALL, MBUF_WAITOK, &rp->rc_nam); |
| 344 | if (error) |
| 345 | printf("nfsrv cache: nam copym failed\n" ); |
| 346 | else |
| 347 | rp->rc_flag |= RC_NAM; |
| 348 | break; |
| 349 | }; |
| 350 | rp->rc_proc = nd->nd_procnum; |
| 351 | LIST_INSERT_HEAD(NFSRCHASH(nd->nd_retxid), rp, rc_hash); |
| 352 | rp->rc_flag &= ~RC_LOCKED; |
| 353 | if (rp->rc_flag & RC_WANTED) { |
| 354 | rp->rc_flag &= ~RC_WANTED; |
| 355 | wakeup(rp); |
| 356 | } |
| 357 | lck_mtx_unlock(nfsrv_reqcache_mutex); |
| 358 | return (RC_DOIT); |
| 359 | } |
| 360 | |
| 361 | /* |
| 362 | * Update a request cache entry after the rpc has been done |
| 363 | */ |
| 364 | void |
| 365 | nfsrv_updatecache( |
| 366 | struct nfsrv_descript *nd, |
| 367 | int repvalid, |
| 368 | mbuf_t repmbuf) |
| 369 | { |
| 370 | struct nfsrvcache *rp; |
| 371 | int error; |
| 372 | |
| 373 | if (!nd->nd_nam2) |
| 374 | return; |
| 375 | lck_mtx_lock(nfsrv_reqcache_mutex); |
| 376 | loop: |
| 377 | for (rp = NFSRCHASH(nd->nd_retxid)->lh_first; rp != 0; |
| 378 | rp = rp->rc_hash.le_next) { |
| 379 | if (nd->nd_retxid == rp->rc_xid && nd->nd_procnum == rp->rc_proc && |
| 380 | netaddr_match(rp->rc_family, &rp->rc_haddr, nd->nd_nam)) { |
| 381 | if ((rp->rc_flag & RC_LOCKED) != 0) { |
| 382 | rp->rc_flag |= RC_WANTED; |
| 383 | msleep(rp, nfsrv_reqcache_mutex, PZERO-1, "nfsrc" , NULL); |
| 384 | goto loop; |
| 385 | } |
| 386 | rp->rc_flag |= RC_LOCKED; |
| 387 | if (rp->rc_state == RC_DONE) { |
| 388 | /* |
| 389 | * This can occur if the cache is too small. |
| 390 | * Retransmits of the same request aren't |
| 391 | * dropped so we may see the operation |
| 392 | * complete more then once. |
| 393 | */ |
| 394 | if (rp->rc_flag & RC_REPMBUF) { |
| 395 | mbuf_freem(rp->rc_reply); |
| 396 | rp->rc_flag &= ~RC_REPMBUF; |
| 397 | } |
| 398 | } |
| 399 | rp->rc_state = RC_DONE; |
| 400 | /* |
| 401 | * If we have a valid reply update status and save |
| 402 | * the reply for non-idempotent rpc's. |
| 403 | */ |
| 404 | if (repvalid && nonidempotent[nd->nd_procnum]) { |
| 405 | if ((nd->nd_vers == NFS_VER2) && |
| 406 | nfsv2_repstat[nfsv2_procid[nd->nd_procnum]]) { |
| 407 | rp->rc_status = nd->nd_repstat; |
| 408 | rp->rc_flag |= RC_REPSTATUS; |
| 409 | } else { |
| 410 | error = mbuf_copym(repmbuf, 0, MBUF_COPYALL, MBUF_WAITOK, &rp->rc_reply); |
| 411 | if (!error) |
| 412 | rp->rc_flag |= RC_REPMBUF; |
| 413 | } |
| 414 | } |
| 415 | rp->rc_flag &= ~RC_LOCKED; |
| 416 | if (rp->rc_flag & RC_WANTED) { |
| 417 | rp->rc_flag &= ~RC_WANTED; |
| 418 | wakeup(rp); |
| 419 | } |
| 420 | lck_mtx_unlock(nfsrv_reqcache_mutex); |
| 421 | return; |
| 422 | } |
| 423 | } |
| 424 | lck_mtx_unlock(nfsrv_reqcache_mutex); |
| 425 | } |
| 426 | |
| 427 | /* |
| 428 | * Clean out the cache. Called when the last nfsd terminates. |
| 429 | */ |
| 430 | void |
| 431 | nfsrv_cleancache(void) |
| 432 | { |
| 433 | struct nfsrvcache *rp, *nextrp; |
| 434 | |
| 435 | lck_mtx_lock(nfsrv_reqcache_mutex); |
| 436 | for (rp = nfsrv_reqcache_lruhead.tqh_first; rp != 0; rp = nextrp) { |
| 437 | nextrp = rp->rc_lru.tqe_next; |
| 438 | LIST_REMOVE(rp, rc_hash); |
| 439 | TAILQ_REMOVE(&nfsrv_reqcache_lruhead, rp, rc_lru); |
| 440 | _FREE(rp, M_NFSD); |
| 441 | } |
| 442 | nfsrv_reqcache_count = 0; |
| 443 | FREE(nfsrv_reqcache_hashtbl, M_TEMP); |
| 444 | lck_mtx_unlock(nfsrv_reqcache_mutex); |
| 445 | } |
| 446 | |
| 447 | #endif /* NFSSERVER */ |
| 448 | |