| 1 | /* |
| 2 | * Copyright (c) 2016 Apple Inc. All rights reserved. |
| 3 | * |
| 4 | * @APPLE_LICENSE_HEADER_START@ |
| 5 | * |
| 6 | * This file contains Original Code and/or Modifications of Original Code |
| 7 | * as defined in and that are subject to the Apple Public Source License |
| 8 | * Version 2.0 (the 'License'). You may not use this file except in |
| 9 | * compliance with the License. Please obtain a copy of the License at |
| 10 | * http://www.opensource.apple.com/apsl/ and read it before using this |
| 11 | * file. |
| 12 | * |
| 13 | * The Original Code and all software distributed under the License are |
| 14 | * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER |
| 15 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, |
| 16 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, |
| 17 | * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. |
| 18 | * Please see the License for the specific language governing rights and |
| 19 | * limitations under the License. |
| 20 | * |
| 21 | * @APPLE_LICENSE_HEADER_END@ |
| 22 | */ |
| 23 | |
| 24 | /*- |
| 25 | * Portions Copyright (c) 1992, 1993 |
| 26 | * The Regents of the University of California. All rights reserved. |
| 27 | * |
| 28 | * This code is derived from software donated to Berkeley by |
| 29 | * Jan-Simon Pendry. |
| 30 | * |
| 31 | * Redistribution and use in source and binary forms, with or without |
| 32 | * modification, are permitted provided that the following conditions |
| 33 | * are met: |
| 34 | * 1. Redistributions of source code must retain the above copyright |
| 35 | * notice, this list of conditions and the following disclaimer. |
| 36 | * 2. Redistributions in binary form must reproduce the above copyright |
| 37 | * notice, this list of conditions and the following disclaimer in the |
| 38 | * documentation and/or other materials provided with the distribution. |
| 39 | * 4. Neither the name of the University nor the names of its contributors |
| 40 | * may be used to endorse or promote products derived from this software |
| 41 | * without specific prior written permission. |
| 42 | * |
| 43 | * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND |
| 44 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| 45 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| 46 | * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE |
| 47 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL |
| 48 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS |
| 49 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) |
| 50 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
| 51 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY |
| 52 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF |
| 53 | * SUCH DAMAGE. |
| 54 | * |
| 55 | * @(#)null_subr.c 8.7 (Berkeley) 5/14/95 |
| 56 | * |
| 57 | * $FreeBSD$ |
| 58 | */ |
| 59 | #include <sys/param.h> |
| 60 | #include <sys/systm.h> |
| 61 | #include <sys/kernel.h> |
| 62 | #include <sys/lock.h> |
| 63 | #include <sys/malloc.h> |
| 64 | #include <sys/mount.h> |
| 65 | #include <sys/proc.h> |
| 66 | #include <sys/vnode.h> |
| 67 | |
| 68 | #include "nullfs.h" |
| 69 | |
| 70 | /* |
| 71 | * Null layer cache: |
| 72 | * Each cache entry holds a reference to the lower vnode |
| 73 | * along with a pointer to the alias vnode. When an |
| 74 | * entry is added the lower vnode is VREF'd. When the |
| 75 | * alias is removed the lower vnode is vrele'd. |
| 76 | */ |
| 77 | |
| 78 | #define NULL_HASH_SIZE (desiredvnodes / 10) |
| 79 | |
| 80 | /* osx doesn't really have the functionality freebsd uses here..gonna try this |
| 81 | * hacked hash...*/ |
| 82 | #define NULL_NHASH(vp) (&null_node_hashtbl[((((uintptr_t)vp) >> vnsz2log) + (uintptr_t)vnode_mount(vp)) & null_hash_mask]) |
| 83 | |
| 84 | static LIST_HEAD(null_node_hashhead, null_node) * null_node_hashtbl; |
| 85 | static lck_mtx_t null_hashmtx; |
| 86 | static lck_attr_t * null_hashlck_attr; |
| 87 | static lck_grp_t * null_hashlck_grp; |
| 88 | static lck_grp_attr_t * null_hashlck_grp_attr; |
| 89 | static u_long null_hash_mask; |
| 90 | |
| 91 | /* os x doesn't have hashes built into vnode. gonna try doing what freebsd does |
| 92 | anyway |
| 93 | Don't want to create a dependency on vnode_internal.h and the real struct |
| 94 | vnode. |
| 95 | 9 is an eyeball of the log 2 size of vnode */ |
| 96 | static int vnsz2log = 9; |
| 97 | |
| 98 | static int null_hashins(struct mount *, struct null_node *, struct vnode **); |
| 99 | |
| 100 | int |
| 101 | nullfs_init_lck(lck_mtx_t * lck) |
| 102 | { |
| 103 | int error = 1; |
| 104 | if (lck && null_hashlck_grp && null_hashlck_attr) { |
| 105 | lck_mtx_init(lck, null_hashlck_grp, null_hashlck_attr); |
| 106 | error = 0; |
| 107 | } |
| 108 | return error; |
| 109 | } |
| 110 | |
| 111 | int |
| 112 | nullfs_destroy_lck(lck_mtx_t * lck) |
| 113 | { |
| 114 | int error = 1; |
| 115 | if (lck && null_hashlck_grp) { |
| 116 | lck_mtx_destroy(lck, null_hashlck_grp); |
| 117 | error = 0; |
| 118 | } |
| 119 | return error; |
| 120 | } |
| 121 | |
| 122 | /* |
| 123 | * Initialise cache headers |
| 124 | */ |
| 125 | int |
| 126 | nullfs_init(__unused struct vfsconf * vfsp) |
| 127 | { |
| 128 | NULLFSDEBUG("%s\n" , __FUNCTION__); |
| 129 | |
| 130 | /* assuming for now that this happens immediately and by default after fs |
| 131 | * installation */ |
| 132 | null_hashlck_grp_attr = lck_grp_attr_alloc_init(); |
| 133 | if (null_hashlck_grp_attr == NULL) { |
| 134 | goto error; |
| 135 | } |
| 136 | null_hashlck_grp = lck_grp_alloc_init("com.apple.filesystems.nullfs" , null_hashlck_grp_attr); |
| 137 | if (null_hashlck_grp == NULL) { |
| 138 | goto error; |
| 139 | } |
| 140 | null_hashlck_attr = lck_attr_alloc_init(); |
| 141 | if (null_hashlck_attr == NULL) { |
| 142 | goto error; |
| 143 | } |
| 144 | |
| 145 | lck_mtx_init(&null_hashmtx, null_hashlck_grp, null_hashlck_attr); |
| 146 | null_node_hashtbl = hashinit(NULL_HASH_SIZE, M_TEMP, &null_hash_mask); |
| 147 | NULLFSDEBUG("%s finished\n" , __FUNCTION__); |
| 148 | return (0); |
| 149 | error: |
| 150 | printf("NULLFS: failed to get lock element\n" ); |
| 151 | if (null_hashlck_grp_attr) { |
| 152 | lck_grp_attr_free(null_hashlck_grp_attr); |
| 153 | null_hashlck_grp_attr = NULL; |
| 154 | } |
| 155 | if (null_hashlck_grp) { |
| 156 | lck_grp_free(null_hashlck_grp); |
| 157 | null_hashlck_grp = NULL; |
| 158 | } |
| 159 | if (null_hashlck_attr) { |
| 160 | lck_attr_free(null_hashlck_attr); |
| 161 | null_hashlck_attr = NULL; |
| 162 | } |
| 163 | return KERN_FAILURE; |
| 164 | } |
| 165 | |
| 166 | int |
| 167 | nullfs_uninit() |
| 168 | { |
| 169 | /* This gets called when the fs is uninstalled, there wasn't an exact |
| 170 | * equivalent in vfsops */ |
| 171 | lck_mtx_destroy(&null_hashmtx, null_hashlck_grp); |
| 172 | FREE(null_node_hashtbl, M_TEMP); |
| 173 | if (null_hashlck_grp_attr) { |
| 174 | lck_grp_attr_free(null_hashlck_grp_attr); |
| 175 | null_hashlck_grp_attr = NULL; |
| 176 | } |
| 177 | if (null_hashlck_grp) { |
| 178 | lck_grp_free(null_hashlck_grp); |
| 179 | null_hashlck_grp = NULL; |
| 180 | } |
| 181 | if (null_hashlck_attr) { |
| 182 | lck_attr_free(null_hashlck_attr); |
| 183 | null_hashlck_attr = NULL; |
| 184 | } |
| 185 | return (0); |
| 186 | } |
| 187 | |
| 188 | /* |
| 189 | * Find the nullfs vnode mapped to lowervp. Return it in *vpp with an iocount if found. |
| 190 | * Return 0 on success. On failure *vpp will be null and a non-zero error code will be returned. |
| 191 | */ |
| 192 | int |
| 193 | null_hashget(struct mount * mp, struct vnode * lowervp, struct vnode ** vpp) |
| 194 | { |
| 195 | struct null_node_hashhead * hd; |
| 196 | struct null_node * a; |
| 197 | struct vnode * vp; |
| 198 | int error = ENOENT; |
| 199 | |
| 200 | /* |
| 201 | * Find hash base, and then search the (two-way) linked |
| 202 | * list looking for a null_node structure which is referencing |
| 203 | * the lower vnode. We only give up our reference at reclaim so |
| 204 | * just check whether the lowervp has gotten pulled from under us |
| 205 | */ |
| 206 | hd = NULL_NHASH(lowervp); |
| 207 | lck_mtx_lock(&null_hashmtx); |
| 208 | LIST_FOREACH(a, hd, null_hash) |
| 209 | { |
| 210 | if (a->null_lowervp == lowervp && vnode_mount(NULLTOV(a)) == mp) { |
| 211 | vp = NULLTOV(a); |
| 212 | if (a->null_lowervid != vnode_vid(lowervp)) { |
| 213 | /*lowervp has reved */ |
| 214 | error = EIO; |
| 215 | } else { |
| 216 | /* if we found something then get an iocount on it */ |
| 217 | error = vnode_getwithvid(vp, a->null_myvid); |
| 218 | if (error == 0) { |
| 219 | *vpp = vp; |
| 220 | } |
| 221 | } |
| 222 | break; |
| 223 | } |
| 224 | } |
| 225 | lck_mtx_unlock(&null_hashmtx); |
| 226 | return error; |
| 227 | } |
| 228 | |
| 229 | /* |
| 230 | * Act like null_hashget, but add passed null_node to hash if no existing |
| 231 | * node found. |
| 232 | */ |
| 233 | static int |
| 234 | null_hashins(struct mount * mp, struct null_node * xp, struct vnode ** vpp) |
| 235 | { |
| 236 | struct null_node_hashhead * hd; |
| 237 | struct null_node * oxp; |
| 238 | struct vnode * ovp; |
| 239 | int error = 0; |
| 240 | |
| 241 | hd = NULL_NHASH(xp->null_lowervp); |
| 242 | lck_mtx_lock(&null_hashmtx); |
| 243 | LIST_FOREACH(oxp, hd, null_hash) |
| 244 | { |
| 245 | if (oxp->null_lowervp == xp->null_lowervp && vnode_mount(NULLTOV(oxp)) == mp) { |
| 246 | /* |
| 247 | * See null_hashget for a description of this |
| 248 | * operation. |
| 249 | */ |
| 250 | ovp = NULLTOV(oxp); |
| 251 | if (oxp->null_lowervid != vnode_vid(oxp->null_lowervp)) { |
| 252 | /*vp doesn't exist so return null (not sure we are actually gonna catch |
| 253 | recycle right now |
| 254 | This is an exceptional case right now, it suggests the vnode we are |
| 255 | trying to add has been recycled |
| 256 | don't add it.*/ |
| 257 | error = EIO; |
| 258 | goto end; |
| 259 | } |
| 260 | /* if we found something in the hash map then grab an iocount */ |
| 261 | error = vnode_getwithvid(ovp, oxp->null_myvid); |
| 262 | if (error == 0) { |
| 263 | *vpp = ovp; |
| 264 | } |
| 265 | goto end; |
| 266 | } |
| 267 | } |
| 268 | /* if it wasn't in the hash map then the vnode pointed to by xp already has a |
| 269 | * iocount so don't bother */ |
| 270 | LIST_INSERT_HEAD(hd, xp, null_hash); |
| 271 | xp->null_flags |= NULL_FLAG_HASHED; |
| 272 | end: |
| 273 | lck_mtx_unlock(&null_hashmtx); |
| 274 | return error; |
| 275 | } |
| 276 | |
| 277 | /* |
| 278 | * Remove node from hash. |
| 279 | */ |
| 280 | void |
| 281 | null_hashrem(struct null_node * xp) |
| 282 | { |
| 283 | lck_mtx_lock(&null_hashmtx); |
| 284 | LIST_REMOVE(xp, null_hash); |
| 285 | lck_mtx_unlock(&null_hashmtx); |
| 286 | } |
| 287 | |
| 288 | static struct null_node * |
| 289 | null_nodecreate(struct vnode * lowervp) |
| 290 | { |
| 291 | struct null_node * xp; |
| 292 | |
| 293 | MALLOC(xp, struct null_node *, sizeof(struct null_node), M_TEMP, M_WAITOK | M_ZERO); |
| 294 | if (xp != NULL) { |
| 295 | if (lowervp) { |
| 296 | xp->null_lowervp = lowervp; |
| 297 | xp->null_lowervid = vnode_vid(lowervp); |
| 298 | } |
| 299 | } |
| 300 | return xp; |
| 301 | } |
| 302 | |
| 303 | /* assumption is that vnode has iocount on it after vnode create */ |
| 304 | int |
| 305 | null_getnewvnode( |
| 306 | struct mount * mp, struct vnode * lowervp, struct vnode * dvp, struct vnode ** vpp, struct componentname * cnp, int root) |
| 307 | { |
| 308 | struct vnode_fsparam vnfs_param; |
| 309 | int error = 0; |
| 310 | enum vtype type = VDIR; |
| 311 | struct null_node * xp = null_nodecreate(lowervp); |
| 312 | |
| 313 | if (xp == NULL) { |
| 314 | return ENOMEM; |
| 315 | } |
| 316 | |
| 317 | if (lowervp) { |
| 318 | type = vnode_vtype(lowervp); |
| 319 | } |
| 320 | |
| 321 | vnfs_param.vnfs_mp = mp; |
| 322 | vnfs_param.vnfs_vtype = type; |
| 323 | vnfs_param.vnfs_str = "nullfs" ; |
| 324 | vnfs_param.vnfs_dvp = dvp; |
| 325 | vnfs_param.vnfs_fsnode = (void *)xp; |
| 326 | vnfs_param.vnfs_vops = nullfs_vnodeop_p; |
| 327 | vnfs_param.vnfs_markroot = root; |
| 328 | vnfs_param.vnfs_marksystem = 0; |
| 329 | vnfs_param.vnfs_rdev = 0; |
| 330 | vnfs_param.vnfs_filesize = 0; // set this to 0 since we should only be shadowing non-regular files |
| 331 | vnfs_param.vnfs_cnp = cnp; |
| 332 | vnfs_param.vnfs_flags = VNFS_ADDFSREF; |
| 333 | |
| 334 | error = vnode_create(VNCREATE_FLAVOR, VCREATESIZE, &vnfs_param, vpp); |
| 335 | if (error == 0) { |
| 336 | xp->null_vnode = *vpp; |
| 337 | xp->null_myvid = vnode_vid(*vpp); |
| 338 | vnode_settag(*vpp, VT_NULL); |
| 339 | } else { |
| 340 | FREE(xp, M_TEMP); |
| 341 | } |
| 342 | return error; |
| 343 | } |
| 344 | |
| 345 | /* |
| 346 | * Make a new or get existing nullfs node. |
| 347 | * Vp is the alias vnode, lowervp is the lower vnode. |
| 348 | * |
| 349 | * lowervp is assumed to have an iocount on it from the caller |
| 350 | */ |
| 351 | int |
| 352 | null_nodeget( |
| 353 | struct mount * mp, struct vnode * lowervp, struct vnode * dvp, struct vnode ** vpp, struct componentname * cnp, int root) |
| 354 | { |
| 355 | struct vnode * vp; |
| 356 | int error; |
| 357 | |
| 358 | /* Lookup the hash firstly. */ |
| 359 | error = null_hashget(mp, lowervp, vpp); |
| 360 | /* ENOENT means it wasn't found, EIO is a failure we should bail from, 0 is it |
| 361 | * was found */ |
| 362 | if (error != ENOENT) { |
| 363 | /* null_hashget checked the vid, so if we got something here its legit to |
| 364 | * the best of our knowledge*/ |
| 365 | /* if we found something then there is an iocount on vpp, |
| 366 | if we didn't find something then vpp shouldn't be used by the caller */ |
| 367 | return error; |
| 368 | } |
| 369 | |
| 370 | /* |
| 371 | * We do not serialize vnode creation, instead we will check for |
| 372 | * duplicates later, when adding new vnode to hash. |
| 373 | */ |
| 374 | error = vnode_ref(lowervp); // take a ref on lowervp so we let the system know we care about it |
| 375 | if(error) |
| 376 | { |
| 377 | // Failed to get a reference on the lower vp so bail. Lowervp may be gone already. |
| 378 | return error; |
| 379 | } |
| 380 | |
| 381 | error = null_getnewvnode(mp, lowervp, dvp, &vp, cnp, root); |
| 382 | |
| 383 | if (error) { |
| 384 | vnode_rele(lowervp); |
| 385 | return (error); |
| 386 | } |
| 387 | |
| 388 | /* |
| 389 | * Atomically insert our new node into the hash or vget existing |
| 390 | * if someone else has beaten us to it. |
| 391 | */ |
| 392 | error = null_hashins(mp, VTONULL(vp), vpp); |
| 393 | if (error || *vpp != NULL) { |
| 394 | /* recycle will call reclaim which will get rid of the internals */ |
| 395 | vnode_recycle(vp); |
| 396 | vnode_put(vp); |
| 397 | /* if we found vpp, then null_hashins put an iocount on it */ |
| 398 | return error; |
| 399 | } |
| 400 | |
| 401 | /* vp has an iocount from null_getnewvnode */ |
| 402 | *vpp = vp; |
| 403 | |
| 404 | return (0); |
| 405 | } |
| 406 | |